<!--
    Image Captioning settings panel.
    Collapsible drawer holding: caption source selection, multimodal API/model
    selection, the caption prompt, the message template and the refine-mode toggle.
    Element ids, option values and data-type attributes are hooks for code outside
    this file (not visible here), so keep them stable when editing.
-->
<div class="caption_settings">
    <div class="inline-drawer">
        <div class="inline-drawer-toggle inline-drawer-header">
            <b data-i18n="Image Captioning">Image Captioning</b>
            <div class="inline-drawer-icon fa-solid fa-circle-chevron-down down"></div>
        </div>
        <div class="inline-drawer-content">
            <!-- Captioning backend -->
            <label for="caption_source" data-i18n="Source">Source</label>
            <select id="caption_source" class="text_pole">
                <option value="local" data-i18n="Local">Local</option>
                <option value="multimodal" data-i18n="Multimodal (OpenAI / Anthropic / llama / Google)">Multimodal (OpenAI / Anthropic / llama / Google)</option>
                <option value="extras" data-i18n="Extras">Extras</option>
                <option value="horde" data-i18n="Horde">Horde</option>
            </select>

            <!-- Options for the "multimodal" source -->
            <div id="caption_multimodal_block" class="flex-container wide100p">
                <div class="flex1 flex-container flexFlowColumn flexNoGap">
                    <label for="caption_multimodal_api" data-i18n="API">API</label>
                    <select id="caption_multimodal_api" class="flex1 text_pole">
                        <option value="anthropic">Anthropic</option>
                        <option value="custom" data-i18n="Custom (OpenAI-compatible)">Custom (OpenAI-compatible)</option>
                        <option value="google">Google MakerSuite</option>
                        <option value="koboldcpp">KoboldCpp</option>
                        <option value="llamacpp">llama.cpp</option>
                        <option value="ollama">Ollama</option>
                        <option value="openai">OpenAI</option>
                        <option value="openrouter">OpenRouter</option>
                        <option value="ooba" data-i18n="Text Generation WebUI (oobabooga)">Text Generation WebUI (oobabooga)</option>
                        <option value="vllm">vLLM</option>
                    </select>
                </div>
                <div class="flex1 flex-container flexFlowColumn flexNoGap">
                    <label for="caption_multimodal_model" data-i18n="Model">Model</label>
                    <!--
                        Each option's data-type equals one of the values of #caption_multimodal_api.
                        NOTE(review): presumably used by the extension script to show only the
                        models of the selected API; confirm against the script.
                    -->
                    <select id="caption_multimodal_model" class="flex1 text_pole">
                        <option data-type="openai" value="gpt-4-vision-preview">gpt-4-vision-preview</option>
                        <option data-type="openai" value="gpt-4-turbo">gpt-4-turbo</option>
                        <option data-type="openai" value="gpt-4o">gpt-4o</option>
                        <option data-type="anthropic" value="claude-3-5-sonnet-20240620">claude-3-5-sonnet-20240620</option>
                        <option data-type="anthropic" value="claude-3-opus-20240229">claude-3-opus-20240229</option>
                        <option data-type="anthropic" value="claude-3-sonnet-20240229">claude-3-sonnet-20240229</option>
                        <option data-type="anthropic" value="claude-3-haiku-20240307">claude-3-haiku-20240307</option>
                        <option data-type="google" value="gemini-pro-vision">gemini-pro-vision</option>
                        <option data-type="google" value="gemini-1.5-flash-latest">gemini-1.5-flash-latest</option>
                        <option data-type="openrouter" value="openai/gpt-4-vision-preview">openai/gpt-4-vision-preview</option>
                        <option data-type="openrouter" value="openai/gpt-4o">openai/gpt-4o</option>
                        <option data-type="openrouter" value="openai/gpt-4-turbo">openai/gpt-4-turbo</option>
                        <option data-type="openrouter" value="haotian-liu/llava-13b">haotian-liu/llava-13b</option>
                        <option data-type="openrouter" value="fireworks/firellava-13b">fireworks/firellava-13b</option>
                        <option data-type="openrouter" value="anthropic/claude-3.5-sonnet">anthropic/claude-3.5-sonnet</option>
                        <option data-type="openrouter" value="anthropic/claude-3-haiku">anthropic/claude-3-haiku</option>
                        <option data-type="openrouter" value="anthropic/claude-3-sonnet">anthropic/claude-3-sonnet</option>
                        <option data-type="openrouter" value="anthropic/claude-3-opus">anthropic/claude-3-opus</option>
                        <option data-type="openrouter" value="anthropic/claude-3.5-sonnet:beta">anthropic/claude-3.5-sonnet:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-haiku:beta">anthropic/claude-3-haiku:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-sonnet:beta">anthropic/claude-3-sonnet:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-opus:beta">anthropic/claude-3-opus:beta</option>
                        <option data-type="openrouter" value="nousresearch/nous-hermes-2-vision-7b">nousresearch/nous-hermes-2-vision-7b</option>
                        <option data-type="openrouter" value="google/gemini-pro-vision">google/gemini-pro-vision</option>
                        <option data-type="openrouter" value="google/gemini-flash-1.5">google/gemini-flash-1.5</option>
                        <option data-type="openrouter" value="liuhaotian/llava-yi-34b">liuhaotian/llava-yi-34b</option>
                        <option data-type="ollama" value="ollama_current" data-i18n="currently_selected">[Currently selected]</option>
                        <option data-type="ollama" value="bakllava">bakllava</option>
                        <option data-type="ollama" value="llava">llava</option>
                        <option data-type="ollama" value="llava-llama3">llava-llama3</option>
                        <option data-type="ollama" value="llava-phi3">llava-phi3</option>
                        <option data-type="ollama" value="moondream">moondream</option>
                        <option data-type="llamacpp" value="llamacpp_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="ooba" value="ooba_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="koboldcpp" value="koboldcpp_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="vllm" value="vllm_current" data-i18n="currently_selected">[Currently selected]</option>
                        <option data-type="custom" value="custom_current" data-i18n="currently_selected">[Currently selected]</option>
                    </select>
                </div>
                <!-- Ollama-only note; the link id is a hook for code outside this file. -->
                <div data-type="ollama">
                    The model must be downloaded first! Do it with the <code>ollama pull</code> command or <a href="#" id="caption_ollama_pull">click here</a>.
                </div>
                <label data-type="openai,anthropic,google" class="checkbox_label flexBasis100p" for="caption_allow_reverse_proxy" title="Allow using reverse proxy if defined and valid.">
                    <input id="caption_allow_reverse_proxy" type="checkbox" class="checkbox">
                    <span data-i18n="Allow reverse proxy">Allow reverse proxy</span>
                </label>
                <div class="flexBasis100p m-b-1">
                    <small><b data-i18n="Hint:">Hint:</b> <span data-i18n="Set your API keys and endpoints in the 'API Connections' tab first.">Set your API keys and endpoints in the 'API Connections' tab first.</span></small>
                </div>
            </div>

            <!-- Prompt sent with the image; textarea content is a placeholder filled in by whatever renders this fragment. -->
            <div id="caption_prompt_block">
                <label for="caption_prompt" data-i18n="Caption Prompt">Caption Prompt</label>
                <textarea id="caption_prompt" class="text_pole" rows="1" placeholder="&lt; Use default &gt;">${PROMPT_DEFAULT}</textarea>
                <label class="checkbox_label margin-bot-10px" for="caption_prompt_ask" title="Ask for a custom prompt every time an image is captioned.">
                    <input id="caption_prompt_ask" type="checkbox" class="checkbox">
                    <span data-i18n="Ask every time">Ask every time</span>
                </label>
            </div>

            <!-- The macro name is written with brace entities so it displays literally and is never treated as template syntax. -->
            <label for="caption_template"><span data-i18n="Message Template">Message Template</span> <small><span data-i18n="(use _space">(use </span><code>&lcub;&lcub;caption&rcub;&rcub;</code> <span data-i18n="macro)">macro)</span></small></label>
            <textarea id="caption_template" class="text_pole" rows="2" placeholder="&lt; Use default &gt;">${TEMPLATE_DEFAULT}</textarea>
            <label class="checkbox_label margin-bot-10px" for="caption_refine_mode">
                <input id="caption_refine_mode" type="checkbox" class="checkbox">
                <span data-i18n="Edit captions before saving">Edit captions before saving</span>
            </label>
        </div>
    </div>
</div>