<!--
    Image Captioning settings panel.
    Markup only: every id, class, value and data-* attribute below is a hook that is
    presumably read by the extension's script and stylesheet (not visible here), so
    keep them unchanged when editing.
    NOTE(review): the double-brace PROMPT_DEFAULT / TEMPLATE_DEFAULT placeholders look
    like they are filled in by a template renderer before insertion; confirm with the caller.
-->
<div class="caption_settings">
    <div class="inline-drawer">
        <!-- Drawer header: title plus chevron icon. -->
        <div class="inline-drawer-toggle inline-drawer-header">
            <b data-i18n="Image Captioning">Image Captioning</b>
            <div class="inline-drawer-icon fa-solid fa-circle-chevron-down down"></div>
        </div>
        <div class="inline-drawer-content">
            <!-- Captioning backend selector. -->
            <label for="caption_source" data-i18n="Source">Source</label>
            <select id="caption_source" class="text_pole">
                <option value="local" data-i18n="Local">Local</option>
                <option value="multimodal" data-i18n="Multimodal (OpenAI / Anthropic / llama / Google)">Multimodal (OpenAI / Anthropic / llama / Google)</option>
                <option value="extras" data-i18n="Extras">Extras</option>
                <option value="horde" data-i18n="Horde">Horde</option>
            </select>
            <!-- Options for the "multimodal" source: API, model, reverse proxy. -->
            <div id="caption_multimodal_block" class="flex-container wide100p">
                <div class="flex1 flex-container flexFlowColumn flexNoGap">
                    <label for="caption_multimodal_api" data-i18n="API">API</label>
                    <select id="caption_multimodal_api" class="flex1 text_pole">
                        <option value="zerooneai">01.AI (Yi)</option>
                        <option value="anthropic">Anthropic</option>
                        <option value="custom" data-i18n="Custom (OpenAI-compatible)">Custom (OpenAI-compatible)</option>
                        <option value="google">Google AI Studio</option>
                        <option value="groq">Groq</option>
                        <option value="koboldcpp">KoboldCpp</option>
                        <option value="llamacpp">llama.cpp</option>
                        <option value="mistral">MistralAI</option>
                        <option value="ollama">Ollama</option>
                        <option value="openai">OpenAI</option>
                        <option value="openrouter">OpenRouter</option>
                        <option value="ooba" data-i18n="Text Generation WebUI (oobabooga)">Text Generation WebUI (oobabooga)</option>
                        <option value="vllm">vLLM</option>
                    </select>
                </div>
                <div class="flex1 flex-container flexFlowColumn flexNoGap">
                    <label for="caption_multimodal_model" data-i18n="Model">Model</label>
                    <!--
                        Each option's data-type equals one of the values of #caption_multimodal_api.
                        Presumably the script shows only the options matching the selected API; verify in the extension code.
                    -->
                    <select id="caption_multimodal_model" class="flex1 text_pole">
                        <option data-type="mistral" value="pixtral-latest">pixtral-latest</option>
                        <option data-type="mistral" value="pixtral-12b-2409">pixtral-12b-2409</option>
                        <option data-type="zerooneai" value="yi-vision">yi-vision</option>
                        <option data-type="openai" value="gpt-4-vision-preview">gpt-4-vision-preview</option>
                        <option data-type="openai" value="gpt-4-turbo">gpt-4-turbo</option>
                        <option data-type="openai" value="gpt-4o">gpt-4o</option>
                        <option data-type="openai" value="gpt-4o-mini">gpt-4o-mini</option>
                        <option data-type="openai" value="chatgpt-4o-latest">chatgpt-4o-latest</option>
                        <option data-type="anthropic" value="claude-3-5-sonnet-20240620">claude-3-5-sonnet-20240620</option>
                        <option data-type="anthropic" value="claude-3-opus-20240229">claude-3-opus-20240229</option>
                        <option data-type="anthropic" value="claude-3-sonnet-20240229">claude-3-sonnet-20240229</option>
                        <option data-type="anthropic" value="claude-3-haiku-20240307">claude-3-haiku-20240307</option>
                        <option data-type="google" value="gemini-1.5-flash">gemini-1.5-flash</option>
                        <option data-type="google" value="gemini-1.5-flash-latest">gemini-1.5-flash-latest</option>
                        <option data-type="google" value="gemini-1.5-flash-001">gemini-1.5-flash-001</option>
                        <option data-type="google" value="gemini-1.5-flash-002">gemini-1.5-flash-002</option>
                        <option data-type="google" value="gemini-1.5-flash-exp-0827">gemini-1.5-flash-exp-0827</option>
                        <option data-type="google" value="gemini-1.5-flash-8b-exp-0827">gemini-1.5-flash-8b-exp-0827</option>
                        <option data-type="google" value="gemini-1.5-flash-8b-exp-0924">gemini-1.5-flash-8b-exp-0924</option>
                        <option data-type="google" value="gemini-1.5-pro">gemini-1.5-pro</option>
                        <option data-type="google" value="gemini-1.5-pro-latest">gemini-1.5-pro-latest</option>
                        <option data-type="google" value="gemini-1.5-pro-001">gemini-1.5-pro-001</option>
                        <option data-type="google" value="gemini-1.5-pro-002">gemini-1.5-pro-002</option>
                        <option data-type="google" value="gemini-1.5-pro-exp-0801">gemini-1.5-pro-exp-0801</option>
                        <option data-type="google" value="gemini-1.5-pro-exp-0827">gemini-1.5-pro-exp-0827</option>
                        <option data-type="google" value="gemini-pro-vision">gemini-pro-vision</option>
                        <option data-type="groq" value="llama-3.2-11b-vision-preview">llama-3.2-11b-vision-preview</option>
                        <option data-type="groq" value="llama-3.2-90b-vision-preview">llama-3.2-90b-vision-preview</option>
                        <option data-type="groq" value="llava-v1.5-7b-4096-preview">llava-v1.5-7b-4096-preview</option>
                        <option data-type="openrouter" value="openai/gpt-4-vision-preview">openai/gpt-4-vision-preview</option>
                        <option data-type="openrouter" value="openai/gpt-4o">openai/gpt-4o</option>
                        <option data-type="openrouter" value="openai/gpt-4o-2024-05-13">openai/gpt-4o-2024-05-13</option>
                        <option data-type="openrouter" value="openai/gpt-4o-2024-08-06">openai/gpt-4o-2024-08-06</option>
                        <option data-type="openrouter" value="openai/gpt-4-turbo">openai/gpt-4-turbo</option>
                        <option data-type="openrouter" value="openai/gpt-4o-mini">openai/gpt-4o-mini</option>
                        <option data-type="openrouter" value="openai/gpt-4o-mini-2024-07-18">openai/gpt-4o-mini-2024-07-18</option>
                        <option data-type="openrouter" value="openai/chatgpt-4o-latest">openai/chatgpt-4o-latest</option>
                        <option data-type="openrouter" value="haotian-liu/llava-13b">haotian-liu/llava-13b</option>
                        <option data-type="openrouter" value="fireworks/firellava-13b">fireworks/firellava-13b</option>
                        <option data-type="openrouter" value="anthropic/claude-3.5-sonnet">anthropic/claude-3.5-sonnet</option>
                        <option data-type="openrouter" value="anthropic/claude-3-haiku">anthropic/claude-3-haiku</option>
                        <option data-type="openrouter" value="anthropic/claude-3-sonnet">anthropic/claude-3-sonnet</option>
                        <option data-type="openrouter" value="anthropic/claude-3-opus">anthropic/claude-3-opus</option>
                        <option data-type="openrouter" value="anthropic/claude-3.5-sonnet:beta">anthropic/claude-3.5-sonnet:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-haiku:beta">anthropic/claude-3-haiku:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-sonnet:beta">anthropic/claude-3-sonnet:beta</option>
                        <option data-type="openrouter" value="anthropic/claude-3-opus:beta">anthropic/claude-3-opus:beta</option>
                        <option data-type="openrouter" value="nousresearch/nous-hermes-2-vision-7b">nousresearch/nous-hermes-2-vision-7b</option>
                        <option data-type="openrouter" value="google/gemini-flash-8b-1.5-exp">google/gemini-flash-8b-1.5-exp</option>
                        <option data-type="openrouter" value="google/gemini-flash-1.5">google/gemini-flash-1.5</option>
                        <option data-type="openrouter" value="google/gemini-flash-1.5-exp">google/gemini-flash-1.5-exp</option>
                        <option data-type="openrouter" value="google/gemini-pro-1.5">google/gemini-pro-1.5</option>
                        <option data-type="openrouter" value="google/gemini-pro-1.5-exp">google/gemini-pro-1.5-exp</option>
                        <option data-type="openrouter" value="google/gemini-pro-vision">google/gemini-pro-vision</option>
                        <option data-type="openrouter" value="liuhaotian/llava-yi-34b">liuhaotian/llava-yi-34b</option>
                        <option data-type="ollama" value="ollama_current" data-i18n="currently_selected">[Currently selected]</option>
                        <option data-type="ollama" value="bakllava">bakllava</option>
                        <option data-type="ollama" value="llava">llava</option>
                        <option data-type="ollama" value="llava-llama3">llava-llama3</option>
                        <option data-type="ollama" value="llava-phi3">llava-phi3</option>
                        <option data-type="ollama" value="moondream">moondream</option>
                        <option data-type="llamacpp" value="llamacpp_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="ooba" value="ooba_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="koboldcpp" value="koboldcpp_current" data-i18n="currently_loaded">[Currently loaded]</option>
                        <option data-type="vllm" value="vllm_current" data-i18n="currently_selected">[Currently selected]</option>
                        <option data-type="custom" value="custom_current" data-i18n="currently_selected">[Currently selected]</option>
                    </select>
                </div>
                <!-- Ollama-only notice (tagged data-type="ollama"). -->
                <div data-type="ollama">
                    The model must be downloaded first! Do it with the <code>ollama pull</code> command or <a href="#" id="caption_ollama_pull">click here</a>.
                </div>
                <!-- Reverse proxy toggle, tagged for the APIs listed in data-type. -->
                <label data-type="openai,anthropic,google,mistral" class="checkbox_label flexBasis100p" for="caption_allow_reverse_proxy" title="Allow using reverse proxy if defined and valid.">
                    <input id="caption_allow_reverse_proxy" type="checkbox" class="checkbox">
                    <span data-i18n="Allow reverse proxy">Allow reverse proxy</span>
                </label>
                <div class="flexBasis100p m-b-1">
                    <small><b data-i18n="Hint:">Hint:</b> <span data-i18n="Set your API keys and endpoints in the 'API Connections' tab first.">Set your API keys and endpoints in the 'API Connections' tab first.</span></small>
                </div>
            </div>
            <!-- Caption prompt and the "ask every time" toggle. -->
            <div id="caption_prompt_block">
                <label for="caption_prompt" data-i18n="Caption Prompt">Caption Prompt</label>
                <!-- No whitespace between the textarea tags and the placeholder: it would become part of the field's initial value. -->
                <textarea id="caption_prompt" class="text_pole" rows="1" placeholder="&lt; Use default &gt;">{{PROMPT_DEFAULT}}</textarea>
                <label class="checkbox_label margin-bot-10px" for="caption_prompt_ask" title="Ask for a custom prompt every time an image is captioned.">
                    <input id="caption_prompt_ask" type="checkbox" class="checkbox">
                    <span data-i18n="Ask every time">Ask every time</span>
                </label>
            </div>
            <!--
                The caption macro is shown literally, so its braces are written as character
                references; raw double braces could be consumed by the template renderer
                (assumption: confirm how this file is rendered).
            -->
            <label for="caption_template"><span data-i18n="Message Template">Message Template</span> <small><span data-i18n="(use _space">(use </span> <code>&lcub;&lcub;caption&rcub;&rcub;</code> <span data-i18n="macro)">macro)</span></small></label>
            <textarea id="caption_template" class="text_pole" rows="2" placeholder="&lt; Use default &gt;">{{TEMPLATE_DEFAULT}}</textarea>
            <label class="checkbox_label" for="caption_auto_mode">
                <input id="caption_auto_mode" type="checkbox" class="checkbox">
                <span data-i18n="Automatically caption images">Automatically caption images</span>
                <i class="fa-solid fa-info-circle" title="Automatically caption images when they are pasted into the chat or attached to messages."></i>
            </label>
            <label class="checkbox_label margin-bot-10px" for="caption_refine_mode">
                <input id="caption_refine_mode" type="checkbox" class="checkbox">
                <span data-i18n="Edit captions before saving">Edit captions before saving</span>
            </label>
        </div>
    </div>
</div>