mirror of
https://github.com/discourse/discourse-ai.git
synced 2025-08-01 02:43:26 +00:00
* FIX: make AI helper more robust
  - If JSON is broken for structured output, lean on a more forgiving parser
  - Gemini 2.5 Flash does not support temperature; support opting out
  - Evals for assistant were broken; fix the interface
  - Add some missing LLMs
  - Translator was not mapped correctly to the feature; fix that
  - Don't mix XML in the prompt for the translator
* lint
* correct logic
* simplify code
* implement best-effort JSON parsing directly in the structured output object
122 lines
3.5 KiB
YAML
122 lines
3.5 KiB
YAML
# LLM definitions, keyed by a short identifier. Every entry carries the same
# fields: display_name, name, tokenizer, api_key_env, provider, url,
# max_prompt_tokens and vision_enabled; some entries add provider_params.
# NOTE(review): api_key_env looks like the name of an environment variable
# that holds the credential (no secret is stored in this file) — confirm
# against the code that loads this file.
llms:
  o3:
    display_name: O3
    name: o3
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true
    # presumably suppresses the top_p / temperature request parameters for
    # this model — verify against the provider integration
    provider_params:
      disable_top_p: true
      disable_temperature: true

  gpt-41:
    display_name: GPT-4.1
    name: gpt-4.1
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true

  gpt-4o:
    display_name: GPT-4o
    name: gpt-4o
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true

  gpt-4o-mini:
    display_name: GPT-4o-mini
    name: gpt-4o-mini
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true

  # The only entry in this file with vision_enabled set to false.
  claude-3.5-haiku:
    display_name: Claude 3.5 Haiku
    name: claude-3-5-haiku-latest
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: false

  claude-3.5-sonnet:
    display_name: Claude 3.5 Sonnet
    name: claude-3-5-sonnet-latest
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true

  claude-3.7-sonnet:
    display_name: Claude 3.7 Sonnet
    name: claude-3-7-sonnet-latest
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true

  # Same name and url as claude-3.7-sonnet; differs only in provider_params.
  # NOTE(review): display_name is identical to the claude-3.7-sonnet entry —
  # confirm the two remain distinguishable wherever display_name is shown.
  claude-3.7-sonnet-thinking:
    display_name: Claude 3.7 Sonnet
    name: claude-3-7-sonnet-latest
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true
    provider_params:
      disable_top_p: true
      disable_temperature: true
      enable_reasoning: true
      reasoning_tokens: 1024

  # NOTE(review): for the Gemini entries, name is written with dashes
  # (gemini-2-0-flash) while the url path uses dots (gemini-2.0-flash) —
  # confirm which of the two the provider integration actually sends.
  gemini-2.0-flash:
    display_name: Gemini 2.0 Flash
    name: gemini-2-0-flash
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash
    max_prompt_tokens: 1000000
    vision_enabled: true

  gemini-2.5-flash:
    display_name: Gemini 2.5 Flash
    name: gemini-2-5-flash
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash
    max_prompt_tokens: 1000000
    vision_enabled: true
    # presumably opts this model out of the top_p / temperature request
    # parameters — verify against the provider integration
    provider_params:
      disable_top_p: true
      disable_temperature: true

  gemini-2.0-pro:
    display_name: Gemini 2.0 pro
    name: gemini-2-0-pro
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-pro
    max_prompt_tokens: 1000000
    vision_enabled: true