discourse/plugins/discourse-ai/config/eval-llms.yml
Natalie Tay bcb0949a2f
FEATURE: AI-generated DE queries on /new before creation (#39412)
Redesigns the Data Explorer `/queries/new` page to be AI-first, with a
non-AI fallback if AI is disabled.
 
Instead of the old dual-form layout (manual create + separate AI
generate that redirects to the edit page), the new page lets you
describe what you want, generates the SQL inline, and saves when you're
ready.

Reviewer notes:
- no database record is created until the user clicks "Save query"
- new POST /queries/generate endpoint handles query generation without creating a DB record
- agent rework — related PR: https://github.com/discourse/discourse-ai-evals/pull/16
  - switched to agentic execution mode
  - removed ValidateSql tool (redundant with RunSql)
  - added full Data Explorer parameter type reference
  - evaluator for the DE agent
2026-04-22 13:50:26 +08:00

140 lines
4.2 KiB
YAML
Vendored

# LLM definitions for the discourse-ai eval configuration.
#
# Every key under `llms` is a config name; the mapping beneath it carries:
#   display_name       human-readable label (kept unique per entry so that a
#                      "thinking" variant can be told apart from its base model)
#   name               model identifier string
#   tokenizer          tokenizer class name
#   api_key_env        name of the environment variable for the API key
#                      (presumably read by the eval runner; verify in consumer)
#   provider / url     provider id and the HTTP endpoint for requests
#   max_prompt_tokens  prompt size limit
#   vision_enabled     whether the entry is flagged as accepting images
#   provider_params    optional provider-specific settings
llms:
  # --- OpenAI ---------------------------------------------------------------

  # GPT-5 Nano on the Chat Completions endpoint.
  gpt-5-nano:
    display_name: GPT-5-Nano
    name: gpt-5-nano
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true

  # Same model as gpt-5-nano, but on the Responses endpoint with
  # reasoning_effort set to low.
  gpt-5-nano-thinking:
    display_name: GPT-5-Nano Thinking
    name: gpt-5-nano
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/responses
    max_prompt_tokens: 131072
    vision_enabled: true
    provider_params:
      reasoning_effort: low

  # GPT-5.2 on the Chat Completions endpoint.
  gpt-5.2:
    display_name: GPT-5.2
    name: gpt-5.2
    tokenizer: DiscourseAi::Tokenizer::OpenAiTokenizer
    api_key_env: OPENAI_API_KEY
    provider: open_ai
    url: https://api.openai.com/v1/chat/completions
    max_prompt_tokens: 131072
    vision_enabled: true

  # --- Anthropic ------------------------------------------------------------

  # Claude Haiku 4.5 without reasoning.
  # NOTE(review): vision_enabled is false here but true on
  # claude-4.5-haiku-thinking, which uses the same model name and URL.
  # Confirm whether the difference is intentional.
  claude-4.5-haiku:
    display_name: Claude 4.5 Haiku
    name: claude-haiku-4-5
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: false

  # Claude Haiku 4.5 with reasoning enabled (reasoning_tokens: 1024);
  # top_p and temperature are disabled for this entry.
  claude-4.5-haiku-thinking:
    display_name: Claude 4.5 Haiku Thinking
    name: claude-haiku-4-5
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true
    provider_params:
      disable_top_p: true
      disable_temperature: true
      enable_reasoning: true
      reasoning_tokens: 1024

  # Claude Sonnet 4.6 without reasoning.
  claude-4.6-sonnet:
    display_name: Claude 4.6 Sonnet
    name: claude-sonnet-4-6
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true

  # Claude Sonnet 4.6 with reasoning enabled (reasoning_tokens: 1024);
  # top_p and temperature are disabled for this entry.
  claude-4.6-sonnet-thinking:
    display_name: Claude 4.6 Sonnet Thinking
    name: claude-sonnet-4-6
    tokenizer: DiscourseAi::Tokenizer::AnthropicTokenizer
    api_key_env: ANTHROPIC_API_KEY
    provider: anthropic
    url: https://api.anthropic.com/v1/messages
    max_prompt_tokens: 200000
    vision_enabled: true
    provider_params:
      disable_top_p: true
      disable_temperature: true
      enable_reasoning: true
      reasoning_tokens: 1024

  # --- Google ---------------------------------------------------------------
  # NOTE(review): several Gemini `name` values use hyphens (gemini-2-0-flash)
  # where the model id in `url` uses dots (gemini-2.0-flash). Left as-is;
  # confirm which of the two fields the consumer uses to select the model.

  # Gemini 2.0 Flash.
  gemini-2.0-flash:
    display_name: Gemini 2.0 Flash
    name: gemini-2-0-flash
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash
    max_prompt_tokens: 1000000
    vision_enabled: true

  # Gemini 2.5 Flash; top_p and temperature are disabled for this entry.
  gemini-2.5-flash:
    display_name: Gemini 2.5 Flash
    name: gemini-2-5-flash
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash
    max_prompt_tokens: 1000000
    vision_enabled: true
    provider_params:
      disable_top_p: true
      disable_temperature: true

  # Gemini 3 Flash (preview endpoint) with thinking enabled
  # (thinking_tokens: 1024); top_p and temperature are disabled.
  gemini-3-flash-thinking:
    display_name: Gemini 3.0 Flash Thinking
    name: gemini-3-0-flash
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-3-flash-preview
    max_prompt_tokens: 1000000
    vision_enabled: true
    provider_params:
      disable_top_p: true
      disable_temperature: true
      enable_thinking: true
      thinking_tokens: 1024

  # Gemini 3 Pro (preview endpoint).
  gemini-3-pro:
    display_name: Gemini 3.0 Pro
    name: gemini-3-pro-preview
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-3-pro-preview
    max_prompt_tokens: 1000000
    vision_enabled: true

  # Gemini 3.1 Flash Lite.
  # The url must target the Flash Lite model rather than sharing the
  # gemini-3-flash-preview endpoint used by gemini-3-flash-thinking.
  # NOTE(review): confirm the exact model id against Google's model list.
  gemini-3.1-flash-lite:
    display_name: Gemini 3.1 Flash Lite
    name: gemini-3.1-flash-lite
    tokenizer: DiscourseAi::Tokenizer::GeminiTokenizer
    api_key_env: GEMINI_API_KEY
    provider: google
    url: https://generativelanguage.googleapis.com/v1beta/models/gemini-3.1-flash-lite-preview
    max_prompt_tokens: 1000000
    vision_enabled: true