Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,158 @@ export const ANTHROPIC_CONFIG: ProviderConfig = {
id: 'anthropic',
name: 'Anthropic',
description: 'Claude models focused on safety and helpfulness',
defaultModel: 'claude-sonnet-4-5-20250929',
defaultModel: 'claude-sonnet-4-6',
models: [
// Model entry for Claude Opus 4.6: marked production/healthy, tagged 'recommended'.
{
id: 'claude-opus-4-6',
displayName: 'Claude Opus 4.6',
// NOTE(review): the only alias repeats `id` verbatim, so it adds no extra lookup key — confirm this is intentional.
aliases: ['claude-opus-4-6'],
description:
"Claude Opus 4.6 is Anthropic's most intelligent model, built for the most complex and demanding tasks. It delivers state-of-the-art performance on coding, agentic, and reasoning benchmarks with support for Extended Thinking and Adaptive Thinking modes.",
lifecycle: 'production',
health: 'healthy',
// NOTE(review): first day of the year and identical to the claude-sonnet-4-6 entry — possibly a placeholder; confirm the real release date.
releaseDate: '2026-01-01',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
// JSON mode is the one capability flagged off for this entry.
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 1_000_000,
maxOutputTokens: 128_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 5,
outputCostPer1mTokens: 25,
},
tags: ['recommended', 'reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
// Model entry for Claude Sonnet 4.6: marked production/healthy, tagged 'recommended'.
{
id: 'claude-sonnet-4-6',
displayName: 'Claude Sonnet 4.6',
// NOTE(review): the only alias repeats `id` verbatim, so it adds no extra lookup key — confirm this is intentional.
aliases: ['claude-sonnet-4-6'],
description:
"Claude Sonnet 4.6 is Anthropic's best combination of speed and intelligence, offering frontier coding and agentic performance with a 1M token context window and support for Extended Thinking and Adaptive Thinking modes.",
lifecycle: 'production',
health: 'healthy',
// NOTE(review): first day of the year and identical to the claude-opus-4-6 entry — possibly a placeholder; confirm the real release date.
releaseDate: '2026-01-01',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
// JSON mode is the one capability flagged off for this entry.
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// The 1_000_000 input limit matches the "1M token context window" stated in the description.
limits: {
maxInputTokens: 1_000_000,
maxOutputTokens: 64_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 3,
outputCostPer1mTokens: 15,
},
tags: ['recommended', 'reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
// Model entry for Claude Opus 4.5: marked production/healthy; not tagged 'recommended'.
{
// Dated id; the date suffix (20251101) agrees with releaseDate below.
id: 'claude-opus-4-5-20251101',
displayName: 'Claude Opus 4.5',
// Undated short name listed as an alias for the dated id.
aliases: ['claude-opus-4-5'],
description:
"Claude Opus 4.5 is a highly capable model from Anthropic with strong performance on coding, analysis, and reasoning tasks. Supports Extended Thinking for enhanced problem-solving.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-11-01',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
// JSON mode is the one capability flagged off for this entry.
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 64_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 5,
outputCostPer1mTokens: 25,
},
tags: ['reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
// Model entry for Claude Opus 4.1: marked production/healthy; not tagged 'recommended'.
{
// Dated id; the date suffix (20250805) agrees with releaseDate below.
id: 'claude-opus-4-1-20250805',
displayName: 'Claude Opus 4.1',
// Undated short name listed as an alias for the dated id.
aliases: ['claude-opus-4-1'],
description:
"Claude Opus 4.1 is a powerful model from Anthropic offering strong reasoning and coding capabilities with a 200k context window.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-08-05',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
// JSON mode is the one capability flagged off for this entry.
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// The 200_000 input limit matches the "200k context window" stated in the description.
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 32_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 15,
outputCostPer1mTokens: 75,
},
tags: ['reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
// Model entry for Claude Opus 4: marked production/healthy; not tagged 'recommended'.
{
// Dated id; the date suffix (20250514) agrees with releaseDate below.
id: 'claude-opus-4-20250514',
displayName: 'Claude Opus 4',
// The alias carries an explicit '-0' minor version that the id itself does not.
aliases: ['claude-opus-4-0'],
description:
"Claude Opus 4 is Anthropic's original Claude 4 flagship model, excelling at complex reasoning, coding, and agentic tasks with a 200k context window.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-05-14',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
// JSON mode is the one capability flagged off for this entry.
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// The 200_000 input limit matches the "200k context window" stated in the description.
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 32_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 15,
outputCostPer1mTokens: 75,
},
tags: ['reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-sonnet-4-5-20250929',
displayName: 'Claude Sonnet 4.5',
Expand Down Expand Up @@ -320,7 +470,9 @@ export const ANTHROPIC_CONFIG: ProviderConfig = {
displayName: 'Claude 3 Haiku',
description:
"Claude 3 Haiku is Anthropic's fastest and most compact model for near-instant responsiveness. Quick and accurate targeted performance.",
lifecycle: 'production',
lifecycle: 'deprecated',
deprecationDate: '2026-04-19',
replacementModels: ['claude-haiku-4-5-20251001'],
health: 'healthy',
releaseDate: '2024-03-07',
capabilities: {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,62 @@ export const CEREBRAS_CONFIG: ProviderConfig = {
description: 'Cerebras AI models for high-performance language processing',
defaultModel: 'gpt-oss-120b',
models: [
// Model entry for Qwen3 235B A22B Instruct; preview status is repeated in displayName, tags and lifecycle.
{
id: 'qwen-3-235b-a22b-instruct-2507',
displayName: 'Qwen3 235B A22B Instruct (Preview)',
description:
'Qwen3-235B-A22B is a massive mixture-of-experts model activating 22B parameters, delivering state-of-the-art performance on reasoning, coding, and multilingual tasks at high inference speeds on Cerebras hardware.',
capabilities: {
supportsText: true,
// Text-only: image input is flagged off.
supportsImages: false,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
// NOTE(review): the id names an "instruct" variant yet reasoning is flagged on — confirm against the provider's model documentation.
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 131_072,
maxOutputTokens: 16_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 0.6,
outputCostPer1mTokens: 1.2,
},
tags: ['preview', 'general-purpose', 'reasoning'],
// The id suffix '2507' is consistent with a July 2025 date; the exact day is presumably approximate — confirm.
releaseDate: '2025-07-01',
lifecycle: 'preview',
},
// Model entry for ZAI GLM-4.7; preview status is repeated in displayName, tags and lifecycle.
{
id: 'zai-glm-4.7',
displayName: 'ZAI GLM-4.7 (Preview)',
// NOTE(review): the description advertises "multimodal understanding" but supportsImages below is false — confirm which is correct.
description:
'GLM-4.7 is a high-capability model from Zhipu AI (ZAI) offering strong multilingual and multimodal understanding at high inference speeds on Cerebras hardware.',
capabilities: {
supportsText: true,
supportsImages: false,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: false,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 131_072,
maxOutputTokens: 16_000,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 2.25,
outputCostPer1mTokens: 2.75,
},
tags: ['preview', 'general-purpose'],
// NOTE(review): identical to the releaseDate of the qwen-3-235b-a22b-instruct-2507 entry — possibly copied; confirm the actual date.
releaseDate: '2025-07-01',
lifecycle: 'preview',
},
{
id: 'gpt-oss-120b',
displayName: 'GPT-OSS 120B (Preview)',
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,90 @@ export const FIREWORKS_CONFIG: ProviderConfig = {
description: 'Fireworks AI provides fast inference for various language models',
defaultModel: 'accounts/fireworks/models/llama-v3p1-70b-instruct',
models: [
// Model entry for DeepSeek V3.2: marked production, tagged 'recommended'.
{
// Short id; the fully qualified Fireworks path is carried separately in internalModelId.
id: 'deepseek-v3p2',
internalModelId: 'accounts/fireworks/models/deepseek-v3p2',
displayName: 'DeepSeek V3.2',
description:
'DeepSeek V3.2 is the latest iteration of the DeepSeek V3 series, a 685B-parameter mixture-of-experts model offering improved reasoning, coding, and instruction-following capabilities.',
capabilities: {
supportsText: true,
// Text-only: image input is flagged off.
supportsImages: false,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: false,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 163_840,
maxOutputTokens: 16_384,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
// NOTE(review): limits and cost are identical to the deepseek-v3p1 entry — confirm they were not simply copied.
cost: {
inputCostPer1mTokens: 0.56,
outputCostPer1mTokens: 1.68,
},
tags: ['recommended', 'general-purpose'],
// NOTE(review): no releaseDate is set on this entry — confirm whether the field is optional.
lifecycle: 'production',
},
// Model entry for DeepSeek V3.1: marked production; not tagged 'recommended'.
{
// Short id; the fully qualified Fireworks path is carried separately in internalModelId.
id: 'deepseek-v3p1',
internalModelId: 'accounts/fireworks/models/deepseek-v3p1',
displayName: 'DeepSeek V3.1',
description:
'DeepSeek V3.1 is an updated version of the DeepSeek V3 series, a 685B-parameter mixture-of-experts model with improved performance across coding, math, and general tasks.',
capabilities: {
supportsText: true,
// Text-only: image input is flagged off.
supportsImages: false,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: false,
supportsStopSequence: true,
supportsTemperature: true,
},
// Token ceilings for a single request (input) and a single response (output).
limits: {
maxInputTokens: 163_840,
maxOutputTokens: 16_384,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 0.56,
outputCostPer1mTokens: 1.68,
},
tags: ['general-purpose'],
// NOTE(review): no releaseDate is set on this entry — confirm whether the field is optional.
lifecycle: 'production',
},
// Model entry for Kimi K2 Instruct 0905: marked production; not tagged 'recommended'.
{
// Short id; the fully qualified Fireworks path is carried separately in internalModelId.
id: 'kimi-k2-instruct-0905',
internalModelId: 'accounts/fireworks/models/kimi-k2-instruct-0905',
displayName: 'Kimi K2 Instruct 0905',
description:
'Kimi K2 Instruct 0905 is the latest Moonshot AI Kimi K2 model, a mixture-of-experts model with 262k context window optimized for agentic and coding tasks.',
capabilities: {
supportsText: true,
// Text-only: image input is flagged off.
supportsImages: false,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
// NOTE(review): the id names an "instruct" variant yet reasoning is flagged on (and tagged below) — confirm against the provider's model documentation.
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
// The 262_144 input limit matches the "262k context window" stated in the description.
limits: {
maxInputTokens: 262_144,
maxOutputTokens: 16_384,
},
// Price per one million tokens; the currency is not stated here (presumably USD — confirm).
cost: {
inputCostPer1mTokens: 0.6,
outputCostPer1mTokens: 2.5,
},
tags: ['general-purpose', 'reasoning', 'coding'],
// NOTE(review): no releaseDate is set on this entry — confirm whether the field is optional.
lifecycle: 'production',
},
{
id: 'gpt-oss-20b',
internalModelId: 'accounts/fireworks/models/gpt-oss-20b',
Expand Down
Loading