Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,156 @@ export const ANTHROPIC_CONFIG: ProviderConfig = {
id: 'anthropic',
name: 'Anthropic',
description: 'Claude models focused on safety and helpfulness',
defaultModel: 'claude-sonnet-4-5-20250929',
defaultModel: 'claude-sonnet-4-6',
models: [
{
id: 'claude-opus-4-6',
displayName: 'Claude Opus 4.6',
aliases: ['claude-opus-4-6'],
description:
"Claude Opus 4.6 is Anthropic's most intelligent model, designed for building complex agents, advanced coding workflows, and tasks requiring deep reasoning. It delivers state-of-the-art performance across coding, research, and multi-step agentic tasks.",
lifecycle: 'production',
health: 'healthy',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 128_000,
},
cost: {
inputCostPer1mTokens: 5,
outputCostPer1mTokens: 25,
},
tags: ['recommended', 'reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-sonnet-4-6',
displayName: 'Claude Sonnet 4.6',
aliases: ['claude-sonnet-4-6'],
description:
"Claude Sonnet 4.6 is Anthropic's best combination of speed and intelligence, optimized for a wide range of tasks including coding, analysis, and agentic workflows. It delivers high performance with lower latency compared to Opus models.",
lifecycle: 'production',
health: 'healthy',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 64_000,
},
cost: {
inputCostPer1mTokens: 3,
outputCostPer1mTokens: 15,
},
tags: ['recommended', 'reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-opus-4-5-20251101',
displayName: 'Claude Opus 4.5',
aliases: ['claude-opus-4-5'],
description:
"Claude Opus 4.5 is a highly capable model excelling in complex reasoning, advanced coding, and multi-step agentic tasks. It provides strong performance across a wide range of demanding use cases.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-11-01',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 64_000,
},
cost: {
inputCostPer1mTokens: 5,
outputCostPer1mTokens: 25,
},
tags: ['recommended', 'reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-opus-4-1-20250805',
displayName: 'Claude Opus 4.1',
aliases: ['claude-opus-4-1'],
description:
"Claude Opus 4.1 is a powerful model designed for the most demanding tasks, with strong performance in advanced reasoning, complex coding, and research workflows.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-08-05',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 32_000,
},
cost: {
inputCostPer1mTokens: 15,
outputCostPer1mTokens: 75,
},
tags: ['reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-opus-4-20250514',
displayName: 'Claude Opus 4',
aliases: ['claude-opus-4', 'claude-opus-4-0'],
description:
"Claude Opus 4 is Anthropic's powerful frontier model excelling at complex tasks requiring deep reasoning, advanced coding, and sophisticated analysis.",
lifecycle: 'production',
health: 'healthy',
releaseDate: '2025-05-14',
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: false,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 200_000,
maxOutputTokens: 32_000,
},
cost: {
inputCostPer1mTokens: 15,
outputCostPer1mTokens: 75,
},
tags: ['reasoning', 'agents', 'vision', 'general-purpose', 'coding'],
},
{
id: 'claude-sonnet-4-5-20250929',
displayName: 'Claude Sonnet 4.5',
Expand Down Expand Up @@ -320,9 +468,11 @@ export const ANTHROPIC_CONFIG: ProviderConfig = {
displayName: 'Claude 3 Haiku',
description:
"Claude 3 Haiku is Anthropic's fastest and most compact model for near-instant responsiveness. Quick and accurate targeted performance.",
lifecycle: 'production',
lifecycle: 'deprecated',
health: 'healthy',
releaseDate: '2024-03-07',
deprecationDate: '2026-04-19',
replacementModels: ['claude-haiku-4-5-20251001'],
capabilities: {
supportsText: true,
supportsImages: true,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,64 @@ export const GOOGLE_AI_CONFIG: ProviderConfig = {
description: 'Gemini models from Google with multimodal capabilities',
defaultModel: 'gemini-2.5-flash',
models: [
{
id: 'gemini-3.1-pro',
internalModelId: 'gemini-3.1-pro-preview',
displayName: 'Gemini 3.1 Pro',
description:
"Google's most advanced model with state-of-the-art reasoning, complex problem-solving, and powerful agentic and vibe-coding capabilities built on a foundation of frontier intelligence.",
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 1_048_576,
maxOutputTokens: 65_536,
},
cost: {
inputCostPer1mTokens: 2,
outputCostPer1mTokens: 12,
},
tags: ['recommended', 'reasoning', 'agents', 'general-purpose', 'vision', 'coding'],
releaseDate: '2026-01-01',
lifecycle: 'preview',
},
{
id: 'gemini-3.1-flash-lite',
internalModelId: 'gemini-3.1-flash-lite-preview',
displayName: 'Gemini 3.1 Flash-Lite',
description:
"Google's frontier-class model with a focus on efficiency — delivering frontier-level performance at a fraction of the cost and latency of larger models.",
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: true,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 1_048_576,
maxOutputTokens: 65_536,
},
cost: {
inputCostPer1mTokens: 0.25,
outputCostPer1mTokens: 1.5,
},
tags: ['low-cost', 'general-purpose', 'vision'],
releaseDate: '2026-01-01',
lifecycle: 'preview',
},
{
id: 'gemini-3-pro',
internalModelId: 'gemini-3-pro-preview',
Expand All @@ -31,9 +89,10 @@ export const GOOGLE_AI_CONFIG: ProviderConfig = {
inputCostPer1mTokens: 2,
outputCostPer1mTokens: 12,
},
tags: ['reasoning', 'agents', 'general-purpose', 'vision'],
tags: ['deprecated', 'reasoning', 'agents', 'general-purpose', 'vision'],
releaseDate: '2025-11-18',
lifecycle: 'preview',
lifecycle: 'deprecated',
replacementModels: ['gemini-3.1-pro'],
},
{
id: 'gemini-3-flash',
Expand Down Expand Up @@ -91,6 +150,34 @@ export const GOOGLE_AI_CONFIG: ProviderConfig = {
releaseDate: '2025-01-15',
lifecycle: 'production',
},
{
id: 'gemini-2.5-flash-lite',
displayName: 'Gemini 2.5 Flash-Lite',
description:
"Google's fastest and most budget-friendly multimodal model in the 2.5 family, designed for high-volume, latency-sensitive tasks that require strong performance at minimal cost.",
capabilities: {
supportsText: true,
supportsImages: true,
supportsTools: true,
supportsJsonMode: true,
supportsSystemMessages: true,
supportsStreaming: true,
supportsReasoning: false,
supportsStopSequence: true,
supportsTemperature: true,
},
limits: {
maxInputTokens: 1_048_576,
maxOutputTokens: 65_536,
},
cost: {
inputCostPer1mTokens: 0.1,
outputCostPer1mTokens: 0.4,
},
tags: ['low-cost', 'general-purpose', 'vision'],
releaseDate: '2025-06-01',
lifecycle: 'production',
},
{
id: 'gemini-2.5-pro',
displayName: 'Gemini 2.5 Pro',
Expand Down Expand Up @@ -144,9 +231,10 @@ export const GOOGLE_AI_CONFIG: ProviderConfig = {
inputCostPer1mTokens: 0.1,
outputCostPer1mTokens: 0.4,
},
tags: ['low-cost', 'general-purpose', 'vision'],
tags: ['deprecated', 'low-cost', 'general-purpose', 'vision'],
releaseDate: '2024-12-11',
lifecycle: 'production',
lifecycle: 'deprecated',
replacementModels: ['gemini-2.5-flash'],
},
],
}
20 changes: 10 additions & 10 deletions packages/cognitive/src/features/providers/groq/groq.config.ts
Original file line number Diff line number Diff line change
Expand Up @@ -24,12 +24,12 @@ export const GROQ_CONFIG: ProviderConfig = {
supportsTemperature: true,
},
limits: {
maxInputTokens: 131_000,
maxOutputTokens: 32_000,
maxInputTokens: 131_072,
maxOutputTokens: 65_536,
},
cost: {
inputCostPer1mTokens: 0.1,
outputCostPer1mTokens: 0.5,
inputCostPer1mTokens: 0.075,
outputCostPer1mTokens: 0.3,
},
tags: ['preview', 'general-purpose', 'reasoning', 'low-cost'],
releaseDate: '2024-12-01',
Expand All @@ -53,12 +53,12 @@ export const GROQ_CONFIG: ProviderConfig = {
supportsStopSequence: false,
},
limits: {
maxInputTokens: 131_000,
maxOutputTokens: 32_000,
maxInputTokens: 131_072,
maxOutputTokens: 65_536,
},
cost: {
inputCostPer1mTokens: 0.15,
outputCostPer1mTokens: 0.75,
outputCostPer1mTokens: 0.6,
},
tags: ['preview', 'general-purpose', 'reasoning'],
releaseDate: '2024-12-01',
Expand Down Expand Up @@ -111,7 +111,7 @@ export const GROQ_CONFIG: ProviderConfig = {
supportsTemperature: true,
},
limits: {
maxInputTokens: 128_000,
maxInputTokens: 131_072,
maxOutputTokens: 32_768,
},
cost: {
Expand Down Expand Up @@ -263,8 +263,8 @@ export const GROQ_CONFIG: ProviderConfig = {
supportsTemperature: true,
},
limits: {
maxInputTokens: 128_000,
maxOutputTokens: 8192,
maxInputTokens: 131_072,
maxOutputTokens: 131_072,
},
cost: {
inputCostPer1mTokens: 0.05,
Expand Down
Loading