Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
17 changes: 16 additions & 1 deletion providers/together-ai/MiniMaxAI/MiniMax-M2.5-FP4.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,17 @@
mode: unknown
costs:
- cache_read_input_token_cost: 6.e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 0.0000012
region: "*"
features:
- function_calling
- structured_output
limits:
context_window: 228700
modalities:
input:
- text
output:
- text
mode: chat
model: MiniMaxAI/MiniMax-M2.5-FP4
7 changes: 6 additions & 1 deletion providers/together-ai/MiniMaxAI/MiniMax-M2.5.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,12 @@ features:
- parallel_function_calling
- structured_output
limits:
context_window: 196608
context_window: 228700
modalities:
input:
- text
output:
- text
mode: chat
model: MiniMaxAI/MiniMax-M2.5
sources:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/QwQ-32B-Preview.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/QwQ-32B-Preview
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/QwQ-32B.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/QwQ-32B
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2-72B-Instruct.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2-72B-Instruct
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2-VL-72B-Instruct.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2-VL-72B-Instruct
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2.5-14B.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2.5-14B
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2.5-72B-Instruct-Turbo.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2.5-72B-Instruct-Turbo
5 changes: 5 additions & 0 deletions providers/together-ai/Qwen/Qwen2.5-7B-Instruct-Turbo.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,11 @@ features:
- structured_output
limits:
context_window: 32768
modalities:
input:
- text
output:
- text
mode: chat
model: Qwen/Qwen2.5-7B-Instruct-Turbo
sources:
Expand Down
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2.5-Coder-32B-Instruct.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2.5-Coder-32B-Instruct
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen2.5-VL-72B-Instruct.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen2.5-VL-72B-Instruct
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,11 @@ features:
- structured_output
limits:
context_window: 262144
modalities:
input:
- text
output:
- text
mode: chat
model: Qwen/Qwen3-235B-A22B-Instruct-2507-tput
sources:
Expand Down
2 changes: 1 addition & 1 deletion providers/together-ai/Qwen/Qwen3-8B-Lora.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,5 +2,5 @@ costs:
- input_cost_per_token: 0
output_cost_per_token: 0
region: "*"
mode: unknown
mode: chat
model: Qwen/Qwen3-8B-Lora
Original file line number Diff line number Diff line change
Expand Up @@ -4,19 +4,20 @@ costs:
region: "*"
features:
- function_calling
- parallel_function_calling
- tool_choice
- structured_output
limits:
context_window: 262144
max_input_tokens: 256000
context_window: 256000
modalities:
input:
- text
output:
- text
mode: chat
model: Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8
sources:
- https://www.together.ai/models/qwen3-coder-480b-a35b-instruct
- https://docs.together.ai/docs/serverless-models
- https://docs.together.ai/docs/function-calling
- https://docs.together.ai/docs/json-mode
- https://docs.together.ai/docs/vision-overview
supportedModes:
- chat
5 changes: 5 additions & 0 deletions providers/together-ai/Qwen/Qwen3-Coder-Next-FP8.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,11 @@ limits:
max_input_tokens: 262144
max_output_tokens: 65536
max_tokens: 65536
modalities:
input:
- text
output:
- text
mode: chat
model: Qwen/Qwen3-Coder-Next-FP8
sources:
Expand Down
7 changes: 5 additions & 2 deletions providers/together-ai/Qwen/Qwen3-Next-80B-A3B-Instruct.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -4,12 +4,15 @@ costs:
region: "*"
features:
- function_calling
- parallel_function_calling
- tool_choice
- structured_output
limits:
context_window: 262144
max_input_tokens: 262144
modalities:
input:
- text
output:
- text
mode: chat
model: Qwen/Qwen3-Next-80B-A3B-Instruct
sources:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen3-Next-80B-A3B-Thinking
1 change: 1 addition & 0 deletions providers/together-ai/Qwen/Qwen3-VL-32B-Instruct.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: Qwen/Qwen3-VL-32B-Instruct
6 changes: 6 additions & 0 deletions providers/together-ai/Qwen/Qwen3.5-35B-A3B.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,18 @@ features:
- structured_output
limits:
context_window: 262144
max_output_tokens: 81920
max_tokens: 81920
modalities:
input:
- text
- image
output:
- text
mode: chat
model: Qwen/Qwen3.5-35B-A3B
sources:
- https://together.ai/pricing
- https://docs.together.ai/docs/serverless-models
- https://huggingface.co/Qwen/Qwen3.5-35B-A3B
thinking: true
6 changes: 3 additions & 3 deletions providers/together-ai/Qwen/Qwen3.5-397B-A17B.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,16 +8,16 @@ features:
limits:
context_window: 262144
max_input_tokens: 262144
max_output_tokens: 262144
max_tokens: 262144
modalities:
input:
- text
- image
output:
- text
mode: chat
model: Qwen/Qwen3.5-397B-A17B
sources:
- https://www.together.ai/models/qwen3-5-397b-a17b
- https://docs.together.ai/docs/serverless-models
- https://www.together.ai/pricing
supportedModes:
- chat
4 changes: 0 additions & 4 deletions providers/together-ai/Qwen/Qwen3.5-9B-FP8.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,8 @@ features:
- structured_output
limits:
context_window: 262144
modalities:
input:
- image
mode: chat
model: Qwen/Qwen3.5-9B-FP8
sources:
- https://together.ai/models
- https://docs.together.ai/docs/serverless-models
thinking: true
12 changes: 11 additions & 1 deletion providers/together-ai/deepseek-ai/DeepSeek-OCR-2.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,12 @@
mode: unknown
features:
- system_messages
modalities:
input:
- text
- image
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-OCR-2
sources:
- https://huggingface.co/deepseek-ai/DeepSeek-OCR-2
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
isDeprecated: true
limits:
context_window: 131072
mode: unknown
Expand Down
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
8 changes: 7 additions & 1 deletion providers/together-ai/deepseek-ai/DeepSeek-R1-Original.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,8 @@
mode: unknown
modalities:
input:
- text
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-R1-Original
thinking: true
7 changes: 6 additions & 1 deletion providers/together-ai/deepseek-ai/DeepSeek-R1.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,14 @@ features:
- structured_output
- system_messages
limits:
context_window: 163840
context_window: 163839
max_output_tokens: 64000
max_tokens: 64000
modalities:
input:
- text
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-R1
sources:
Expand Down
11 changes: 8 additions & 3 deletions providers/together-ai/deepseek-ai/DeepSeek-V3-0324.yaml
Original file line number Diff line number Diff line change
@@ -1,13 +1,18 @@
costs:
- input_cost_per_token: 0.00000125
output_cost_per_token: 0.00000125
- input_cost_per_token: 6.e-7
output_cost_per_token: 0.0000017
region: "*"
features:
- function_calling
- parallel_function_calling
- structured_output
limits:
context_window: 131000
context_window: 128000
modalities:
input:
- text
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-V3-0324
sources:
Expand Down
5 changes: 5 additions & 0 deletions providers/together-ai/deepseek-ai/DeepSeek-V3.1.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,11 @@ features:
- structured_output
limits:
context_window: 131072
modalities:
input:
- text
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-V3.1
sources:
Expand Down
7 changes: 7 additions & 0 deletions providers/together-ai/deepseek-ai/DeepSeek-V3.yaml
Original file line number Diff line number Diff line change
@@ -1,13 +1,20 @@
costs:
- input_cost_per_token: 6.e-7
input_cost_per_token_batches: 2.e-7
output_cost_per_token: 0.0000017
output_cost_per_token_batches: 6.e-7
region: "*"
features:
- function_calling
- tool_choice
- structured_output
limits:
context_window: 128000
modalities:
input:
- text
output:
- text
mode: chat
model: deepseek-ai/DeepSeek-V3
sources:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: deepseek-ai/deepseek-coder-33b-instruct
1 change: 0 additions & 1 deletion providers/together-ai/essentialai/rnj-1-instruct.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,6 @@ features:
- structured_output
limits:
context_window: 32768
max_tokens: 32768
mode: chat
model: essentialai/rnj-1-instruct
sources:
Expand Down
3 changes: 3 additions & 0 deletions providers/together-ai/google/flash-image-2.5.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,9 @@ costs:
region: "*"
modalities:
input:
- text
- image
output:
- image
mode: image
model: google/flash-image-2.5
Expand Down
1 change: 1 addition & 0 deletions providers/together-ai/google/gemma-2-27b-it.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: google/gemma-2-27b-it
3 changes: 3 additions & 0 deletions providers/together-ai/google/gemma-3n-E4B-it.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,10 @@ limits:
max_input_tokens: 32768
modalities:
input:
- text
- image
output:
- text
mode: chat
model: google/gemma-3n-E4B-it
sources:
Expand Down
2 changes: 2 additions & 0 deletions providers/together-ai/google/imagen-4.0-fast.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,8 @@ costs:
region: "*"
modalities:
input:
- text
output:
- image
mode: image
model: google/imagen-4.0-fast
Expand Down
4 changes: 1 addition & 3 deletions providers/together-ai/google/imagen-4.0-preview.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,11 +2,9 @@ costs:
- output_cost_per_image: 0.04
region: "*"
modalities:
input:
output:
- image
mode: image
model: google/imagen-4.0-preview
sources:
- https://docs.together.ai/docs/serverless-models
supportedModes:
- image
2 changes: 2 additions & 0 deletions providers/together-ai/google/imagen-4.0-ultra.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,8 @@ costs:
modalities:
input:
- image
output:
- image
mode: image
model: google/imagen-4.0-ultra
sources:
Expand Down
1 change: 1 addition & 0 deletions providers/together-ai/meta-llama/Llama-2-13b-chat-hf.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: meta-llama/Llama-2-13b-chat-hf
1 change: 1 addition & 0 deletions providers/together-ai/meta-llama/Llama-2-7b-chat-hf.yaml
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
isDeprecated: true
mode: unknown
model: meta-llama/Llama-2-7b-chat-hf
Loading
Loading