truefoundry · LordGameleo · Mar 19, 2026 · Mar 19, 2026 · cursor · Mar 19, 2026
diff --git a/providers/deepinfra/BAAI/bge-base-en-v1.5.yaml b/providers/deepinfra/BAAI/bge-base-en-v1.5.yaml
@@ -3,6 +3,10 @@ costs:
       region: "*"
 limits:
     max_input_tokens: 512
+    output_vector_size: 768
+modalities:
+    input:
+        - text
 mode: embedding
 model: BAAI/bge-base-en-v1.5
 sources:

diff --git a/providers/deepinfra/BAAI/bge-en-icl.yaml b/providers/deepinfra/BAAI/bge-en-icl.yaml
@@ -1,6 +1,11 @@
 costs:
     - input_cost_per_token: 1.e-8
       region: "*"
+modalities:
+    input:
+        - text
+    output:
+        - text
 mode: embedding
 model: BAAI/bge-en-icl
 sources:

diff --git a/providers/deepinfra/BAAI/bge-large-en-v1.5.yaml b/providers/deepinfra/BAAI/bge-large-en-v1.5.yaml
@@ -3,10 +3,10 @@ costs:
       region: "*"
 limits:
     max_input_tokens: 512
-    max_tokens: 512
+    output_vector_size: 1024
 modalities:
     input:
-        - image
+        - text
 mode: embedding
 model: BAAI/bge-large-en-v1.5
 sources:

diff --git a/providers/deepinfra/BAAI/bge-m3-multi.yaml b/providers/deepinfra/BAAI/bge-m3-multi.yaml
@@ -3,7 +3,12 @@ costs:
       region: "*"
 limits:
     max_input_tokens: 8192
+    output_vector_size: 1024
+modalities:
+    input:
+        - text
 mode: embedding
 model: BAAI/bge-m3-multi
 sources:
     - https://deepinfra.com/BAAI/bge-m3-multi/api
+    - https://huggingface.co/BAAI/bge-m3
diff --git a/providers/deepinfra/BAAI/bge-m3.yaml b/providers/deepinfra/BAAI/bge-m3.yaml
@@ -4,6 +4,9 @@ costs:
 limits:
     max_input_tokens: 8192
     max_tokens: 8192
+modalities:
+    input:
+        - text
 mode: embedding
 model: BAAI/bge-m3
 sources:

diff --git a/providers/deepinfra/Bria/Bria-3.2.yaml b/providers/deepinfra/Bria/Bria-3.2.yaml
@@ -3,6 +3,8 @@ costs:
       region: "*"
 modalities:
     input:
+        - text
+    output:
         - image
 mode: image
 model: Bria/Bria-3.2

diff --git a/providers/deepinfra/Bria/blur_background.yaml b/providers/deepinfra/Bria/blur_background.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Bria/blur_background
 sources:

diff --git a/providers/deepinfra/Bria/enhance.yaml b/providers/deepinfra/Bria/enhance.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Bria/enhance
 sources:

diff --git a/providers/deepinfra/Bria/erase.yaml b/providers/deepinfra/Bria/erase.yaml
@@ -1,6 +1,11 @@
 costs:
     - input_cost_per_image: 0.04
       region: "*"
+modalities:
+    input:
+        - image
+    output:
+        - image
 mode: image
 model: Bria/erase
 sources:

diff --git a/providers/deepinfra/Bria/erase_foreground.yaml b/providers/deepinfra/Bria/erase_foreground.yaml
@@ -1,3 +1,11 @@
+costs:
+    - input_cost_per_image: 0.04
+      region: "*"
+modalities:
+    input:
+        - image
+    output:
+        - image
 mode: image
 model: Bria/erase_foreground
 sources:

diff --git a/providers/deepinfra/Bria/expand.yaml b/providers/deepinfra/Bria/expand.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Bria/expand
 sources:

diff --git a/providers/deepinfra/Bria/fibo.yaml b/providers/deepinfra/Bria/fibo.yaml
@@ -1,5 +1,7 @@
 modalities:
     input:
+        - text
+    output:
         - image
 mode: image
 model: Bria/fibo

diff --git a/providers/deepinfra/Bria/fibo_edit.yaml b/providers/deepinfra/Bria/fibo_edit.yaml
@@ -1,5 +1,8 @@
 modalities:
     input:
+        - text
+        - image
+    output:
         - image
 mode: image
 model: Bria/fibo_edit

diff --git a/providers/deepinfra/Bria/gen_fill.yaml b/providers/deepinfra/Bria/gen_fill.yaml
@@ -1,5 +1,11 @@
+costs:
+    - input_cost_per_image: 0.04
+      region: "*"
 modalities:
     input:
+        - text
+        - image
+    output:
         - image
 mode: image
 model: Bria/gen_fill

diff --git a/providers/deepinfra/Bria/remove_background.yaml b/providers/deepinfra/Bria/remove_background.yaml
@@ -1,6 +1,11 @@
 costs:
     - input_cost_per_image: 0
       region: "*"
+modalities:
+    input:
+        - image
+    output:
+        - image
 mode: image
 model: Bria/remove_background
 sources:

diff --git a/providers/deepinfra/Bria/replace_background.yaml b/providers/deepinfra/Bria/replace_background.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Bria/replace_background
 sources:

diff --git a/providers/deepinfra/ByteDance/Seed-1.8.yaml b/providers/deepinfra/ByteDance/Seed-1.8.yaml
@@ -14,13 +14,18 @@ costs:
               - cost_per_token: 0.000004
                 from: 128000
 features:
+    - function_calling
     - prompt_caching
 limits:
     context_window: 256000
+    max_output_tokens: 256000
     max_tokens: 256000
 modalities:
     input:
+        - text
         - image
+    output:
+        - text
 mode: chat
 model: ByteDance/Seed-1.8
 sources:

diff --git a/providers/deepinfra/ByteDance/Seed-2.0-mini.yaml b/providers/deepinfra/ByteDance/Seed-2.0-mini.yaml
@@ -14,13 +14,17 @@ costs:
               - cost_per_token: 8.e-7
                 from: 128000
 features:
+    - function_calling
     - prompt_caching
+    - structured_output
 limits:
     context_window: 256000
-    max_tokens: 256000
 modalities:
     input:
+        - text
         - image
+    output:
+        - text
 mode: chat
 model: ByteDance/Seed-2.0-mini
 sources:

diff --git a/providers/deepinfra/ByteDance/Seedream-4.5.yaml b/providers/deepinfra/ByteDance/Seedream-4.5.yaml
@@ -3,6 +3,8 @@ costs:
       region: "*"
 modalities:
     input:
+        - text
+    output:
         - image
 mode: image
 model: ByteDance/Seedream-4.5

diff --git a/providers/deepinfra/ClarityAI/creative.yaml b/providers/deepinfra/ClarityAI/creative.yaml
@@ -4,6 +4,9 @@ costs:
 modalities:
     input:
         - image
+        - text
+    output:
+        - image
 mode: image
 model: ClarityAI/creative
 sources:

diff --git a/providers/deepinfra/ClarityAI/crystal.yaml b/providers/deepinfra/ClarityAI/crystal.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: ClarityAI/crystal
 sources:

diff --git a/providers/deepinfra/ClarityAI/flux.yaml b/providers/deepinfra/ClarityAI/flux.yaml
@@ -4,9 +4,10 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: ClarityAI/flux
 sources:
     - https://deepinfra.com/ClarityAI/flux
     - https://deepinfra.com/ClarityAI/flux/api
-    - https://deepinfra.com/flux
diff --git a/providers/deepinfra/MiniMaxAI/MiniMax-M2.1.yaml b/providers/deepinfra/MiniMaxAI/MiniMax-M2.1.yaml
@@ -5,10 +5,12 @@ costs:
       region: "*"
 features:
     - prompt_caching
+    - function_calling
+    - structured_output
 limits:
     context_window: 196608
     max_output_tokens: 131072
-    max_tokens: 196608
+    max_tokens: 131072
 mode: chat
 model: MiniMaxAI/MiniMax-M2.1
 sources:

diff --git a/providers/deepinfra/MiniMaxAI/MiniMax-M2.5.yaml b/providers/deepinfra/MiniMaxAI/MiniMax-M2.5.yaml
@@ -1,14 +1,19 @@
 costs:
-    - cache_read_input_token_cost: 2.99999997e-8
+    - cache_read_input_token_cost: 3.e-8
       input_cost_per_token: 2.7e-7
       output_cost_per_token: 9.5e-7
       region: "*"
 features:
+    - function_calling
     - prompt_caching
+    - structured_output
 limits:
     context_window: 196608
-    max_output_tokens: 131072
-    max_tokens: 196608
+modalities:
+    input:
+        - text
+    output:
+        - text
 mode: chat
 model: MiniMaxAI/MiniMax-M2.5
 sources:

diff --git a/providers/deepinfra/PaddlePaddle/PaddleOCR-VL-0.9B.yaml b/providers/deepinfra/PaddlePaddle/PaddleOCR-VL-0.9B.yaml
@@ -7,10 +7,13 @@ features:
 limits:
     context_window: 16384
     max_output_tokens: 8192
-    max_tokens: 16384
+    max_tokens: 8192
 modalities:
     input:
+        - text
         - image
+    output:
+        - text
 mode: chat
 model: PaddlePaddle/PaddleOCR-VL-0.9B
 sources:

diff --git a/providers/deepinfra/PrunaAI/p-image-Edit.yaml b/providers/deepinfra/PrunaAI/p-image-Edit.yaml
@@ -1,3 +1,12 @@
+costs:
+    - output_cost_per_image: 0.01
+      region: "*"
+modalities:
+    input:
+        - text
+        - image
+    output:
+        - image
 mode: image
 model: PrunaAI/p-image-Edit
 sources:

diff --git a/providers/deepinfra/PrunaAI/p-image.yaml b/providers/deepinfra/PrunaAI/p-image.yaml
@@ -1,5 +1,10 @@
+costs:
+    - output_cost_per_image: 0.005
+      region: "*"
 modalities:
     input:
+        - text
+    output:
         - image
 mode: image
 model: PrunaAI/p-image

diff --git a/providers/deepinfra/Qwen/Qwen-Image-Edit-Max.yaml b/providers/deepinfra/Qwen/Qwen-Image-Edit-Max.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Qwen/Qwen-Image-Edit-Max
 sources:

diff --git a/providers/deepinfra/Qwen/Qwen-Image-Edit.yaml b/providers/deepinfra/Qwen/Qwen-Image-Edit.yaml
@@ -4,6 +4,8 @@ costs:
 modalities:
     input:
         - image
+    output:
+        - image
 mode: image
 model: Qwen/Qwen-Image-Edit
 sources:

diff --git a/providers/deepinfra/Qwen/Qwen-Image-Max.yaml b/providers/deepinfra/Qwen/Qwen-Image-Max.yaml
@@ -3,6 +3,9 @@ costs:
       region: "*"
 modalities:
     input:
+        - text
+        - image
+    output:
         - image
 mode: image
 model: Qwen/Qwen-Image-Max

diff --git a/providers/deepinfra/Qwen/Qwen3-Embedding-0.6B-batch.yaml b/providers/deepinfra/Qwen/Qwen3-Embedding-0.6B-batch.yaml
@@ -4,6 +4,10 @@ costs:
 limits:
     context_window: 32768
     max_input_tokens: 8192
+    output_vector_size: 1024
+modalities:
+    input:
+        - text
 mode: embedding
 model: Qwen/Qwen3-Embedding-0.6B-batch
 sources:

diff --git a/providers/deepinfra/Qwen/Qwen3-Embedding-0.6B.yaml b/providers/deepinfra/Qwen/Qwen3-Embedding-0.6B.yaml
@@ -3,10 +3,12 @@ costs:
       region: "*"
 limits:
     context_window: 32768
+    output_vector_size: 1024
 modalities:
     input:
-        - image
+        - text
 mode: embedding
 model: Qwen/Qwen3-Embedding-0.6B
 sources:
     - https://deepinfra.com/Qwen/Qwen3-Embedding-0.6B/api
+    - https://huggingface.co/Qwen/Qwen3-Embedding-0.6B
diff --git a/providers/deepinfra/Qwen/Qwen3-Embedding-4B-batch.yaml b/providers/deepinfra/Qwen/Qwen3-Embedding-4B-batch.yaml
@@ -3,10 +3,12 @@ costs:
       region: "*"
 limits:
     max_input_tokens: 32768
+    output_vector_size: 2560
 modalities:
     input:
-        - image
+        - text
 mode: embedding
 model: Qwen/Qwen3-Embedding-4B-batch
 sources:
     - https://deepinfra.com/Qwen/Qwen3-Embedding-4B-batch/api
+    - https://huggingface.co/Qwen/Qwen3-Embedding-4B