truefoundry · hganwani-droid · Mar 19, 2026 · cursor · Mar 19, 2026 · cursor
diff --git a/providers/google-gemini/aqa.yaml b/providers/google-gemini/aqa.yaml
@@ -1,5 +1,11 @@
 limits:
     max_input_tokens: 7168
     max_output_tokens: 1024
+    max_tokens: 1024
+modalities:
+    input:
+        - text
+    output:
+        - text
 mode: unknown
 model: aqa
diff --git a/providers/google-gemini/deep-research-pro-preview-12-2025.yaml b/providers/google-gemini/deep-research-pro-preview-12-2025.yaml
@@ -15,15 +15,21 @@ costs:
               - cost_per_token: 0.000018
                 from: 200000
 features:
-    - structured_output
     - system_messages
 limits:
-    max_input_tokens: 131072
+    context_window: 1048576
+    max_input_tokens: 1048576
     max_output_tokens: 65536
+    max_tokens: 65536
 modalities:
     input:
+        - text
         - image
+        - audio
+        - video
         - pdf
+    output:
+        - text
 mode: chat
 model: deep-research-pro-preview-12-2025
 removeParams:

diff --git a/providers/google-gemini/gemini-2.5-flash-native-audio-preview-09-2025.yaml b/providers/google-gemini/gemini-2.5-flash-native-audio-preview-09-2025.yaml
@@ -12,11 +12,15 @@ features:
 limits:
     max_input_tokens: 131072
     max_output_tokens: 8192
+    max_tokens: 8192
 modalities:
     input:
+        - text
         - audio
+        - video
         - image
     output:
+        - text
         - audio
 mode: realtime
 model: gemini-2.5-flash-native-audio-preview-09-2025

diff --git a/providers/google-gemini/gemini-2.5-flash-native-audio-preview-12-2025.yaml b/providers/google-gemini/gemini-2.5-flash-native-audio-preview-12-2025.yaml
@@ -12,11 +12,14 @@ features:
 limits:
     max_input_tokens: 131072
     max_output_tokens: 8192
+    max_tokens: 8192
 modalities:
     input:
+        - text
         - audio
-        - image
+        - video
     output:
+        - text
         - audio
 mode: realtime
 model: gemini-2.5-flash-native-audio-preview-12-2025

diff --git a/providers/google-gemini/gemini-3.1-flash-image-preview.yaml b/providers/google-gemini/gemini-3.1-flash-image-preview.yaml
@@ -6,21 +6,25 @@ costs:
       output_cost_per_token_batches: 0.0000015
       region: "*"
 features:
-    - structured_output
     - system_messages
 limits:
-    max_input_tokens: 65536
-    max_output_tokens: 65536
+    max_input_tokens: 131072
+    max_output_tokens: 32768
+    max_tokens: 32768
 modalities:
     input:
+        - text
         - image
         - pdf
+    output:
+        - text
+        - image
 mode: image
 model: gemini-3.1-flash-image-preview
 params:
     - defaultValue: 256
       key: max_tokens
-      maxValue: 65536
+      maxValue: 32768
       minValue: 1
 removeParams:
     - tool_choice

diff --git a/providers/google-gemini/gemini-3.1-flash-lite-preview.yaml b/providers/google-gemini/gemini-3.1-flash-lite-preview.yaml
@@ -15,14 +15,25 @@ features:
     - prompt_caching
     - structured_output
     - tools
+    - code_execution
 limits:
     max_input_tokens: 1048576
     max_output_tokens: 65536
+    max_tokens: 65536
+messages:
+    options:
+        - system
+        - user
+        - assistant
 modalities:
     input:
-        - audio
+        - text
         - image
+        - audio
+        - video
         - pdf
+    output:
+        - text
 mode: chat
 model: gemini-3.1-flash-lite-preview
 params:

diff --git a/providers/google-gemini/gemini-embedding-2-preview.yaml b/providers/google-gemini/gemini-embedding-2-preview.yaml
@@ -4,17 +4,19 @@ costs:
       input_cost_per_image_token: 4.5e-7
       input_cost_per_second: 0.00016
       input_cost_per_token: 2.e-7
-      input_cost_per_token_batches: 1.e-7
       input_cost_per_video_token: 0.000012
       region: "*"
 limits:
     max_input_tokens: 8192
     max_output_tokens: 1
+    output_vector_size: 3072
 modalities:
     input:
+        - text
         - audio
         - image
         - pdf
+        - video
 mode: embedding
 model: gemini-embedding-2-preview
 removeParams:

diff --git a/providers/google-gemini/gemma-3-12b-it.yaml b/providers/google-gemini/gemma-3-12b-it.yaml
@@ -8,12 +8,19 @@ features:
     - system_messages
     - tool_choice
 limits:
-    max_input_tokens: 32768
+    max_input_tokens: 128000
     max_output_tokens: 8192
+    max_tokens: 8192
 modalities:
     input:
+        - text
         - image
+    output:
+        - text
 mode: chat
 model: gemma-3-12b-it
+params:
+    - key: max_tokens
+      maxValue: 8192
 sources:
     - https://huggingface.co/google/gemma-3-12b-it
diff --git a/providers/google-gemini/gemma-3-1b-it.yaml b/providers/google-gemini/gemma-3-1b-it.yaml
@@ -11,9 +11,20 @@ features:
     - tools
     - structured_output
 limits:
+    context_window: 32768
     max_input_tokens: 32768
     max_output_tokens: 8192
+    max_tokens: 8192
+modalities:
+    input:
+        - text
+    output:
+        - text
 mode: chat
 model: gemma-3-1b-it
+params:
+    - key: max_tokens
+      maxValue: 8192
 sources:
     - https://ai.google.dev/gemma/docs/core
+    - https://ai.google.dev/gemma/docs/core/model_card_3
diff --git a/providers/google-gemini/gemma-3-4b-it.yaml b/providers/google-gemini/gemma-3-4b-it.yaml
@@ -8,11 +8,16 @@ features:
     - system_messages
     - tool_choice
 limits:
-    max_input_tokens: 32768
+    context_window: 128000
+    max_input_tokens: 128000
     max_output_tokens: 8192
+    max_tokens: 8192
 modalities:
     input:
+        - text
         - image
+    output:
+        - text
 mode: chat
 model: gemma-3-4b-it
 params:

diff --git a/providers/google-gemini/gemma-3n-e2b-it.yaml b/providers/google-gemini/gemma-3n-e2b-it.yaml
@@ -9,10 +9,15 @@ features:
 limits:
     max_input_tokens: 8192
     max_output_tokens: 2048
+    max_tokens: 2048
 modalities:
     input:
+        - text
         - audio
         - image
+        - video
+    output:
+        - text
 mode: chat
 model: gemma-3n-e2b-it
 removeParams:

diff --git a/providers/google-gemini/gemma-3n-e4b-it.yaml b/providers/google-gemini/gemma-3n-e4b-it.yaml
@@ -5,15 +5,19 @@ costs:
 features:
     - system_messages
 limits:
-    max_input_tokens: 8192
-    max_output_tokens: 2048
+    context_window: 32000
 modalities:
     input:
+        - text
         - audio
         - image
+        - video
+    output:
+        - text
 mode: chat
 model: gemma-3n-e4b-it
 removeParams:
     - tool_choice
 sources:
     - https://ai.google.dev/gemma/docs/3n
+    - https://ai.google.dev/gemma/docs/gemma-3n/model_card
diff --git a/providers/google-gemini/nano-banana-pro-preview.yaml b/providers/google-gemini/nano-banana-pro-preview.yaml
@@ -8,21 +8,19 @@ costs:
       output_cost_per_token: 0.000012
       output_cost_per_token_batches: 0.000006
       region: "*"
-      tiered_pricing:
-          input:
-              - cost_per_token: 0.000004
-                from: 200000
-          output:
-              - cost_per_token: 0.000018
-                from: 200000
 features:
     - structured_output
     - system_messages
 limits:
-    max_input_tokens: 131072
+    max_input_tokens: 65536
     max_output_tokens: 32768
+    max_tokens: 32768
 modalities:
     input:
+        - text
+        - image
+    output:
+        - text
         - image
 mode: image
 model: nano-banana-pro-preview