Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions providers/xai/grok-2-image-1212.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,5 +8,6 @@ costs:
- input_cost_per_token: 0
output_cost_per_image: 0.07
region: "*"
isDeprecated: true
mode: image
model: grok-2-image-1212
1 change: 1 addition & 0 deletions providers/xai/grok-2-image-latest.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,5 +8,6 @@ costs:
- input_cost_per_token: 0
output_cost_per_image: 0.07
region: "*"
isDeprecated: true
mode: image
model: grok-2-image-latest
1 change: 1 addition & 0 deletions providers/xai/grok-2-image.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,5 +8,6 @@ costs:
- input_cost_per_token: 0
output_cost_per_image: 0.07
region: "*"
isDeprecated: true
mode: image
model: grok-2-image
20 changes: 7 additions & 13 deletions providers/xai/grok-2-vision-1212.yaml
Original file line number Diff line number Diff line change
@@ -1,29 +1,23 @@
costs:
- input_cost_per_image: 0.000002
input_cost_per_token: 0.000002
output_cost_per_token: 0.00001
region: us-east-1
- input_cost_per_image: 0.000002
input_cost_per_token: 0.000002
output_cost_per_token: 0.00001
region: eu-west-1
- cache_read_input_token_cost: 0
input_cost_per_image: 0.000002
input_cost_per_query: 0
input_cost_per_token: 0.000002
- input_cost_per_token: 0.000002
output_cost_per_token: 0.00001
region: "*"
features:
- function_calling
- vision
- image_input
- chat
- image
- tool_choice
- response_schema
limits:
context_window: 32768
max_input_tokens: 32768
max_output_tokens: 32768
mode: chat
model: grok-2-vision-1212
params:
- key: max_tokens
maxValue: 4096
sources:
- https://docs.x.ai/developers/release-notes
- https://docs.x.ai/docs/key-information/migrating-to-new-models
1 change: 1 addition & 0 deletions providers/xai/grok-2-vision-latest.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ features:
- vision
- chat
- tool_choice
isDeprecated: true
limits:
max_input_tokens: 32768
max_output_tokens: 32768
Expand Down
1 change: 1 addition & 0 deletions providers/xai/grok-2-vision.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ features:
- vision
- chat
- tool_choice
isDeprecated: true
limits:
max_input_tokens: 32768
max_output_tokens: 32768
Expand Down
21 changes: 9 additions & 12 deletions providers/xai/grok-3-beta.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,21 @@
costs:
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
input_cost_per_token_batches: 0.0000015
output_cost_per_token: 0.000015
region: us-east-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: eu-west-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
output_cost_per_token_batches: 0.0000075
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- system_messages
- prompt_caching
limits:
max_input_tokens: 131072
max_output_tokens: 131072
context_window: 131072
mode: chat
model: grok-3-beta
sources:
- https://docs.x.ai/developers/release-notes
- https://docs.x.ai/developers/rest-api-reference/inference/chat
1 change: 1 addition & 0 deletions providers/xai/grok-3-fast-beta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ features:
- function_calling
- chat
- tool_choice
isDeprecated: true
limits:
max_input_tokens: 131072
max_output_tokens: 131072
Expand Down
19 changes: 10 additions & 9 deletions providers/xai/grok-3-fast-latest.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,25 @@
costs:
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: us-east-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: eu-west-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 0.000003
input_cost_per_token_batches: 0.0000015
output_cost_per_token: 0.000015
output_cost_per_token_batches: 0.0000075
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-fast-latest
sources:
- https://docs.x.ai/docs/guides/reasoning
- https://docs.x.ai/docs/models
- https://docs.oracle.com/en-us/iaas/Content/generative-ai/xai-grok-3-fast.htm
18 changes: 9 additions & 9 deletions providers/xai/grok-3-fast.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,24 @@
costs:
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: us-east-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: eu-west-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 0.000003
input_cost_per_token_batches: 0.0000015
output_cost_per_token: 0.000015
output_cost_per_token_batches: 0.0000075
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
mode: chat
model: grok-3-fast
sources:
- https://docs.x.ai/developers/release-notes
- https://docs.x.ai/docs/guides/reasoning
- https://docs.oracle.com/en-us/iaas/Content/generative-ai/xai-grok-3-fast.htm
20 changes: 10 additions & 10 deletions providers/xai/grok-3-latest.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,24 @@
costs:
- cache_read_input_token_cost: 7.5e-7
input_cost_per_query: 0.005
input_cost_per_token: 0.000003
input_cost_per_token_batches: 0.0000015
output_cost_per_token: 0.000015
region: us-east-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
region: eu-west-1
- cache_read_input_token_cost: 7.5e-7
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 0.000003
output_cost_per_token: 0.000015
output_cost_per_token_batches: 0.0000075
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- system_messages
- prompt_caching
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-latest
sources:
- https://docs.x.ai/docs/models?cluster=us-west-1
34 changes: 23 additions & 11 deletions providers/xai/grok-3-mini-beta.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,36 @@
costs:
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: us-east-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: eu-west-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_image: 0
input_cost_per_query: 0.025
- cache_read_input_token_cost: 7.e-8
input_cost_per_query: 0.005
input_cost_per_token: 3.e-7
input_cost_per_token_batches: 1.5e-7
output_cost_per_token: 5.e-7
output_cost_per_token_batches: 2.5e-7
region: "*"
features:
- function_calling
- parallel_function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
- system_messages
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-mini-beta
params:
- defaultValue: null
key: reasoning_effort
type: string
removeParams:
- stop
sources:
- https://docs.x.ai/docs/guides/reasoning
- https://docs.x.ai/docs/guides/structured-outputs
- https://docs.x.ai/docs/guides/function-calling
- https://docs.x.ai/docs/guides/tools/overview
- https://docs.x.ai/developers/tools/tool-usage-details
thinking: true
23 changes: 12 additions & 11 deletions providers/xai/grok-3-mini-fast-beta.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,25 @@
costs:
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: us-east-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: eu-west-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_image: 0
input_cost_per_query: 0.025
- cache_read_input_token_cost: 7.e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
- system_messages
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-mini-fast-beta
params:
- key: max_tokens
maxValue: 131072
sources:
- https://docs.oracle.com/en-us/iaas/Content/generative-ai/xai-grok-3-mini-fast.htm
thinking: true
20 changes: 11 additions & 9 deletions providers/xai/grok-3-mini-fast-latest.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,26 @@
costs:
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: us-east-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: eu-west-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 3.e-7
input_cost_per_token_batches: 1.5e-7
output_cost_per_token: 5.e-7
output_cost_per_token_batches: 2.5e-7
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
- system_messages
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-mini-fast-latest
sources:
- https://docs.x.ai/docs/models/grok-3-mini-fast
- https://docs.x.ai/docs/models?cluster=us-west-1
thinking: true
18 changes: 9 additions & 9 deletions providers/xai/grok-3-mini-fast.yaml
Original file line number Diff line number Diff line change
@@ -1,24 +1,24 @@
costs:
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: us-east-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_token: 3.e-7
output_cost_per_token: 5.e-7
region: eu-west-1
- cache_read_input_token_cost: 7.5e-8
input_cost_per_image: 0
input_cost_per_query: 0.025
input_cost_per_token: 3.e-7
input_cost_per_token_batches: 1.5e-7
output_cost_per_token: 5.e-7
output_cost_per_token_batches: 2.5e-7
region: "*"
features:
- function_calling
- chat
- tool_choice
- response_schema
- prompt_caching
limits:
context_window: 131072
max_input_tokens: 131072
max_output_tokens: 131072
max_tokens: 131072
mode: chat
model: grok-3-mini-fast
sources:
- https://docs.x.ai/docs/models/grok-3-mini-fast
thinking: true
Loading