Update models.yaml with latest OpenRouter data

This commit is contained in:
2026-02-20 12:08:00 -07:00
parent e798747135
commit ecf3780aed
+195 -132
View File
@@ -81,6 +81,7 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: o4-mini - name: o4-mini
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -93,6 +94,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: o4-mini-high - name: o4-mini-high
max_output_tokens: 100000
real_name: o4-mini real_name: o4-mini
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
@@ -107,6 +109,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: o3 - name: o3
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
@@ -133,6 +136,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: o3-mini - name: o3-mini
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -145,6 +149,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: o3-mini-high - name: o3-mini-high
max_output_tokens: 100000
real_name: o3-mini real_name: o3-mini
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
@@ -192,23 +197,23 @@
models: models:
- name: gemini-2.5-flash - name: gemini-2.5-flash
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 65536 max_output_tokens: 65535
input_price: 0 input_price: 0.3
output_price: 0 output_price: 2.5
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.5-pro - name: gemini-2.5-pro
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 65536 max_output_tokens: 65536
input_price: 0 input_price: 1.25
output_price: 0 output_price: 10
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.5-flash-lite - name: gemini-2.5-flash-lite
max_input_tokens: 1000000 max_input_tokens: 1048576
max_output_tokens: 64000 max_output_tokens: 65535
input_price: 0 input_price: 0.1
output_price: 0 output_price: 0.4
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.0-flash - name: gemini-2.0-flash
@@ -226,10 +231,11 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemma-3-27b-it - name: gemma-3-27b-it
max_input_tokens: 131072 supports_vision: true
max_output_tokens: 8192 max_input_tokens: 128000
input_price: 0 max_output_tokens: 65536
output_price: 0 input_price: 0.04
output_price: 0.15
- name: text-embedding-004 - name: text-embedding-004
type: embedding type: embedding
input_price: 0 input_price: 0
@@ -509,8 +515,8 @@
output_price: 10 output_price: 10
supports_vision: true supports_vision: true
- name: command-r7b-12-2024 - name: command-r7b-12-2024
max_input_tokens: 131072 max_input_tokens: 128000
max_output_tokens: 4096 max_output_tokens: 4000
input_price: 0.0375 input_price: 0.0375
output_price: 0.15 output_price: 0.15
- name: embed-v4.0 - name: embed-v4.0
@@ -547,6 +553,7 @@
- provider: xai - provider: xai
models: models:
- name: grok-4 - name: grok-4
supports_vision: true
max_input_tokens: 256000 max_input_tokens: 256000
input_price: 3 input_price: 3
output_price: 15 output_price: 15
@@ -583,14 +590,18 @@
- provider: perplexity - provider: perplexity
models: models:
- name: sonar-pro - name: sonar-pro
max_output_tokens: 8000
supports_vision: true
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 3 input_price: 3
output_price: 15 output_price: 15
- name: sonar - name: sonar
max_input_tokens: 128000 supports_vision: true
max_input_tokens: 127072
input_price: 1 input_price: 1
output_price: 1 output_price: 1
- name: sonar-reasoning-pro - name: sonar-reasoning-pro
supports_vision: true
max_input_tokens: 128000 max_input_tokens: 128000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
@@ -663,13 +674,13 @@
hipaa_safe: true hipaa_safe: true
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 65536 max_output_tokens: 65536
input_price: 0 input_price: 2
output_price: 0 output_price: 12
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.5-flash - name: gemini-2.5-flash
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 65536 max_output_tokens: 65535
input_price: 0.3 input_price: 0.3
output_price: 2.5 output_price: 2.5
supports_vision: true supports_vision: true
@@ -683,16 +694,16 @@
supports_function_calling: true supports_function_calling: true
- name: gemini-2.5-flash-lite - name: gemini-2.5-flash-lite
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 65536 max_output_tokens: 65535
input_price: 0.3 input_price: 0.1
output_price: 0.4 output_price: 0.4
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.0-flash-001 - name: gemini-2.0-flash-001
max_input_tokens: 1048576 max_input_tokens: 1048576
max_output_tokens: 8192 max_output_tokens: 8192
input_price: 0.15 input_price: 0.1
output_price: 0.6 output_price: 0.4
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: gemini-2.0-flash-lite-001 - name: gemini-2.0-flash-lite-001
@@ -1194,10 +1205,16 @@
- provider: qianwen - provider: qianwen
models: models:
- name: qwen3-max - name: qwen3-max
input_price: 1.2
output_price: 6
max_output_tokens: 32768
max_input_tokens: 262144 max_input_tokens: 262144
supports_function_calling: true supports_function_calling: true
- name: qwen-plus - name: qwen-plus
max_input_tokens: 131072 input_price: 0.4
output_price: 1.2
max_output_tokens: 32768
max_input_tokens: 1000000
supports_function_calling: true supports_function_calling: true
- name: qwen-flash - name: qwen-flash
max_input_tokens: 1000000 max_input_tokens: 1000000
@@ -1213,14 +1230,14 @@
- name: qwen-coder-flash - name: qwen-coder-flash
max_input_tokens: 1000000 max_input_tokens: 1000000
- name: qwen3-next-80b-a3b-instruct - name: qwen3-next-80b-a3b-instruct
max_input_tokens: 131072 max_input_tokens: 262144
input_price: 0.14 input_price: 0.09
output_price: 0.56 output_price: 1.1
supports_function_calling: true supports_function_calling: true
- name: qwen3-next-80b-a3b-thinking - name: qwen3-next-80b-a3b-thinking
max_input_tokens: 131072 max_input_tokens: 128000
input_price: 0.14 input_price: 0.15
output_price: 1.4 output_price: 1.2
- name: qwen3-235b-a22b-instruct-2507 - name: qwen3-235b-a22b-instruct-2507
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.28 input_price: 0.28
@@ -1228,35 +1245,39 @@
supports_function_calling: true supports_function_calling: true
- name: qwen3-235b-a22b-thinking-2507 - name: qwen3-235b-a22b-thinking-2507
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.28 input_price: 0
output_price: 2.8 output_price: 0
- name: qwen3-30b-a3b-instruct-2507 - name: qwen3-30b-a3b-instruct-2507
max_input_tokens: 131072 max_output_tokens: 262144
input_price: 0.105 max_input_tokens: 262144
output_price: 0.42 input_price: 0.09
output_price: 0.3
supports_function_calling: true supports_function_calling: true
- name: qwen3-30b-a3b-thinking-2507 - name: qwen3-30b-a3b-thinking-2507
max_input_tokens: 131072 max_input_tokens: 32768
input_price: 0.105 input_price: 0.051
output_price: 1.05 output_price: 0.34
- name: qwen3-vl-32b-instruct - name: qwen3-vl-32b-instruct
max_output_tokens: 32768
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.28 input_price: 0.104
output_price: 1.12 output_price: 0.416
supports_vision: true supports_vision: true
- name: qwen3-vl-8b-instruct - name: qwen3-vl-8b-instruct
max_output_tokens: 32768
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.07 input_price: 0.08
output_price: 0.28 output_price: 0.5
supports_vision: true supports_vision: true
- name: qwen3-coder-480b-a35b-instruct - name: qwen3-coder-480b-a35b-instruct
max_input_tokens: 262144 max_input_tokens: 262144
input_price: 1.26 input_price: 1.26
output_price: 5.04 output_price: 5.04
- name: qwen3-coder-30b-a3b-instruct - name: qwen3-coder-30b-a3b-instruct
max_input_tokens: 262144 max_output_tokens: 32768
input_price: 0.315 max_input_tokens: 160000
output_price: 1.26 input_price: 0.07
output_price: 0.27
- name: deepseek-v3.2-exp - name: deepseek-v3.2-exp
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.28 input_price: 0.28
@@ -1332,9 +1353,9 @@
output_price: 8.12 output_price: 8.12
supports_vision: true supports_vision: true
- name: kimi-k2-thinking - name: kimi-k2-thinking
max_input_tokens: 262144 max_input_tokens: 131072
input_price: 0.56 input_price: 0.47
output_price: 2.24 output_price: 2
supports_vision: true supports_vision: true
# Links: # Links:
@@ -1343,10 +1364,10 @@
- provider: deepseek - provider: deepseek
models: models:
- name: deepseek-chat - name: deepseek-chat
max_input_tokens: 64000 max_input_tokens: 163840
max_output_tokens: 8192 max_output_tokens: 163840
input_price: 0.56 input_price: 0.32
output_price: 1.68 output_price: 0.89
supports_function_calling: true supports_function_calling: true
- name: deepseek-reasoner - name: deepseek-reasoner
max_input_tokens: 64000 max_input_tokens: 64000
@@ -1424,9 +1445,10 @@
- provider: minimax - provider: minimax
models: models:
- name: minimax-m2 - name: minimax-m2
max_input_tokens: 204800 max_output_tokens: 65536
input_price: 0.294 max_input_tokens: 196608
output_price: 1.176 input_price: 0.255
output_price: 1
supports_function_calling: true supports_function_calling: true
# Links: # Links:
@@ -1442,8 +1464,8 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: openai/gpt-5.1-chat - name: openai/gpt-5.1-chat
max_input_tokens: 400000 max_input_tokens: 128000
max_output_tokens: 128000 max_output_tokens: 16384
input_price: 1.25 input_price: 1.25
output_price: 10 output_price: 10
supports_vision: true supports_vision: true
@@ -1456,8 +1478,8 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: openai/gpt-5-chat - name: openai/gpt-5-chat
max_input_tokens: 400000 max_input_tokens: 128000
max_output_tokens: 128000 max_output_tokens: 16384
input_price: 1.25 input_price: 1.25
output_price: 10 output_price: 10
supports_vision: true supports_vision: true
@@ -1498,18 +1520,21 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: openai/gpt-4o - name: openai/gpt-4o
max_output_tokens: 16384
max_input_tokens: 128000 max_input_tokens: 128000
input_price: 2.5 input_price: 2.5
output_price: 10 output_price: 10
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: openai/gpt-4o-mini - name: openai/gpt-4o-mini
max_output_tokens: 16384
max_input_tokens: 128000 max_input_tokens: 128000
input_price: 0.15 input_price: 0.15
output_price: 0.6 output_price: 0.6
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: openai/o4-mini - name: openai/o4-mini
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -1522,6 +1547,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: openai/o4-mini-high - name: openai/o4-mini-high
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -1535,6 +1561,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: openai/o3 - name: openai/o3
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
@@ -1560,6 +1587,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: openai/o3-mini - name: openai/o3-mini
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -1571,6 +1599,7 @@
temperature: null temperature: null
top_p: null top_p: null
- name: openai/o3-mini-high - name: openai/o3-mini-high
max_output_tokens: 100000
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 1.1 input_price: 1.1
output_price: 4.4 output_price: 4.4
@@ -1583,50 +1612,57 @@
top_p: null top_p: null
- name: openai/gpt-oss-120b - name: openai/gpt-oss-120b
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.09 input_price: 0.039
output_price: 0.45 output_price: 0.19
supports_function_calling: true supports_function_calling: true
- name: openai/gpt-oss-20b - name: openai/gpt-oss-20b
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.04 input_price: 0.03
output_price: 0.16 output_price: 0.14
supports_function_calling: true supports_function_calling: true
- name: google/gemini-2.5-flash - name: google/gemini-2.5-flash
max_output_tokens: 65535
max_input_tokens: 1048576 max_input_tokens: 1048576
input_price: 0.3 input_price: 0.3
output_price: 2.5 output_price: 2.5
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: google/gemini-2.5-pro - name: google/gemini-2.5-pro
max_output_tokens: 65536
max_input_tokens: 1048576 max_input_tokens: 1048576
input_price: 1.25 input_price: 1.25
output_price: 10 output_price: 10
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: google/gemini-2.5-flash-lite - name: google/gemini-2.5-flash-lite
max_output_tokens: 65535
max_input_tokens: 1048576 max_input_tokens: 1048576
input_price: 0.3 input_price: 0.1
output_price: 0.4 output_price: 0.4
supports_vision: true supports_vision: true
- name: google/gemini-2.0-flash-001 - name: google/gemini-2.0-flash-001
max_input_tokens: 1000000 max_output_tokens: 8192
input_price: 0.15 max_input_tokens: 1048576
output_price: 0.6 input_price: 0.1
output_price: 0.4
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: google/gemini-2.0-flash-lite-001 - name: google/gemini-2.0-flash-lite-001
max_output_tokens: 8192
max_input_tokens: 1048576 max_input_tokens: 1048576
input_price: 0.075 input_price: 0.075
output_price: 0.3 output_price: 0.3
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: google/gemma-3-27b-it - name: google/gemma-3-27b-it
max_input_tokens: 131072 max_output_tokens: 65536
input_price: 0.1 supports_vision: true
output_price: 0.2 max_input_tokens: 128000
input_price: 0.04
output_price: 0.15
- name: anthropic/claude-sonnet-4.5 - name: anthropic/claude-sonnet-4.5
max_input_tokens: 200000 max_input_tokens: 1000000
max_output_tokens: 8192 max_output_tokens: 64000
require_max_tokens: true require_max_tokens: true
input_price: 3 input_price: 3
output_price: 15 output_price: 15
@@ -1634,7 +1670,7 @@
supports_function_calling: true supports_function_calling: true
- name: anthropic/claude-haiku-4.5 - name: anthropic/claude-haiku-4.5
max_input_tokens: 200000 max_input_tokens: 200000
max_output_tokens: 8192 max_output_tokens: 64000
require_max_tokens: true require_max_tokens: true
input_price: 1 input_price: 1
output_price: 5 output_price: 5
@@ -1642,7 +1678,7 @@
supports_function_calling: true supports_function_calling: true
- name: anthropic/claude-opus-4.1 - name: anthropic/claude-opus-4.1
max_input_tokens: 200000 max_input_tokens: 200000
max_output_tokens: 8192 max_output_tokens: 32000
require_max_tokens: true require_max_tokens: true
input_price: 15 input_price: 15
output_price: 75 output_price: 75
@@ -1650,15 +1686,15 @@
supports_function_calling: true supports_function_calling: true
- name: anthropic/claude-opus-4 - name: anthropic/claude-opus-4
max_input_tokens: 200000 max_input_tokens: 200000
max_output_tokens: 8192 max_output_tokens: 32000
require_max_tokens: true require_max_tokens: true
input_price: 15 input_price: 15
output_price: 75 output_price: 75
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: anthropic/claude-sonnet-4 - name: anthropic/claude-sonnet-4
max_input_tokens: 200000 max_input_tokens: 1000000
max_output_tokens: 8192 max_output_tokens: 64000
require_max_tokens: true require_max_tokens: true
input_price: 3 input_price: 3
output_price: 15 output_price: 15
@@ -1666,7 +1702,7 @@
supports_function_calling: true supports_function_calling: true
- name: anthropic/claude-3.7-sonnet - name: anthropic/claude-3.7-sonnet
max_input_tokens: 200000 max_input_tokens: 200000
max_output_tokens: 8192 max_output_tokens: 64000
require_max_tokens: true require_max_tokens: true
input_price: 3 input_price: 3
output_price: 15 output_price: 15
@@ -1681,21 +1717,24 @@
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: meta-llama/llama-4-maverick - name: meta-llama/llama-4-maverick
max_output_tokens: 16384
max_input_tokens: 1048576 max_input_tokens: 1048576
input_price: 0.18 input_price: 0.15
output_price: 0.6 output_price: 0.6
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: meta-llama/llama-4-scout - name: meta-llama/llama-4-scout
max_output_tokens: 16384
max_input_tokens: 327680 max_input_tokens: 327680
input_price: 0.08 input_price: 0.08
output_price: 0.3 output_price: 0.3
supports_vision: true supports_vision: true
supports_function_calling: true supports_function_calling: true
- name: meta-llama/llama-3.3-70b-instruct - name: meta-llama/llama-3.3-70b-instruct
max_output_tokens: 16384
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.12 input_price: 0.1
output_price: 0.3 output_price: 0.32
- name: mistralai/mistral-medium-3.1 - name: mistralai/mistral-medium-3.1
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.4 input_price: 0.4
@@ -1703,9 +1742,10 @@
supports_function_calling: true supports_function_calling: true
supports_vision: true supports_vision: true
- name: mistralai/mistral-small-3.2-24b-instruct - name: mistralai/mistral-small-3.2-24b-instruct
max_output_tokens: 131072
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.1 input_price: 0.06
output_price: 0.3 output_price: 0.18
supports_vision: true supports_vision: true
- name: mistralai/magistral-medium-2506 - name: mistralai/magistral-medium-2506
max_input_tokens: 40960 max_input_tokens: 40960
@@ -1726,8 +1766,8 @@
supports_function_calling: true supports_function_calling: true
- name: mistralai/devstral-small - name: mistralai/devstral-small
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.07 input_price: 0.1
output_price: 0.28 output_price: 0.3
supports_function_calling: true supports_function_calling: true
- name: mistralai/codestral-2508 - name: mistralai/codestral-2508
max_input_tokens: 256000 max_input_tokens: 256000
@@ -1735,6 +1775,7 @@
output_price: 0.9 output_price: 0.9
supports_function_calling: true supports_function_calling: true
- name: ai21/jamba-large-1.7 - name: ai21/jamba-large-1.7
max_output_tokens: 4096
max_input_tokens: 256000 max_input_tokens: 256000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
@@ -1745,88 +1786,98 @@
output_price: 0.4 output_price: 0.4
supports_function_calling: true supports_function_calling: true
- name: cohere/command-a - name: cohere/command-a
max_output_tokens: 8192
max_input_tokens: 256000 max_input_tokens: 256000
input_price: 2.5 input_price: 2.5
output_price: 10 output_price: 10
supports_function_calling: true supports_function_calling: true
- name: cohere/command-r7b-12-2024 - name: cohere/command-r7b-12-2024
max_input_tokens: 128000 max_input_tokens: 128000
max_output_tokens: 4096 max_output_tokens: 4000
input_price: 0.0375 input_price: 0.0375
output_price: 0.15 output_price: 0.15
- name: deepseek/deepseek-v3.2-exp - name: deepseek/deepseek-v3.2-exp
max_output_tokens: 65536
max_input_tokens: 163840 max_input_tokens: 163840
input_price: 0.27 input_price: 0.27
output_price: 0.40 output_price: 0.41
- name: deepseek/deepseek-v3.1-terminus - name: deepseek/deepseek-v3.1-terminus
max_input_tokens: 163840 max_input_tokens: 163840
input_price: 0.23 input_price: 0.21
output_price: 0.90 output_price: 0.79
- name: deepseek/deepseek-chat-v3.1 - name: deepseek/deepseek-chat-v3.1
max_input_tokens: 163840 max_output_tokens: 7168
input_price: 0.2 max_input_tokens: 32768
output_price: 0.8 input_price: 0.15
output_price: 0.75
- name: deepseek/deepseek-r1-0528 - name: deepseek/deepseek-r1-0528
max_input_tokens: 128000 max_output_tokens: 65536
input_price: 0.50 max_input_tokens: 163840
output_price: 2.15 input_price: 0.4
output_price: 1.75
patch: patch:
body: body:
include_reasoning: true include_reasoning: true
- name: qwen/qwen3-max - name: qwen/qwen3-max
max_output_tokens: 32768
max_input_tokens: 262144 max_input_tokens: 262144
input_price: 1.2 input_price: 1.2
output_price: 6 output_price: 6
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen-plus - name: qwen/qwen-plus
max_input_tokens: 131072 max_input_tokens: 1000000
max_output_tokens: 8192 max_output_tokens: 32768
input_price: 0.4 input_price: 0.4
output_price: 1.2 output_price: 1.2
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen3-next-80b-a3b-instruct - name: qwen/qwen3-next-80b-a3b-instruct
max_input_tokens: 262144 max_input_tokens: 262144
input_price: 0.1 input_price: 0.09
output_price: 0.8 output_price: 1.1
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen3-next-80b-a3b-thinking - name: qwen/qwen3-next-80b-a3b-thinking
max_input_tokens: 262144 max_input_tokens: 128000
input_price: 0.1 input_price: 0.15
output_price: 0.8 output_price: 1.2
- name: qwen/qwen3-235b-a22b-2507 # Qwen3 235B A22B Instruct 2507 - name: qwen/qwen3-235b-a22b-2507 # Qwen3 235B A22B Instruct 2507
max_input_tokens: 262144 max_input_tokens: 262144
input_price: 0.12 input_price: 0.12
output_price: 0.59 output_price: 0.59
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen3-235b-a22b-thinking-2507 - name: qwen/qwen3-235b-a22b-thinking-2507
max_input_tokens: 262144
input_price: 0.118
output_price: 0.118
- name: qwen/qwen3-30b-a3b-instruct-2507
max_input_tokens: 131072 max_input_tokens: 131072
input_price: 0.2 input_price: 0
output_price: 0.8 output_price: 0
- name: qwen/qwen3-30b-a3b-instruct-2507
max_output_tokens: 262144
max_input_tokens: 262144
input_price: 0.09
output_price: 0.3
- name: qwen/qwen3-30b-a3b-thinking-2507 - name: qwen/qwen3-30b-a3b-thinking-2507
max_input_tokens: 262144 max_input_tokens: 32768
input_price: 0.071 input_price: 0.051
output_price: 0.285 output_price: 0.34
- name: qwen/qwen3-vl-32b-instruct - name: qwen/qwen3-vl-32b-instruct
max_input_tokens: 262144 max_output_tokens: 32768
input_price: 0.35 max_input_tokens: 131072
output_price: 1.1 input_price: 0.104
output_price: 0.416
supports_vision: true supports_vision: true
- name: qwen/qwen3-vl-8b-instruct - name: qwen/qwen3-vl-8b-instruct
max_input_tokens: 262144 max_output_tokens: 32768
max_input_tokens: 131072
input_price: 0.08 input_price: 0.08
output_price: 0.50 output_price: 0.5
supports_vision: true supports_vision: true
- name: qwen/qwen3-coder-plus - name: qwen/qwen3-coder-plus
max_input_tokens: 128000 max_output_tokens: 65536
max_input_tokens: 1000000
input_price: 1 input_price: 1
output_price: 5 output_price: 5
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen3-coder-flash - name: qwen/qwen3-coder-flash
max_input_tokens: 128000 max_output_tokens: 65536
max_input_tokens: 1000000
input_price: 0.3 input_price: 0.3
output_price: 1.5 output_price: 1.5
supports_function_calling: true supports_function_calling: true
@@ -1836,19 +1887,20 @@
output_price: 0.95 output_price: 0.95
supports_function_calling: true supports_function_calling: true
- name: qwen/qwen3-coder-30b-a3b-instruct - name: qwen/qwen3-coder-30b-a3b-instruct
max_input_tokens: 262144 max_output_tokens: 32768
input_price: 0.052 max_input_tokens: 160000
output_price: 0.207 input_price: 0.07
output_price: 0.27
supports_function_calling: true supports_function_calling: true
- name: moonshotai/kimi-k2-0905 - name: moonshotai/kimi-k2-0905
max_input_tokens: 262144 max_input_tokens: 131072
input_price: 0.296 input_price: 0.4
output_price: 1.185 output_price: 2
supports_function_calling: true supports_function_calling: true
- name: moonshotai/kimi-k2-thinking - name: moonshotai/kimi-k2-thinking
max_input_tokens: 262144 max_input_tokens: 131072
input_price: 0.45 input_price: 0.47
output_price: 2.35 output_price: 2
supports_function_calling: true supports_function_calling: true
- name: moonshotai/kimi-dev-72b - name: moonshotai/kimi-dev-72b
max_input_tokens: 131072 max_input_tokens: 131072
@@ -1856,21 +1908,26 @@
output_price: 1.15 output_price: 1.15
supports_function_calling: true supports_function_calling: true
- name: x-ai/grok-4 - name: x-ai/grok-4
supports_vision: true
max_input_tokens: 256000 max_input_tokens: 256000
input_price: 3 input_price: 3
output_price: 15 output_price: 15
supports_function_calling: true supports_function_calling: true
- name: x-ai/grok-4-fast - name: x-ai/grok-4-fast
max_output_tokens: 30000
supports_vision: true
max_input_tokens: 2000000 max_input_tokens: 2000000
input_price: 0.2 input_price: 0.2
output_price: 0.5 output_price: 0.5
supports_function_calling: true supports_function_calling: true
- name: x-ai/grok-code-fast-1 - name: x-ai/grok-code-fast-1
max_output_tokens: 10000
max_input_tokens: 256000 max_input_tokens: 256000
input_price: 0.2 input_price: 0.2
output_price: 1.5 output_price: 1.5
supports_function_calling: true supports_function_calling: true
- name: amazon/nova-premier-v1 - name: amazon/nova-premier-v1
max_output_tokens: 32000
max_input_tokens: 1000000 max_input_tokens: 1000000
input_price: 2.5 input_price: 2.5
output_price: 12.5 output_price: 12.5
@@ -1893,14 +1950,18 @@
input_price: 0.035 input_price: 0.035
output_price: 0.14 output_price: 0.14
- name: perplexity/sonar-pro - name: perplexity/sonar-pro
max_output_tokens: 8000
supports_vision: true
max_input_tokens: 200000 max_input_tokens: 200000
input_price: 3 input_price: 3
output_price: 15 output_price: 15
- name: perplexity/sonar - name: perplexity/sonar
supports_vision: true
max_input_tokens: 127072 max_input_tokens: 127072
input_price: 1 input_price: 1
output_price: 1 output_price: 1
- name: perplexity/sonar-reasoning-pro - name: perplexity/sonar-reasoning-pro
supports_vision: true
max_input_tokens: 128000 max_input_tokens: 128000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
@@ -1915,20 +1976,22 @@
body: body:
include_reasoning: true include_reasoning: true
- name: perplexity/sonar-deep-research - name: perplexity/sonar-deep-research
max_input_tokens: 200000 max_input_tokens: 128000
input_price: 2 input_price: 2
output_price: 8 output_price: 8
patch: patch:
body: body:
include_reasoning: true include_reasoning: true
- name: minimax/minimax-m2 - name: minimax/minimax-m2
max_output_tokens: 65536
max_input_tokens: 196608 max_input_tokens: 196608
input_price: 0.15 input_price: 0.255
output_price: 0.45 output_price: 1
- name: z-ai/glm-4.6 - name: z-ai/glm-4.6
max_output_tokens: 131072
max_input_tokens: 202752 max_input_tokens: 202752
input_price: 0.5 input_price: 0.35
output_price: 1.75 output_price: 1.71
supports_function_calling: true supports_function_calling: true
# Links: # Links: