|
24 | 24 | "gpt-4o-2024-08-06": 128000, |
25 | 25 | "gpt-4o-2024-05-13": 128000, |
26 | 26 | "gpt-4o-mini": 128000, |
27 | | - "gpt-4.1": 1000000, |
28 | | - "gpt-4.1-mini": 1000000, |
29 | | - "gpt-4.1-nano": 1000000, |
| 27 | + "gpt-4.1": 1048576, |
| 28 | + "gpt-4.1-mini": 1048576, |
| 29 | + "gpt-4.1-nano": 1048576, |
30 | 30 | "gpt-4.5": 128000, |
31 | 31 | "gpt-4.5-preview": 128000, |
32 | | - "o1-preview": 128000, |
| 32 | + "o1-preview": 200000, |
33 | 33 | "o1-mini": 128000, |
34 | | - "o1": 128000, |
| 34 | + "o1": 200000, |
| 35 | + "o1-pro": 200000, |
35 | 36 | "o3-mini": 200000, |
| 37 | + "o3": 200000, |
| 38 | + "o3-pro": 200000, |
| 39 | + "o4-mini": 200000, |
| 40 | + "o3-deep-research": 200000, |
| 41 | + "o4-mini-deep-research": 200000, |
| 42 | + "gpt-5": 200000, |
| 43 | + "gpt-5.1": 200000, |
36 | 44 | "gpt-5.2": 128000, |
37 | 45 | "gpt-5.2-pro": 128000, |
| 46 | + "gpt-5.2-codex": 128000, |
| 47 | + "gpt-5.1-codex": 200000, |
| 48 | + "gpt-5.1-codex-max": 200000, |
| 49 | + "gpt-5.1-codex-mini": 200000, |
| 50 | + "gpt-5-codex": 200000, |
38 | 51 | "gpt-5.2-chat-latest": 128000, |
| 52 | + "gpt-5.1-chat-latest": 200000, |
| 53 | + "gpt-5-chat-latest": 200000, |
39 | 54 | "gpt-5-mini": 128000, |
40 | 55 | "gpt-5-nano": 128000, |
| 56 | + "gpt-oss-120b": 128000, |
| 57 | + "gpt-oss-20b": 128000, |
41 | 58 | }, |
42 | 59 | "azure_openai": { |
43 | 60 | "gpt-3.5-turbo-0125": 16385, |
|
58 | 75 | "gpt-4o": 128000, |
59 | 76 | "gpt-4o-mini": 128000, |
60 | 77 | "chatgpt-4o-latest": 128000, |
61 | | - "o1-preview": 128000, |
| 78 | + "o1-preview": 200000, |
62 | 79 | "o1-mini": 128000, |
| 80 | + "o1": 200000, |
| 81 | + "o1-pro": 200000, |
| 82 | + "o3-mini": 200000, |
| 83 | + "o3": 200000, |
| 84 | + "o3-pro": 200000, |
| 85 | + "o4-mini": 200000, |
| 86 | + "gpt-4.1": 1048576, |
| 87 | + "gpt-4.1-mini": 1048576, |
| 88 | + "gpt-4.1-nano": 1048576, |
| 89 | + "gpt-5": 200000, |
| 90 | + "gpt-5.1": 200000, |
63 | 91 | "gpt-5.2": 128000, |
64 | 92 | "gpt-5.2-pro": 128000, |
| 93 | + "gpt-5.2-codex": 128000, |
| 94 | + "gpt-5.1-codex": 200000, |
| 95 | + "gpt-5.1-codex-max": 200000, |
| 96 | + "gpt-5.1-codex-mini": 200000, |
| 97 | + "gpt-5-codex": 200000, |
65 | 98 | "gpt-5.2-chat-latest": 128000, |
| 99 | + "gpt-5.1-chat-latest": 200000, |
| 100 | + "gpt-5-chat-latest": 200000, |
66 | 101 | "gpt-5-mini": 128000, |
67 | 102 | "gpt-5-nano": 128000, |
| 103 | + "gpt-oss-120b": 128000, |
| 104 | + "gpt-oss-20b": 128000, |
68 | 105 | }, |
69 | 106 | "google_genai": { |
70 | 107 | "gemini-pro": 128000, |
|
79 | 116 | "gemini-1.5-flash": 128000, |
80 | 117 | "gemini-1.5-pro": 128000, |
81 | 118 | "gemini-1.0-pro": 128000, |
| 119 | + "gemini-2.0-flash": 1048576, |
| 120 | + "gemini-2.0-flash-exp": 1048576, |
| 121 | + "gemini-2.0-pro": 2000000, |
| 122 | + "gemini-2.0-pro-exp": 2000000, |
82 | 123 | }, |
83 | 124 | "ollama": { |
84 | 125 | "command-r": 12800, |
|
96 | 137 | "llama3.1": 128000, |
97 | 138 | "llama3.1:8b": 128000, |
98 | 139 | "llama3.1:70b": 128000, |
99 | | - "lama3.1:405b": 128000, |
| 140 | + "llama3.1:405b": 128000, |
100 | 141 | "llama3.2": 128000, |
101 | 142 | "llama3.2:1b": 128000, |
102 | 143 | "llama3.2:3b": 128000, |
|
139 | 180 | "qwen-turbo": 6000, |
140 | 181 | }, |
141 | 182 | "nvidia": { |
142 | | - "meta/llama3-70b-instruct": 419, |
143 | | - "meta/llama3-8b-instruct": 419, |
| 183 | + "meta/llama3-70b-instruct": 8192, |
| 184 | + "meta/llama3-8b-instruct": 8192, |
144 | 185 | "nemotron-4-340b-instruct": 1024, |
145 | 186 | "databricks/dbrx-instruct": 4096, |
146 | 187 | "google/codegemma-7b": 8192, |
|
155 | 196 | "mistralai/mixtral-8x22b-instruct-v0.1": 32768, |
156 | 197 | "mistralai/mixtral-8x7b-instruct-v0.1": 8192, |
157 | 198 | "snowflake/arctic": 16384, |
| 199 | + "meta/llama-3.3-70b-instruct": 128000, |
158 | 200 | }, |
159 | 201 | "groq": { |
160 | 202 | "llama3-8b-8192": 8192, |
|
0 commit comments