|
20 | 20 | ] |
21 | 21 |
|
22 | 22 | CHAT_MODEL_ARGS_DICT = { |
| 23 | + "openai/gpt-5-2025-08-07": OpenAIModelArgs( |
| 24 | + model_name="gpt-5-2025-08-07", |
| 25 | + max_total_tokens=400_000, |
| 26 | + max_input_tokens=256_000, |
| 27 | + max_new_tokens=128_000, |
| 28 | + temperature=1, # gpt-5 supports temperature of 1 only |
| 29 | + vision_support=True, |
| 30 | + ), |
23 | 31 | "openai/gpt-5-nano-2025-08-07": OpenAIModelArgs( |
24 | 32 | model_name="gpt-5-nano-2025-08-07", |
25 | | - max_total_tokens=128_000, |
26 | | - max_input_tokens=128_000, |
27 | | - max_new_tokens=16_384, |
| 33 | + max_total_tokens=400_000, |
| 34 | + max_input_tokens=256_000, |
| 35 | + max_new_tokens=128_000, |
28 | 36 | temperature=1, # gpt-5 supports temperature of 1 only |
29 | 37 | vision_support=True, |
30 | 38 | ), |
31 | 39 | "openai/gpt-5-mini-2025-08-07": OpenAIModelArgs( |
32 | 40 | model_name="gpt-5-mini-2025-08-07", |
33 | | - max_total_tokens=128_000, |
34 | | - max_input_tokens=128_000, |
35 | | - max_new_tokens=16_384, |
| 41 | + max_total_tokens=400_000, |
| 42 | + max_input_tokens=256_000, |
| 43 | + max_new_tokens=128_000, |
36 | 44 | temperature=1, # gpt-5 supports temperature of 1 only |
37 | 45 | vision_support=True, |
38 | 46 | ), |
|
111 | 119 | max_new_tokens=64_000, |
112 | 120 | temperature=1e-1, |
113 | 121 | ), |
114 | | - "openai/gpt-5-nano-2025-08-07": OpenAIModelArgs( |
115 | | - model_name="gpt-5-nano-2025-08-07", |
116 | | - max_total_tokens=400_000, |
117 | | - max_input_tokens=400_000 - 4_000, |
118 | | - max_new_tokens=4_000, |
119 | | - temperature=1, # temperature param not supported by gpt-5 |
120 | | - ), |
121 | | - "openai/gpt-5-mini-2025-08-07": OpenAIModelArgs( |
122 | | - model_name="gpt-5-mini-2025-08-07", |
123 | | - max_total_tokens=400_000, |
124 | | - max_input_tokens=400_000 - 4_000, |
125 | | - max_new_tokens=4_000, |
126 | | - temperature=1, # temperature param not supported by gpt-5 |
127 | | - ), |
128 | 122 | "azure/gpt-35-turbo/gpt-35-turbo": AzureModelArgs( |
129 | 123 | model_name="gpt-35-turbo", |
130 | | - deployment_name="gpt-35-turbo", |
131 | 124 | max_total_tokens=8_192, |
132 | 125 | max_input_tokens=7500, |
133 | 126 | max_new_tokens=500, |
134 | 127 | ), |
135 | 128 | "azure/gpt-4o-2024-05-13": AzureModelArgs( |
136 | 129 | model_name="gpt-4o", |
137 | | - deployment_name="gpt-4o-2024-05-13", |
138 | 130 | max_total_tokens=128_000, |
139 | 131 | max_input_tokens=100_000, |
140 | 132 | max_new_tokens=16_384, |
141 | 133 | vision_support=True, |
142 | 134 | ), |
143 | 135 | "azure/gpt-4o-2024-08-06": AzureModelArgs( |
144 | 136 | model_name="gpt-4o", |
145 | | - deployment_name="gpt-4o-2024-08-06", |
146 | 137 | max_total_tokens=128_000, |
147 | 138 | max_input_tokens=128_000, |
148 | 139 | max_new_tokens=16_384, |
149 | 140 | vision_support=True, |
150 | 141 | ), |
151 | 142 | "azure/gpt-4o-mini-2024-07-18": AzureModelArgs( |
152 | 143 | model_name="gpt-4o-mini", |
153 | | - deployment_name="gpt-4o-mini-2024-07-18", |
154 | 144 | max_total_tokens=128_000, |
155 | 145 | max_input_tokens=128_000, |
156 | 146 | max_new_tokens=16_384, |
157 | 147 | vision_support=True, |
158 | 148 | ), |
| 149 | + "azure/gpt-4.1-2025-04-14": AzureModelArgs( |
| 150 | + model_name="gpt-4.1", |
| 151 | + max_total_tokens=128_000, |
| 152 | + max_input_tokens=128_000, |
| 153 | + max_new_tokens=16_384, |
| 154 | + vision_support=True, |
| 155 | + ), |
| 156 | + "azure/gpt-4.1-mini-2025-04-14": AzureModelArgs( |
| 157 | + model_name="gpt-4.1-mini", |
| 158 | + max_total_tokens=128_000, |
| 159 | + max_input_tokens=128_000, |
| 160 | + max_new_tokens=16_384, |
| 161 | + vision_support=True, |
| 162 | + ), |
| 163 | + "azure/gpt-5-2025-08-07": AzureModelArgs( |
| 164 | + model_name="gpt-5", |
| 165 | + max_total_tokens=400_000, |
| 166 | + max_input_tokens=256_000, |
| 167 | + max_new_tokens=128_000, |
| 168 | + temperature=1, # gpt-5 supports temperature of 1 only |
| 169 | + vision_support=True, |
| 170 | + ), |
| 171 | + "azure/gpt-5-mini-2025-08-07": AzureModelArgs( |
| 172 | + model_name="gpt-5-mini", |
| 173 | + max_total_tokens=400_000, |
| 174 | + max_input_tokens=256_000, |
| 175 | + max_new_tokens=128_000, |
| 176 | + temperature=1, # gpt-5 supports temperature of 1 only |
| 177 | + vision_support=True, |
| 178 | + ), |
| 179 | + "azure/gpt-5-nano-2025-08-07": AzureModelArgs( |
| 180 | + model_name="gpt-5-nano", |
| 181 | + max_total_tokens=400_000, |
| 182 | + max_input_tokens=256_000, |
| 183 | + max_new_tokens=128_000, |
| 184 | + temperature=1, # gpt-5 supports temperature of 1 only |
| 185 | + vision_support=True, |
| 186 | + ), |
159 | 187 | # ---------------- Anthropic ----------------# |
160 | 188 | "anthropic/claude-3-7-sonnet-20250219": AnthropicModelArgs( |
161 | 189 | model_name="claude-3-7-sonnet-20250219", |
|
0 commit comments