@@ -255,26 +255,26 @@ Low, high, and embedding models have different rate limits. To see which type of
255255 <td>1</td>
256256 </tr >
257257 <tr >
258- <th rowspan="4" scope="rowgroup" style="box-shadow: none" ><b>Azure OpenAI o1-mini </b></th>
258+ <th rowspan="4" scope="rowgroup"><b>Azure OpenAI o1 and o3</b></th>
259259 <th style="padding-left: 0"><b>Requests per minute</b></th>
260260 <td>Not applicable</td>
261+ <td>1</td>
262+ <td>2</td>
261263 <td>2</td>
262- <td>3</td>
263- <td>3</td>
264264 </tr >
265265 <tr >
266266 <th><b>Requests per day</b></th>
267267 <td>Not applicable</td>
268+ <td>8</td>
269+ <td>10</td>
268270 <td>12</td>
269- <td>15</td>
270- <td>20</td>
271271 </tr >
272272 <tr >
273273 <th><b>Tokens per request</b></th>
274274 <td>Not applicable</td>
275275 <td>4000 in, 4000 out</td>
276276 <td>4000 in, 4000 out</td>
277- <td>4000 in, 4000 out</td>
277+ <td>4000 in, 8000 out</td>
278278 </tr >
279279 <tr >
280280 <th><b>Concurrent requests</b></th>
@@ -284,7 +284,7 @@ Low, high, and embedding models have different rate limits. To see which type of
284284 <td>1</td>
285285 </tr >
286286 <tr >
287- <th rowspan="4" scope="rowgroup" style="box-shadow: none"><b>Azure OpenAI o3 -mini</b></th>
287+ <th rowspan="4" scope="rowgroup" style="box-shadow: none"><b>Azure OpenAI o1-mini, o3-mini, and o4-mini</b></th>
288288 <th style="padding-left: 0"><b>Requests per minute</b></th>
289289 <td>Not applicable</td>
290290 <td>2</td>
@@ -313,7 +313,7 @@ Low, high, and embedding models have different rate limits. To see which type of
313313 <td>1</td>
314314 </tr >
315315 <tr >
316- <th rowspan="4" scope="rowgroup" style="box-shadow: none"><b>DeepSeek-R1</b></th>
316+ <th rowspan="4" scope="rowgroup" style="box-shadow: none"><b>DeepSeek-R1 and MAI-DS-R1</b></th>
317317 <th style="padding-left: 0"><b>Requests per minute</b></th>
318318 <td>1</td>
319319 <td>1</td>
0 commit comments