@@ -265,7 +265,7 @@ Low, high, and embedding models have different rate limits. To see which type of
265265 <td>1</td>
266266 </tr >
267267 <tr >
268- <th rowspan="4" scope="rowgroup"><b>Azure OpenAI o1 and o3, xAI Grok-3 </b></th>
268+ <th rowspan="4" scope="rowgroup"><b>Azure OpenAI o1 and o3</b></th>
269269 <th style="padding-left: 0"><b>Requests per minute</b></th>
270270 <td>Not applicable</td>
271271 <td>1</td>
@@ -294,7 +294,7 @@ Low, high, and embedding models have different rate limits. To see which type of
294294 <td>1</td>
295295 </tr >
296296 <tr >
297- <th rowspan="4" scope="rowgroup" style="box-shadow: none" ><b>Azure OpenAI o1-mini, o3-mini, and o4-mini</b></th>
297+ <th rowspan="4" scope="rowgroup"><b>Azure OpenAI o1-mini, o3-mini, and o4-mini</b></th>
298298 <th style="padding-left: 0"><b>Requests per minute</b></th>
299299 <td>Not applicable</td>
300300 <td>2</td>
@@ -323,7 +323,7 @@ Low, high, and embedding models have different rate limits. To see which type of
323323 <td>1</td>
324324 </tr >
325325 <tr >
326- <th rowspan="4" scope="rowgroup" style="box-shadow: none" ><b>DeepSeek-R1 and MAI-DS-R1</b></th>
326+ <th rowspan="4" scope="rowgroup"><b>DeepSeek-R1 and MAI-DS-R1</b></th>
327327 <th style="padding-left: 0"><b>Requests per minute</b></th>
328328 <td>1</td>
329329 <td>1</td>
@@ -351,6 +351,64 @@ Low, high, and embedding models have different rate limits. To see which type of
351351 <td>1</td>
352352 <td>1</td>
353353 </tr >
354+ <tr >
355+ <th rowspan="4" scope="rowgroup"><b>xAI Grok-3</b></th>
356+ <th style="padding-left: 0"><b>Requests per minute</b></th>
357+ <td>1</td>
358+ <td>1</td>
359+ <td>2</td>
360+ <td>2</td>
361+ </tr >
362+ <tr >
363+ <th><b>Requests per day</b></th>
364+ <td>15</td>
365+ <td>15</td>
366+ <td>20</td>
367+ <td>30</td>
368+ </tr >
369+ <tr >
370+ <th><b>Tokens per request</b></th>
371+ <td>4000 in, 4000 out</td>
372+ <td>4000 in, 4000 out</td>
373+ <td>4000 in, 8000 out</td>
374+ <td>4000 in, 16000 out</td>
375+ </tr >
376+ <tr >
377+ <th><b>Concurrent requests</b></th>
378+ <td>1</td>
379+ <td>1</td>
380+ <td>1</td>
381+ <td>1</td>
382+ </tr >
383+ <tr >
384+ <th rowspan="4" scope="rowgroup" style="box-shadow: none"><b>xAI Grok-3-Mini</b></th>
385+ <th style="padding-left: 0"><b>Requests per minute</b></th>
386+ <td>2</td>
387+ <td>2</td>
388+ <td>3</td>
389+ <td>3</td>
390+ </tr >
391+ <tr >
392+ <th><b>Requests per day</b></th>
393+ <td>30</td>
394+ <td>30</td>
395+ <td>40</td>
396+ <td>50</td>
397+ </tr >
398+ <tr >
399+ <th><b>Tokens per request</b></th>
400+ <td>4000 in, 8000 out</td>
401+ <td>4000 in, 8000 out</td>
402+ <td>4000 in, 12000 out</td>
403+ <td>4000 in, 12000 out</td>
404+ </tr >
405+ <tr >
406+ <th><b>Concurrent requests</b></th>
407+ <td>1</td>
408+ <td>1</td>
409+ <td>1</td>
410+ <td>1</td>
411+ </tr >
354412</table >
355413
356414These limits are subject to change without notice.
0 commit comments