Commit
·
e34be39
1
Parent(s):
1694662
Update README.md
Browse files
README.md
CHANGED
|
@@ -315,7 +315,7 @@ The following tables show the evaluation results of each model, with reasoning a
|
|
| 315 |
<td align="center">64.7</td>
|
| 316 |
</tr>
|
| 317 |
<tr>
|
| 318 |
-
<td >Tau-
|
| 319 |
<td align="center">51.5</td>
|
| 320 |
<td align="center">N/A</td>
|
| 321 |
<td align="center">38.5</td>
|
|
@@ -324,7 +324,7 @@ The following tables show the evaluation results of each model, with reasoning a
|
|
| 324 |
<td align="center">53.5</td>
|
| 325 |
</tr>
|
| 326 |
<tr>
|
| 327 |
-
<td >Tau-
|
| 328 |
<td align="center">62.8</td>
|
| 329 |
<td align="center">N/A</td>
|
| 330 |
<td align="center">10.2</td>
|
|
@@ -390,7 +390,7 @@ The following tables show the evaluation results of each model, with reasoning a
|
|
| 390 |
<th>EXAONE 4.0 32B </th>
|
| 391 |
<th>Phi 4</th>
|
| 392 |
<th>Mistral-Small-2506</th>
|
| 393 |
-
<th>
|
| 394 |
<th>Qwen3 32B </th>
|
| 395 |
<th>Qwen3 235B </th>
|
| 396 |
<th>Llama-4-Maverick</th>
|
|
@@ -689,7 +689,7 @@ The following tables show the evaluation results of each model, with reasoning a
|
|
| 689 |
<th>EXAONE Deep 2.4B</th>
|
| 690 |
<th>Qwen 3 0.6B </th>
|
| 691 |
<th>Qwen 3 1.7B </th>
|
| 692 |
-
<th>
|
| 693 |
</tr>
|
| 694 |
<tr>
|
| 695 |
<td align="center">Model Size</td>
|
|
@@ -869,7 +869,7 @@ The following tables show the evaluation results of each model, with reasoning a
|
|
| 869 |
<th>Qwen 3 0.6B </th>
|
| 870 |
<th>Gemma 3 1B</th>
|
| 871 |
<th>Qwen 3 1.7B </th>
|
| 872 |
-
<th>
|
| 873 |
</tr>
|
| 874 |
<tr>
|
| 875 |
<td align="center">Model Size</td>
|
|
|
|
| 315 |
<td align="center">64.7</td>
|
| 316 |
</tr>
|
| 317 |
<tr>
|
| 318 |
+
<td >Tau-Bench (Airline)</td>
|
| 319 |
<td align="center">51.5</td>
|
| 320 |
<td align="center">N/A</td>
|
| 321 |
<td align="center">38.5</td>
|
|
|
|
| 324 |
<td align="center">53.5</td>
|
| 325 |
</tr>
|
| 326 |
<tr>
|
| 327 |
+
<td >Tau-Bench (Retail)</td>
|
| 328 |
<td align="center">62.8</td>
|
| 329 |
<td align="center">N/A</td>
|
| 330 |
<td align="center">10.2</td>
|
|
|
|
| 390 |
<th>EXAONE 4.0 32B </th>
|
| 391 |
<th>Phi 4</th>
|
| 392 |
<th>Mistral-Small-2506</th>
|
| 393 |
+
<th>Gemma3 27B</th>
|
| 394 |
<th>Qwen3 32B </th>
|
| 395 |
<th>Qwen3 235B </th>
|
| 396 |
<th>Llama-4-Maverick</th>
|
|
|
|
| 689 |
<th>EXAONE Deep 2.4B</th>
|
| 690 |
<th>Qwen 3 0.6B </th>
|
| 691 |
<th>Qwen 3 1.7B </th>
|
| 692 |
+
<th>SmolLM 3 3B </th>
|
| 693 |
</tr>
|
| 694 |
<tr>
|
| 695 |
<td align="center">Model Size</td>
|
|
|
|
| 869 |
<th>Qwen 3 0.6B </th>
|
| 870 |
<th>Gemma 3 1B</th>
|
| 871 |
<th>Qwen 3 1.7B </th>
|
| 872 |
+
<th>SmolLM 3 3B </th>
|
| 873 |
</tr>
|
| 874 |
<tr>
|
| 875 |
<td align="center">Model Size</td>
|