File tree Expand file tree Collapse file tree 1 file changed +16
-16
lines changed
Expand file tree Collapse file tree 1 file changed +16
-16
lines changed Original file line number Diff line number Diff line change @@ -337,25 +337,25 @@ <h2 id="results">Results</h2>
337337 < thead >
338338 < tr >
339339 < th > < strong > Agent</ strong > </ th >
340- < th > < strong > MDL ratio </ strong > </ th >
341- < th > < strong > Pass rate </ strong > </ th >
340+ < th > < strong > Pass rate (%) </ strong > </ th >
341+ < th > < strong > MDL ratio (%) </ strong > </ th >
342342 </ tr >
343343 </ thead >
344344 < tbody >
345345 < tr >
346346 < td > original</ td >
347- < td > 1.0 </ td >
348- < td > 1.0 </ td >
347+ < td > 100 </ td >
348+ < td > 100 </ td >
349349 </ tr >
350350 < tr >
351- < td > Cl-Cl </ td >
352- < td > 5.14 </ td >
353- < td > 0.78 </ td >
351+ < td > Claude Sonnet 3.7 planner, Claude Sonnet 3.7 implementer </ td >
352+ < td > 78 </ td >
353+ < td > 514 </ td >
354354 </ tr >
355355 < tr >
356- < td > Cl-Cx </ td >
357- < td > 2.44 </ td >
358- < td > 0.8 </ td >
356+ < td > Claude Sonnet 3.7 planner, o4-mini implementer </ td >
357+ < td > 80 </ td >
358+ < td > 244 </ td >
359359 </ tr >
360360 </ tbody >
361361 </ table >
@@ -367,8 +367,8 @@ <h2 id="results">Results</h2>
367367 < thead >
368368 < tr >
369369 < th > < strong > Agent</ strong > </ th >
370- < th > < strong > MDL % </ strong > </ th >
371- < th > < strong > Pass % </ strong > </ th >
370+ < th > < strong > Pass Rate (%) </ strong > </ th >
371+ < th > < strong > MDL Ratio (%) </ strong > </ th >
372372 </ tr >
373373 </ thead >
374374 < tbody >
@@ -378,14 +378,14 @@ <h2 id="results">Results</h2>
378378 < td > 100</ td >
379379 </ tr >
380380 < tr >
381- < td > sonnet 3.7</ td >
382- < td > 152</ td >
381+ < td > Claude Sonnet 3.7</ td >
383382 < td > 84.3</ td >
383+ < td > 152</ td >
384384 </ tr >
385385 < tr >
386- < td > sonnet 4</ td >
387- < td > 143.3</ td >
386+ < td > Claude Sonnet 4</ td >
388387 < td > 88.3</ td >
388+ < td > 143.3</ td >
389389 </ tr >
390390 </ tbody >
391391 </ table >
You can’t perform that action at this time.
0 commit comments