@@ -421,22 +421,13 @@ <h2 id="leaderboard-lite">Leaderboard (lite)</h2>
421421< tr >
422422< td > OpenHands (subset of < code > all</ code > )</ td >
423423< td style ="text-align: center; "> 2</ td >
424- < td style ="text-align: center; "> 88.67 %</ td >
425- < td style ="text-align: center; "> 408.27 </ td >
424+ < td style ="text-align: center; "> 42.95 %</ td >
425+ < td style ="text-align: center; "> 116.76 </ td >
426426< td style ="text-align: center; "> 11/25/2024</ td >
427427< td > < a href ="/analysis_openhands-commit0_openhands "> Analysis</ a > </ td >
428428< td > < a href ="https://github.com/openhands-commit0 "> Github</ a > </ td >
429429</ tr >
430430< tr >
431- < td > Claude Sonnet 3.5 - Fill-in (subset of < code > all</ code > )</ td >
432- < td style ="text-align: center; "> 0</ td >
433- < td style ="text-align: center; "> 19.13%</ td >
434- < td style ="text-align: center; "> 629.19</ td >
435- < td style ="text-align: center; "> 09/25/2024</ td >
436- < td > < a href ="/analysis_commit0-all-plain_fillin "> Analysis</ a > </ td >
437- < td > < a href ="https://github.com/commit0-all-plain "> Github</ a > </ td >
438- </ tr >
439- < tr >
440431< td > Claude Sonnet 3.5 - Fill-in + Unit Test Feedback</ td >
441432< td style ="text-align: center; "> 0</ td >
442433< td style ="text-align: center; "> 17.06%</ td >
@@ -446,6 +437,15 @@ <h2 id="leaderboard-lite">Leaderboard (lite)</h2>
446437< td > < a href ="https://github.com/commit0-lite-with-test "> Github</ a > </ td >
447438</ tr >
448439< tr >
440+ < td > Claude Sonnet 3.5 - Fill-in (subset of < code > all</ code > )</ td >
441+ < td style ="text-align: center; "> 0</ td >
442+ < td style ="text-align: center; "> 12.35%</ td >
443+ < td style ="text-align: center; "> 64.49</ td >
444+ < td style ="text-align: center; "> 09/25/2024</ td >
445+ < td > < a href ="/analysis_commit0-all-plain_fillin "> Analysis</ a > </ td >
446+ < td > < a href ="https://github.com/commit0-all-plain "> Github</ a > </ td >
447+ </ tr >
448+ < tr >
449449< td > Claude Sonnet 3.5 - Fill-in</ td >
450450< td style ="text-align: center; "> 0</ td >
451451< td style ="text-align: center; "> 10.50%</ td >
@@ -466,8 +466,8 @@ <h2 id="leaderboard-lite">Leaderboard (lite)</h2>
466466< tr >
467467< td > SWE-Agent (subset of < code > all</ code > )</ td >
468468< td style ="text-align: center; "> 0</ td >
469- < td style ="text-align: center; "> 9.10 %</ td >
470- < td style ="text-align: center; "> 62.35 </ td >
469+ < td style ="text-align: center; "> 7.83 %</ td >
470+ < td style ="text-align: center; "> 17.96 </ td >
471471< td style ="text-align: center; "> 11/26/2024</ td >
472472< td > < a href ="/analysis_sweagent-commit0_sweagent "> Analysis</ a > </ td >
473473< td > < a href ="https://github.com/sweagent-commit0 "> Github</ a > </ td >
@@ -500,7 +500,7 @@ <h2 id="leaderboard-all">Leaderboard (all)</h2>
500500< tr >
501501< td > OpenHands</ td >
502502< td style ="text-align: center; "> 2</ td >
503- < td style ="text-align: center; "> 2.28 %</ td >
503+ < td style ="text-align: center; "> 15.25 %</ td >
504504< td style ="text-align: center; "> 408.27</ td >
505505< td style ="text-align: center; "> 11/25/2024</ td >
506506< td > < a href ="/analysis_openhands-commit0_openhands "> Analysis</ a > </ td >
0 commit comments