diff --git a/css/styles.css b/css/styles.css index fd1aba1..d800146 100644 --- a/css/styles.css +++ b/css/styles.css @@ -311,7 +311,6 @@ tr { text-align: left; position: sticky; top: 0; - z-index: 3; background-color: var(--even_line_color); } @@ -343,7 +342,6 @@ tr { .sticky-header-content { position: sticky; top: 0; - z-index: 3; padding: 6px 0px; /* Adjusted padding */ /* box-sizing: border-box; */ background-color: var(--even_line_color); diff --git a/index.html b/index.html index 45f714c..b094ff2 100644 --- a/index.html +++ b/index.html @@ -517,6 +517,39 @@

Leaderboard (Lite)

🥇 + Alibaba Lingma Agent +

+ +

33.00

+

2024-06-22

+ +

+ + 🔗 + +

+ + +

+ - +

+ + +

+ + 🔗 + +

+ +

✘

+

✘

+ + + + +

+ 🥈 + Factory Code Droid

@@ -548,7 +581,39 @@

Leaderboard (Lite)

- 🥈 + 🥉 + + AutoCodeRover (v20240620) + GPT 4o (2024-05-13) +

+ +

30.67

+

2024-06-21

+ +

+ + 🔗 + +

+ + +

+ - +

+ + +

+ + 🔗 + +

+ +

✘

+

✘

+ + + + +

CodeR + GPT 4 (1106)

@@ -581,7 +646,6 @@

Leaderboard (Lite)

- 🥉 MASAI + GPT 4o (2024-05-13)

@@ -643,6 +707,40 @@

Leaderboard (Lite)

✘

+ + +

+ + Moatless Tools + Claude 3.5 Sonnet +

+ +

26.67

+

2024-06-23

+ +

+ + 🔗 + +

+ + +

+ + 🔗 + +

+ + +

+ + 🔗 + +

+ +

✓

+

✓

+ +

diff --git a/template/data.json b/template/data.json index 1631585..5f9b129 100644 --- a/template/data.json +++ b/template/data.json @@ -91,6 +91,13 @@ } ], "lite_leaderboard": [ + { + "name": "Alibaba Lingma Agent", + "resolved": "33.00", + "date": "2024-06-22", + "logs": "lite/20240622_Lingma_Agent/logs", + "site": "https://arxiv.org/abs/2406.01422" + }, { "name": "Factory Code Droid", "resolved": "31.33", @@ -98,6 +105,13 @@ "logs": "lite/20240617_factory_code_droid/logs", "site": "https://www.factory.ai/" }, + { + "name": "AutoCodeRover (v20240620) + GPT 4o (2024-05-13)", + "resolved": "30.67", + "date": "2024-06-21", + "logs": "lite/20240621_autocoderover-v20240620/logs", + "site": "https://autocoderover.dev/" + }, { "name": "CodeR + GPT 4 (1106)", "resolved": "28.33", @@ -119,6 +133,16 @@ "logs": "lite/20240612_IBM_Research_Agent101/logs", "site": "https://github.com/swe-bench/experiments/tree/main/evaluation/lite/20240612_IBM_Research_Agent101" }, + { + "name": "Moatless Tools + Claude 3.5 Sonnet", + "resolved": "26.67", + "date": "2024-06-23", + "logs": "lite/20240623_moatless_claude35sonnet/logs", + "trajs": "lite/20240623_moatless_claude35sonnet/trajs", + "site": "https://github.com/aorwall/moatless-tools", + "verified": true, + "oss": true + }, { "name": "Aider + GPT 4o & Claude 3 Opus", "resolved": "26.33", diff --git a/viewer.html b/viewer.html index 5f069fb..1f99c45 100644 --- a/viewer.html +++ b/viewer.html @@ -99,6 +99,9 @@

SWE-bench Analysis

+ + +