Skip to content

Commit f3657e6

Browse files
committed
chore: rehost swebench pro images to ghcr and update dockerfiles
1 parent 63c9ec4 commit f3657e6

File tree

33 files changed

+3493
-16
lines changed

33 files changed

+3493
-16
lines changed

benchmarks/csb_sdlc_fix/element-web-roomheaderbuttons-can-crash-fix-001/environment/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# SWE-bench Pro Task Environment
22
# Repo: element-hq/element-web
33

4-
FROM jefzda/sweap-images:element-hq.element-element-hq__element-web-ee13e23b156fbad9369d6a656c827b6444343d4f
4+
FROM ghcr.io/sg-evals/sweap-images:element-hq.element-element-hq__element-web-ee13e23b156fbad9369d6a656c827b6444343d4f
55

66
# Install uv for Python package management
77
RUN curl -LsSf https://astral.sh/uv/0.7.13/install.sh 2>/dev/null | sh || true

benchmarks/csb_sdlc_fix/element-web-roomheaderbuttons-can-crash-fix-001/environment/Dockerfile.sg_only

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# SWE-bench Pro Task Environment (Sourcegraph-only mode)
22
# Repo: element-hq/element-web
33

4-
FROM jefzda/sweap-images:element-hq.element-element-hq__element-web-ee13e23b156fbad9369d6a656c827b6444343d4f
4+
FROM ghcr.io/sg-evals/sweap-images:element-hq.element-element-hq__element-web-ee13e23b156fbad9369d6a656c827b6444343d4f
55

66
RUN curl -LsSf https://astral.sh/uv/0.7.13/install.sh 2>/dev/null | sh || true
77
RUN mkdir -p /logs /workspace
Lines changed: 77 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,77 @@
1+
{
2+
"files": [
3+
"src/components/views/right_panel/RoomHeaderButtons.tsx",
4+
"src/components/views/right_panel/PinnedMessagesCard.tsx",
5+
"src/settings/SettingsStore.ts",
6+
"src/stores/notifications/ThreadsRoomNotificationState.ts",
7+
"src/stores/notifications/NotificationColor.ts",
8+
"src/stores/right-panel/RightPanelStore.ts"
9+
],
10+
"symbols": [
11+
{
12+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
13+
"symbol": "RoomHeaderButtons",
14+
"repo": null
15+
},
16+
{
17+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
18+
"symbol": "PinnedMessagesHeaderButton",
19+
"repo": null
20+
},
21+
{
22+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
23+
"symbol": "threadNotificationState",
24+
"repo": null
25+
},
26+
{
27+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
28+
"symbol": "onNotificationUpdate",
29+
"repo": null
30+
},
31+
{
32+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
33+
"symbol": "notificationColor",
34+
"repo": null
35+
},
36+
{
37+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
38+
"symbol": "onThreadsPanelClicked",
39+
"repo": null
40+
},
41+
{
42+
"file": "src/components/views/right_panel/RoomHeaderButtons.tsx",
43+
"symbol": "renderButtons",
44+
"repo": null
45+
},
46+
{
47+
"file": "src/components/views/right_panel/PinnedMessagesCard.tsx",
48+
"symbol": "usePinnedEvents",
49+
"repo": null
50+
},
51+
{
52+
"file": "src/components/views/right_panel/PinnedMessagesCard.tsx",
53+
"symbol": "useReadPinnedEvents",
54+
"repo": null
55+
},
56+
{
57+
"file": "src/stores/notifications/NotificationColor.ts",
58+
"symbol": "NotificationColor",
59+
"repo": null
60+
},
61+
{
62+
"file": "src/stores/notifications/ThreadsRoomNotificationState.ts",
63+
"symbol": "ThreadsRoomNotificationState",
64+
"repo": null
65+
},
66+
{
67+
"file": "src/settings/SettingsStore.ts",
68+
"symbol": "SettingsStore",
69+
"repo": null
70+
},
71+
{
72+
"file": "src/stores/right-panel/RightPanelStore.ts",
73+
"symbol": "RightPanelStore",
74+
"repo": null
75+
}
76+
]
77+
}
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
{
2+
"has_ground_truth": true,
3+
"has_chunk_ground_truth": false,
4+
"ground_truth_source": "curator_agent",
5+
"ground_truth_confidence": "medium",
6+
"task_name": "element-web-roomheaderbuttons-can-crash-fix-001",
7+
"curator_agent_version": "2.0",
8+
"model": "claude-opus-4-6",
9+
"backend": "hybrid",
10+
"timestamp": "2026-03-03T15:30:39.213642+00:00",
11+
"files_count": 6,
12+
"edit_files_count": 0,
13+
"chunks_count": 0,
14+
"symbols_count": 13,
15+
"cost_usd": 0.8203,
16+
"elapsed_sec": 149.8,
17+
"exploration_notes": "The bug fix is concentrated in a single file: `src/components/views/right_panel/RoomHeaderButtons.tsx`. The patch makes 7 changes: (1) removes `useSettingValue` import, (2) changes `PinnedMessagesHeaderButton` to call `usePinnedEvents(room)` and `useReadPinnedEvents(room)` directly without `feature_pinning` gating, (3) types `threadNotificationState` as `ThreadsRoomNotificationState | null`, (4) guards constructor assignment with `this.props.room` check and falls back to `null`, (5) uses optiona"
18+
}

benchmarks/csb_sdlc_fix/element-web-unread-indicators-diverge-fix-001/environment/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# SWE-bench Pro Task Environment
22
# Repo: element-hq/element-web
33

4-
FROM jefzda/sweap-images:element-hq.element-element-hq__element-web-dae13ac8522fc6d41e64d1ac6e3174486fdcce0c
4+
FROM ghcr.io/sg-evals/sweap-images:element-hq.element-element-hq__element-web-dae13ac8522fc6d41e64d1ac6e3174486fdcce0c
55

66
# Install uv for Python package management
77
RUN curl -LsSf https://astral.sh/uv/0.7.13/install.sh 2>/dev/null | sh || true

benchmarks/csb_sdlc_fix/element-web-unread-indicators-diverge-fix-001/environment/Dockerfile.sg_only

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# SWE-bench Pro Task Environment (Sourcegraph-only mode)
22
# Repo: element-hq/element-web
33

4-
FROM jefzda/sweap-images:element-hq.element-element-hq__element-web-dae13ac8522fc6d41e64d1ac6e3174486fdcce0c
4+
FROM ghcr.io/sg-evals/sweap-images:element-hq.element-element-hq__element-web-dae13ac8522fc6d41e64d1ac6e3174486fdcce0c
55

66
RUN curl -LsSf https://astral.sh/uv/0.7.13/install.sh 2>/dev/null | sh || true
77
RUN mkdir -p /logs /workspace
Lines changed: 53 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
{
2+
"files": [
3+
"apps/web/src/Unread.ts",
4+
"apps/web/src/RoomNotifs.ts"
5+
],
6+
"symbols": [
7+
{
8+
"file": "apps/web/src/Unread.ts",
9+
"symbol": "doesTimelineHaveUnreadMessages",
10+
"repo": null
11+
},
12+
{
13+
"file": "apps/web/src/Unread.ts",
14+
"symbol": "doesRoomHaveUnreadMessages",
15+
"repo": null
16+
},
17+
{
18+
"file": "apps/web/src/Unread.ts",
19+
"symbol": "doesRoomHaveUnreadThreads",
20+
"repo": null
21+
},
22+
{
23+
"file": "apps/web/src/Unread.ts",
24+
"symbol": "doesRoomOrThreadHaveUnreadMessages",
25+
"repo": null
26+
},
27+
{
28+
"file": "apps/web/src/Unread.ts",
29+
"symbol": "eventTriggersUnreadCount",
30+
"repo": null
31+
},
32+
{
33+
"file": "apps/web/src/Unread.ts",
34+
"symbol": "findLatestImportantEvent",
35+
"repo": null
36+
},
37+
{
38+
"file": "apps/web/src/Unread.ts",
39+
"symbol": "isImportantEvent",
40+
"repo": null
41+
},
42+
{
43+
"file": "apps/web/src/RoomNotifs.ts",
44+
"symbol": "determineUnreadState",
45+
"repo": null
46+
},
47+
{
48+
"file": "apps/web/src/RoomNotifs.ts",
49+
"symbol": "getUnreadNotificationCount",
50+
"repo": null
51+
}
52+
]
53+
}
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
{
2+
"has_ground_truth": true,
3+
"has_chunk_ground_truth": false,
4+
"ground_truth_source": "curator_agent",
5+
"ground_truth_confidence": "medium",
6+
"task_name": "element-web-unread-indicators-diverge-fix-001",
7+
"curator_agent_version": "2.0",
8+
"model": "claude-opus-4-6",
9+
"backend": "hybrid",
10+
"timestamp": "2026-03-03T15:38:54.760588+00:00",
11+
"files_count": 2,
12+
"edit_files_count": 0,
13+
"chunks_count": 0,
14+
"symbols_count": 9,
15+
"cost_usd": 2.8565,
16+
"elapsed_sec": 495.5,
17+
"exploration_notes": "The bug centers on apps/web/src/Unread.ts, specifically the doesTimelineHaveUnreadMessages function. Three issues were identified and fixed: (1) Thread-scoped receipts ignored: the function always called room.hasUserReadEvent() even for thread timelines, bypassing Thread.hasUserReadEvent() which has special logic for thread-scoped and unthreaded receipt comparisons. Fixed by adding a receiptSource parameter (Room | Thread) and passing the correct Thread/Room through all callers (doesRoomHaveUnre"
18+
}
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
{
2+
"files": [
3+
"source/common/upstream/upstream_impl.cc",
4+
"source/extensions/clusters/dynamic_forward_proxy/cluster.cc",
5+
"source/extensions/clusters/dynamic_forward_proxy/cluster.h",
6+
"test/extensions/clusters/dynamic_forward_proxy/cluster_test.cc"
7+
],
8+
"symbols": [
9+
{
10+
"file": "source/extensions/clusters/dynamic_forward_proxy/cluster.cc",
11+
"symbol": "addOrUpdateHost",
12+
"repo": null
13+
},
14+
{
15+
"file": "source/extensions/clusters/dynamic_forward_proxy/cluster.cc",
16+
"symbol": "updatePriorityState",
17+
"repo": null
18+
},
19+
{
20+
"file": "source/extensions/clusters/dynamic_forward_proxy/cluster.cc",
21+
"symbol": "onDnsHostAddOrUpdate",
22+
"repo": null
23+
},
24+
{
25+
"file": "source/extensions/clusters/dynamic_forward_proxy/cluster.h",
26+
"symbol": "addOrUpdateHost",
27+
"repo": null
28+
},
29+
{
30+
"file": "source/common/upstream/upstream_impl.cc",
31+
"symbol": "updateCrossPriorityHostMap",
32+
"repo": null
33+
},
34+
{
35+
"file": "source/common/upstream/upstream_impl.cc",
36+
"symbol": "MainPrioritySetImpl",
37+
"repo": null
38+
}
39+
]
40+
}
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
{
2+
"has_ground_truth": true,
3+
"has_chunk_ground_truth": false,
4+
"ground_truth_source": "curator_agent",
5+
"ground_truth_confidence": "medium",
6+
"task_name": "envoy-dfp-host-leak-fix-001",
7+
"curator_agent_version": "2.0",
8+
"model": "claude-opus-4-6",
9+
"backend": "hybrid",
10+
"timestamp": "2026-03-03T15:39:57.773524+00:00",
11+
"files_count": 4,
12+
"edit_files_count": 0,
13+
"chunks_count": 0,
14+
"symbols_count": 6,
15+
"cost_usd": 0.4248,
16+
"elapsed_sec": 63.0,
17+
"exploration_notes": "All 4 files specified in the task confirmed locally. The call chain is: onDnsHostAddOrUpdate() -> addOrUpdateHost() -> updatePriorityState() -> PrioritySetImpl::updateHosts() -> MainPrioritySetImpl::updateCrossPriorityHostMap(). The memory leak is in addOrUpdateHost() which calls setNewAddresses() to update the LogicalHost's IP in-place without removing the old IP from the cross-priority host map maintained in upstream_impl.cc. The fix requires: (1) debug logging in updateCrossPriorityHostMap(),"
18+
}

0 commit comments

Comments
 (0)