Skip to content

Commit d0afa20

Browse files
sjarmak and claude committed
fix: add python3 to kafka/flipt sg_only Dockerfiles, switch envoy to bookworm
- CSB_REPO_BASE_MAP entries for ccb-repo-kafka-0753c489 and ccb-repo-flipt-3d5a345f were missing python3, causing sgonly_verifier_wrapper.sh to fail (needs python3 for JSON parsing).
- envoy-routeconfig-dep-chain-001 main Dockerfile switched from golang:1.23-alpine to golang:1.23-bookworm for OpenHands compat (apt-get not available on Alpine). sg_only variant was already fixed in c6310bb but main Dockerfile was missed.
- Regenerated all 404 Dockerfile.sg_only + artifact variants.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
1 parent 3f40257 commit d0afa20

File tree

468 files changed

+3836
-2484
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

468 files changed

+3836
-2484
lines changed

benchmarks/csb_org_compliance/ccx-compliance-182/environment/Dockerfile.artifact_only

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-182 — artifact_only variant
1+
# ccx-compliance-182 — artifact_only variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
33
# Agent produces answer.json artifact; verifier scores the artifact.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \
benchmarks/csb_org_compliance/ccx-compliance-182/environment/Dockerfile.sg_only

Lines changed: 11 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-182 — sg_only variant
2-
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
3-
# The verifier clones mirror repos at verification time (no /repo_full/ backup).
1+
# ccx-compliance-182 — sg_only_env variant (v2: clone-at-verify)
2+
# Empty workspace — agent uses Sourcegraph MCP for code access.
3+
# Verifier clones mirror(s) at verification time via clone manifest.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \
@@ -15,23 +16,21 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
1516

1617
WORKDIR /workspace
1718

18-
# Empty workspace — agent discovers code via MCP tools only
19+
# Empty git repo so agent can commit work
1920
RUN git init && \
2021
git config user.email "agent@example.com" && \
21-
git config user.name "Agent" && \
22-
git config --global safe.directory '*'
22+
git config user.name "Agent"
2323

24-
# Create log directories
2524
RUN mkdir -p /logs/agent /logs/verifier
2625

27-
# Mark sg_only mode — verifiers and eval scripts check this flag
26+
# Clone manifest for verifier (clone-at-verify strategy)
27+
RUN echo '{"workdir":"/workspace","repos":[{"mirror":"sg-evals/kubernetes--v1.32.0","target_dir":"kubernetes--v1.32.0"},{"mirror":"sg-evals/client-go--v0.32.0","target_dir":"client-go--v0.32.0"},{"mirror":"sg-evals/api--v0.32.0","target_dir":"api--v0.32.0"},{"mirror":"sg-evals/etcd-io-etcd","target_dir":"etcd-io-etcd"}]}' > /tmp/.sg_only_clone_manifest.json
28+
29+
# Mark sg_only mode
2830
RUN touch /tmp/.sg_only_mode
2931

30-
# Pre-create claude user and set ownership at build time so Harbor's
31-
# runtime chown is a no-op (avoids 15-30 min delay on large repos).
32+
# Pre-create claude user and set ownership at build time.
3233
RUN (adduser --disabled-password --gecos '' claude 2>/dev/null || true) && \
3334
for d in /workspace /app /testbed /logs; do [ -d "$d" ] && chown -R claude:claude "$d"; done || true
3435

35-
ENV SOURCEGRAPH_REPOS=sg-evals/kubernetes--v1.32.0,sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0
36-
3736
ENTRYPOINT []

benchmarks/csb_org_compliance/ccx-compliance-183/environment/Dockerfile.artifact_only

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-183 — artifact_only variant
1+
# ccx-compliance-183 — artifact_only variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
33
# Agent produces answer.json artifact; verifier scores the artifact.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \

benchmarks/csb_org_compliance/ccx-compliance-183/environment/Dockerfile.sg_only

Lines changed: 11 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-183 — sg_only variant
2-
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
3-
# The verifier clones mirror repos at verification time (no /repo_full/ backup).
1+
# ccx-compliance-183 — sg_only_env variant (v2: clone-at-verify)
2+
# Empty workspace — agent uses Sourcegraph MCP for code access.
3+
# Verifier clones mirror(s) at verification time via clone manifest.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \
@@ -15,20 +16,20 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
1516

1617
WORKDIR /workspace
1718

18-
# Empty workspace — agent discovers code via MCP tools only
19+
# Empty git repo so agent can commit work
1920
RUN git init && \
2021
git config user.email "agent@example.com" && \
21-
git config user.name "Agent" && \
22-
git config --global safe.directory '*'
22+
git config user.name "Agent"
2323

24-
# Create log directories
2524
RUN mkdir -p /logs/agent /logs/verifier
2625

27-
# Mark sg_only mode — verifiers and eval scripts check this flag
26+
# Clone manifest for verifier (clone-at-verify strategy)
27+
RUN echo '{"workdir":"/workspace","repos":[{"mirror":"sg-evals/kubernetes--v1.32.0","target_dir":"kubernetes--v1.32.0"},{"mirror":"sg-evals/client-go--v0.32.0","target_dir":"client-go--v0.32.0"},{"mirror":"sg-evals/api--v0.32.0","target_dir":"api--v0.32.0"},{"mirror":"sg-evals/etcd-io-etcd","target_dir":"etcd-io-etcd"}]}' > /tmp/.sg_only_clone_manifest.json
28+
29+
# Mark sg_only mode
2830
RUN touch /tmp/.sg_only_mode
2931

30-
# Pre-create claude user and set ownership at build time so Harbor's
31-
# runtime chown is a no-op (avoids 15-30 min delay on large repos).
32+
# Pre-create claude user and set ownership at build time.
3233
RUN (adduser --disabled-password --gecos '' claude 2>/dev/null || true) && \
3334
for d in /workspace /app /testbed /logs; do [ -d "$d" ] && chown -R claude:claude "$d"; done || true
3435

benchmarks/csb_org_compliance/ccx-compliance-184/environment/Dockerfile.artifact_only

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-184 — artifact_only variant
1+
# ccx-compliance-184 — artifact_only variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
33
# Agent produces answer.json artifact; verifier scores the artifact.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \

benchmarks/csb_org_compliance/ccx-compliance-184/environment/Dockerfile.sg_only

Lines changed: 11 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
1-
# CCX-compliance-184 — sg_only variant
2-
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
3-
# The verifier clones mirror repos at verification time (no /repo_full/ backup).
1+
# ccx-compliance-184 — sg_only_env variant (v2: clone-at-verify)
2+
# Empty workspace — agent uses Sourcegraph MCP for code access.
3+
# Verifier clones mirror(s) at verification time via clone manifest.
44

55
FROM ubuntu:22.04
66

77
ENV DEBIAN_FRONTEND=noninteractive
8+
ENV SOURCEGRAPH_REPOS="sg-evals/api--v0.32.0,sg-evals/client-go--v0.32.0,sg-evals/etcd-io-etcd,sg-evals/kubernetes--v1.32.0"
89

910
RUN apt-get update && apt-get install -y --no-install-recommends \
1011
git \
@@ -15,20 +16,20 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
1516

1617
WORKDIR /workspace
1718

18-
# Empty workspace — agent discovers code via MCP tools only
19+
# Empty git repo so agent can commit work
1920
RUN git init && \
2021
git config user.email "agent@example.com" && \
21-
git config user.name "Agent" && \
22-
git config --global safe.directory '*'
22+
git config user.name "Agent"
2323

24-
# Create log directories
2524
RUN mkdir -p /logs/agent /logs/verifier
2625

27-
# Mark sg_only mode — verifiers and eval scripts check this flag
26+
# Clone manifest for verifier (clone-at-verify strategy)
27+
RUN echo '{"workdir":"/workspace","repos":[{"mirror":"sg-evals/kubernetes--v1.32.0","target_dir":"kubernetes--v1.32.0"},{"mirror":"sg-evals/client-go--v0.32.0","target_dir":"client-go--v0.32.0"},{"mirror":"sg-evals/api--v0.32.0","target_dir":"api--v0.32.0"},{"mirror":"sg-evals/etcd-io-etcd","target_dir":"etcd-io-etcd"}]}' > /tmp/.sg_only_clone_manifest.json
28+
29+
# Mark sg_only mode
2830
RUN touch /tmp/.sg_only_mode
2931

30-
# Pre-create claude user and set ownership at build time so Harbor's
31-
# runtime chown is a no-op (avoids 15-30 min delay on large repos).
32+
# Pre-create claude user and set ownership at build time.
3233
RUN (adduser --disabled-password --gecos '' claude 2>/dev/null || true) && \
3334
for d in /workspace /app /testbed /logs; do [ -d "$d" ] && chown -R claude:claude "$d"; done || true
3435

benchmarks/csb_org_compliance/ccx-compliance-185/environment/Dockerfile.artifact_only

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# CCX-compliance-185 — artifact_only variant
1+
# ccx-compliance-185 — artifact_only variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
33
# Agent produces answer.json artifact; verifier scores the artifact.
44

benchmarks/csb_org_compliance/ccx-compliance-185/environment/Dockerfile.sg_only

Lines changed: 5 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,5 @@
1-
# CCX-compliance-185 — sg_only variant
1+
# ccx-compliance-185 — sg_only_env variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
3-
# The verifier clones mirror repos at verification time (no /repo_full/ backup).
43

54
FROM ubuntu:22.04
65

@@ -15,20 +14,17 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
1514

1615
WORKDIR /workspace
1716

18-
# Empty workspace — agent discovers code via MCP tools only
17+
# Empty git repo so agent can commit work
1918
RUN git init && \
2019
git config user.email "agent@example.com" && \
21-
git config user.name "Agent" && \
22-
git config --global safe.directory '*'
20+
git config user.name "Agent"
2321

24-
# Create log directories
2522
RUN mkdir -p /logs/agent /logs/verifier
2623

27-
# Mark sg_only mode verifiers and eval scripts check this flag
24+
# Mark sg_only mode so verifiers can skip local-path checks
2825
RUN touch /tmp/.sg_only_mode
2926

30-
# Pre-create claude user and set ownership at build time so Harbor's
31-
# runtime chown is a no-op (avoids 15-30 min delay on large repos).
27+
# Pre-create claude user and set ownership at build time.
3228
RUN (adduser --disabled-password --gecos '' claude 2>/dev/null || true) && \
3329
for d in /workspace /app /testbed /logs; do [ -d "$d" ] && chown -R claude:claude "$d"; done || true
3430

benchmarks/csb_org_compliance/ccx-compliance-186/environment/Dockerfile.artifact_only

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# CCX-compliance-186 — artifact_only variant
1+
# ccx-compliance-186 — artifact_only variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
33
# Agent produces answer.json artifact; verifier scores the artifact.
44

benchmarks/csb_org_compliance/ccx-compliance-186/environment/Dockerfile.sg_only

Lines changed: 5 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,5 @@
1-
# CCX-compliance-186 — sg_only variant
1+
# ccx-compliance-186 — sg_only_env variant
22
# No local repo clone — agent uses Sourcegraph MCP exclusively for code access.
3-
# The verifier clones mirror repos at verification time (no /repo_full/ backup).
43

54
FROM ubuntu:22.04
65

@@ -15,20 +14,17 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
1514

1615
WORKDIR /workspace
1716

18-
# Empty workspace — agent discovers code via MCP tools only
17+
# Empty git repo so agent can commit work
1918
RUN git init && \
2019
git config user.email "agent@example.com" && \
21-
git config user.name "Agent" && \
22-
git config --global safe.directory '*'
20+
git config user.name "Agent"
2321

24-
# Create log directories
2522
RUN mkdir -p /logs/agent /logs/verifier
2623

27-
# Mark sg_only mode verifiers and eval scripts check this flag
24+
# Mark sg_only mode so verifiers can skip local-path checks
2825
RUN touch /tmp/.sg_only_mode
2926

30-
# Pre-create claude user and set ownership at build time so Harbor's
31-
# runtime chown is a no-op (avoids 15-30 min delay on large repos).
27+
# Pre-create claude user and set ownership at build time.
3228
RUN (adduser --disabled-password --gecos '' claude 2>/dev/null || true) && \
3329
for d in /workspace /app /testbed /logs; do [ -d "$d" ] && chown -R claude:claude "$d"; done || true
3430

0 commit comments

Comments
 (0)