-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathDockerfile.eval
More file actions
42 lines (31 loc) · 1.26 KB
/
Dockerfile.eval
File metadata and controls
42 lines (31 loc) · 1.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
# Dockerfile.eval — Standalone CSB Eval Kit
#
# Build: docker build -f Dockerfile.eval -t csb-eval .
# Run: docker run --rm csb-eval --suite quick --agent-command 'echo placeholder'
#
# This image packages the CSB CLI, CSB-Quick tasks, schemas, and observatory
# data so users can evaluate agents without Daytona, Harbor, or Sourcegraph.
FROM python:3.11-slim

# OCI metadata describing the image and where its source lives.
LABEL org.opencontainers.image.title="csb-eval" \
      org.opencontainers.image.description="CodeScaleBench standalone eval kit — run CSB-Quick benchmarks against any agent command" \
      org.opencontainers.image.version="1.0.0" \
      org.opencontainers.image.source="https://github.com/sourcegraph/CodeScaleBench"

# All COPY destinations and the relative ENTRYPOINT path below resolve
# against this directory.
WORKDIR /app

# Install minimal Python dependencies.
# The requirement is bounded to the 4.x series so a future major release of
# jsonschema cannot silently change the image; quoted because '>' and '<'
# are shell redirection operators.
RUN pip install --no-cache-dir "jsonschema>=4,<5"

# Copy the CLI entrypoint and mark it executable in the same layer
# (replaces a separate `RUN chmod +x`, which added an extra layer).
COPY --chmod=755 csb ./csb

# Copy the core library
COPY lib/ ./lib/

# Copy evaluation scripts
COPY scripts/evaluation/ ./scripts/evaluation/

# Copy the quick-suite manifest
COPY configs/csb_quick.json ./configs/csb_quick.json

# Copy JSON schemas for validation
COPY schemas/ ./schemas/

# Copy observatory (taxonomy, annotation schema, exemplars)
COPY observatory/ ./observatory/

# NOTE(review): no USER is set, so the container runs as root. Consider a
# dedicated non-root user once it is confirmed that `csb eval` and typical
# agent commands do not need root or root-owned bind mounts — TODO confirm.

# Default entrypoint: csb eval
# Exec form: arguments given to `docker run` replace CMD and are appended
# after "eval"; with no arguments the default CMD passes --help.
ENTRYPOINT ["python3", "csb", "eval"]
CMD ["--help"]