-
Notifications
You must be signed in to change notification settings - Fork 213
Expand file tree
/
Copy pathDockerfile
More file actions
36 lines (28 loc) · 886 Bytes
/
Dockerfile
File metadata and controls
36 lines (28 loc) · 886 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# Docker container for MRR Benchmark execution
# Provides isolated, reproducible environment for benchmark runs
# Base image: Debian-based slim Python 3.10
FROM python:3.10-slim
# Install system dependencies (C/C++ toolchain, curl, git).
# --no-install-recommends stops apt from pulling in optional "recommended"
# packages, keeping the image small. ca-certificates is listed explicitly so
# HTTPS access from git/curl does not depend on it arriving as a recommendation.
# The apt package lists are removed in the same RUN so they never persist
# in an image layer.
RUN apt-get update && apt-get install -y --no-install-recommends \
    build-essential \
    ca-certificates \
    curl \
    git \
    && rm -rf /var/lib/apt/lists/*
# All following relative paths resolve against /benchmark
WORKDIR /benchmark
# Install Python dependencies before copying the source tree, so this layer
# is rebuilt only when requirements.txt itself changes
COPY requirements.txt ./
RUN pip install -r requirements.txt --no-cache-dir
# Bring in the rest of the build context (benchmark code)
COPY . ./
# Ensure the results directory exists (resolves to /benchmark/results)
RUN mkdir -p results
# Runtime environment variables.
# PYTHONUNBUFFERED=1 makes Python write stdout/stderr unbuffered so log output
# appears immediately. BENCHMARK_SEED and BENCHMARK_MODEL are the defaults
# consumed by the command below; override them with `docker run -e NAME=value`.
ENV PYTHONUNBUFFERED=1 \
    BENCHMARK_SEED=42 \
    BENCHMARK_MODEL=claude_4_opus
# Default command runs the benchmark.
# Exec-form (JSON array) CMD performs no variable substitution, so passing
# "${BENCHMARK_MODEL}" as an array element would hand the literal text to the
# script. A shell is invoked explicitly to expand the variables at container
# start, and `exec` replaces that shell with the Python process so it receives
# signals (e.g. SIGTERM from `docker stop`) directly.
CMD ["/bin/sh", "-c", "exec python run_full_mrr_benchmark.py --model \"$BENCHMARK_MODEL\" --scenarios 5000 --seed \"$BENCHMARK_SEED\" --output-dir /benchmark/results"]