Skip to content

Commit 65a84d9

Browse files
refactor: switch to standalone evaluation execution
1 parent 602da9f commit 65a84d9

1 file changed

Lines changed: 4 additions & 16 deletions

File tree

cloudbuild.yaml

Lines changed: 4 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -46,25 +46,13 @@ steps:
46 46   # Substitute environment variables in model_config.yaml
47 47   python3 /workspace/evals/substitute_env.py
48 48
49    - export EVALBENCH_INSECURE=True
50    - export EVALBENCH_HOST=0.0.0.0
51    - cd evalbench
52    - export PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python
53    - export PYTHONPATH=./evalproto:.
54    - export CLOUD_RUN=True
55    - export PORT=50051
56    -
57    - echo "Starting Evaluation Server in background..."
58    - python3 -u ./eval_server.py --localhost </dev/null 2>&1 | tee server.log &
59    -
60    - echo "Waiting for port 50051 to open..."
61    - python3 /workspace/evals/wait_for_port.py || { echo "Server failed to bind port."; exit 1; }
62    -
63    - echo "Server is running. Launching Evaluation Client..."
64 49   cd /evalbench
65 50   export PYTHONPATH=./evalbench:./evalbench/evalproto
   51 + export PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python
   52 +
   53 + echo "Launching Standalone Evaluation..."
   54 + python3 evalbench/evalbench.py --experiment_config=/workspace/evals/run_config.yaml
66 55
67    - python3 evalbench/client/eval_client.py --experiment=/workspace/evals/run_config.yaml --endpoint=local || { echo "Client failed! Server logs:"; cat /evalbench/evalbench/server.log; exit 1; }
68 56
69 57   availableSecrets:
70 58   secretManager:

0 commit comments

Comments (0)