#!/bin/bash
#
# Prepare the SWE-bench evaluation workspace.
#
# Steps:
#   1. Clone the OpenHands fork of SWE-bench (branch "eval") into
#      $EVAL_WORKSPACE/OH-SWE-bench, unless a checkout is already there.
#   2. Run that repo's swebench/harness/prepare_data.sh inside the eval Docker
#      image and move the produced eval_data directory to
#      $EVAL_WORKSPACE/eval_data.
#
# Requires: git, docker, realpath.
# EVAL_WORKSPACE is a relative path, so it is resolved against the directory
# the script is invoked from.

set -euo pipefail

EVAL_WORKSPACE="evaluation/benchmarks/swe_bench/eval_workspace"
mkdir -p "$EVAL_WORKSPACE"

# 1. Prepare REPO
echo "==== Prepare SWE-bench repo ===="
OH_SWE_BENCH_REPO_PATH="https://github.com/All-Hands-AI/SWE-bench.git"
OH_SWE_BENCH_REPO_BRANCH="eval"
if [[ -d "$EVAL_WORKSPACE/OH-SWE-bench/.git" ]]; then
  # git clone refuses a non-empty destination, which would abort the script
  # under `set -e` on every re-run; keep the existing checkout instead.
  echo "Reusing existing checkout at $EVAL_WORKSPACE/OH-SWE-bench" >&2
else
  git clone -b "$OH_SWE_BENCH_REPO_BRANCH" "$OH_SWE_BENCH_REPO_PATH" \
    "$EVAL_WORKSPACE/OH-SWE-bench"
fi

# 2. Prepare DATA
echo "==== Prepare SWE-bench data ===="
EVAL_IMAGE=ghcr.io/all-hands-ai/eval-swe-bench:builder_with_conda
# Docker bind mounts need an absolute host path.
EVAL_WORKSPACE=$(realpath "$EVAL_WORKSPACE")
chmod +x "$EVAL_WORKSPACE/OH-SWE-bench/swebench/harness/prepare_data.sh"

# Drop any previous result first: otherwise the `mv` inside the container
# would nest the new directory inside the old one (or fail).
if [[ -d "$EVAL_WORKSPACE/eval_data" ]]; then
  rm -r -- "${EVAL_WORKSPACE:?}/eval_data"
fi

docker_args=(
  -v "$EVAL_WORKSPACE:/workspace"
  -w /workspace
  # Run as the invoking user so files created in the mount stay owned by them.
  -u "$(id -u):$(id -g)"
  -e HF_DATASETS_CACHE="/tmp"
  --rm
)
# `docker run -t` errors out when stdin is not a terminal (CI, pipes), so only
# request an interactive TTY when one is actually attached.
if [[ -t 0 ]]; then
  docker_args+=(-it)
fi

docker run "${docker_args[@]}" "$EVAL_IMAGE" \
  bash -c "cd OH-SWE-bench/swebench/harness && /swe_util/miniforge3/bin/conda run -n swe-bench-eval ./prepare_data.sh && mv eval_data /workspace/"