#!/bin/bash
#
# eval_infer.sh
#
# Runs ./get_agent_report.sh inside the eval-swe-bench Docker image against a
# single output file, then copies the evaluation logs and the generated
# outputs from the container into the directory that holds that file.
#
# Usage:
#   ./eval_infer.sh <output_file>
#
# Arguments:
#   $1 - path to an existing regular file; its parent directory is mounted
#        into the container at /swe_bench_output.
#
# Side effects (on the host):
#   <dir of output_file>/eval_logs         created, receives the eval logs
#   <dir of output_file>/swe_bench_format  created, receives the outputs
#
# Exit status:
#   1 when the argument is missing or is not a regular file; otherwise the
#   status of the first failing command (or of `docker run`).

set -euo pipefail

# Settings forwarded to get_agent_report.sh. EXPERIMENT_NAME also selects the
# eval_logs sub-directory that is copied back, so it is defined only once.
readonly DOCKER_IMAGE='ghcr.io/opendevin/eval-swe-bench:full-v1.2.1'
readonly AGENT_NAME='CodeActAgent'
readonly DATASET='swe-bench-test-lite'
readonly EXPERIMENT_NAME='test_experiment'

# Script executed by bash inside the container. It is single-quoted so the
# host shell expands nothing; the values arrive as positional parameters
# ($1 file name, $2 agent, $3 dataset, $4 experiment), which means a file name
# containing spaces or shell metacharacters is never parsed as code.
readonly CONTAINER_SCRIPT='
./get_agent_report.sh --output-file "/swe_bench_output/$1" \
  --agent-name "$2" \
  --dataset "$3" \
  --experiment-name "$4" \
  --merge-report \
&& cp -r "/swe_util/eval_data/eval_logs/$4/"* /swe_bench_output/eval_logs \
&& cp -r /swe_util/eval_data/outputs/* /swe_bench_output/swe_bench_format/
'

# ${1:-} keeps `set -u` from aborting before the usage message can be shown.
PROCESS_FILEPATH=${1:-}

if [[ -z "$PROCESS_FILEPATH" ]]; then
  echo "Error: PROCESS_FILEPATH is empty. Usage: ./eval_infer.sh <output_file>" >&2
  exit 1
fi

if [[ ! -f "$PROCESS_FILEPATH" ]]; then
  echo "Error: $PROCESS_FILEPATH is not a file" >&2
  exit 1
fi

# Resolve to an absolute path: `docker run -v` needs an absolute host path for
# a bind mount. `--` protects against a relative name that starts with '-'.
PROCESS_FILEPATH=$(realpath -- "$PROCESS_FILEPATH")
FILE_DIR=$(dirname -- "$PROCESS_FILEPATH")
FILE_NAME=$(basename -- "$PROCESS_FILEPATH")

# Destination directories for the two `cp -r` steps run in the container.
mkdir -p -- "$FILE_DIR/eval_logs" "$FILE_DIR/swe_bench_format"

echo "Evaluating $FILE_NAME @ $FILE_DIR"
echo "Merged output file with fine-grained report will be saved to $FILE_DIR"

# The trailing arguments after the script become $0 ("eval_infer") and $1..$4
# of the in-container shell.
docker run --rm \
  -v "$FILE_DIR:/swe_bench_output" \
  -e MINICONDA3=/swe_util/miniforge3 \
  -e OD_SWE_BENCH=/swe_util/OD-SWE-bench \
  -e EVAL_DATA_DIR=/swe_util/eval_data \
  -w /swe_util \
  "$DOCKER_IMAGE" \
  bash -c "$CONTAINER_SCRIPT" eval_infer \
  "$FILE_NAME" "$AGENT_NAME" "$DATASET" "$EXPERIMENT_NAME"