#!/bin/bash
set -euo pipefail

# Automated eval scorer
# Usage: ./score-eval.sh <results-dir>
#
# Reads the manifest rubric, session JSONL, and test output to
# automatically score each variant. No interactive input needed.
#
# This wrapper only validates <results-dir> and then hands control to
# score.py, which is expected to sit in the same directory as this script.

# Absolute path of the directory containing this script, so score.py is
# located independently of the caller's working directory. The `--` guards
# against a script path that begins with a dash being parsed as an option.
EVAL_DIR="$(cd -- "$(dirname -- "$0")" && pwd)"

# The first positional argument is mandatory: ${1:?...} prints the usage text
# to stderr and aborts the script when it is unset or empty.
RESULTS_DIR="${1:?Usage: $0 <results-dir>}"

# Fail early, with the diagnostic on stderr and exit status 1, when the
# results directory does not exist (or is not a directory).
if [[ ! -d "$RESULTS_DIR" ]]; then
  printf 'ERROR: %s not found\n' "$RESULTS_DIR" >&2
  exit 1
fi

# Replace this shell with the Python scorer; its exit status becomes the
# exit status of this script.
exec python3 "$EVAL_DIR/score.py" "$RESULTS_DIR"