Update nohup evaluator defaults for faster resumable batched generation
Browse files
- scripts/nohup_eval.sh +12 -2
scripts/nohup_eval.sh
CHANGED
|
@@ -2,8 +2,9 @@
|
|
| 2 |
set -euo pipefail
|
| 3 |
|
| 4 |
# Evaluate a completed or checkpointed run under nohup.
|
|
|
|
| 5 |
# Usage:
|
| 6 |
-
# bash scripts/nohup_eval.sh runs/qwen3-8b-qlora-YYYYMMDD-HHMMSS [adapter_path]
|
| 7 |
|
| 8 |
if [ $# -lt 1 ]; then
|
| 9 |
echo "Usage: $0 <RUN_DIR> [ADAPTER_PATH]" >&2
|
|
@@ -40,7 +41,11 @@ python scripts/evaluate_model.py \\
|
|
| 40 |
--adapter '$ADAPTER' \\
|
| 41 |
--dataset nraptisss/TMF921-intent-to-config-research-sota \\
|
| 42 |
--output_dir '$RUN_DIR/eval' \\
|
| 43 |
-
--load_in_4bit
|
|
|
|
|
|
|
|
|
|
|
|
|
| 44 |
" > "$LOG" 2>&1 &
|
| 45 |
|
| 46 |
echo $! > "$RUN_DIR/EVAL_PID.txt"
|
|
@@ -55,4 +60,9 @@ RESULTS=$RUN_DIR/eval/all_metrics.json
|
|
| 55 |
|
| 56 |
Monitor:
|
| 57 |
tail -f "$LOG"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 58 |
EOF
|
|
|
|
| 2 |
set -euo pipefail
|
| 3 |
|
| 4 |
# Evaluate a completed or checkpointed run under nohup.
|
| 5 |
+
# Resumable: existing eval/<split>/predictions.json rows are skipped.
|
| 6 |
# Usage:
|
| 7 |
+
# EVAL_BATCH_SIZE=4 bash scripts/nohup_eval.sh runs/qwen3-8b-qlora-YYYYMMDD-HHMMSS [adapter_path]
|
| 8 |
|
| 9 |
if [ $# -lt 1 ]; then
|
| 10 |
echo "Usage: $0 <RUN_DIR> [ADAPTER_PATH]" >&2
|
|
|
|
| 41 |
--adapter '$ADAPTER' \\
|
| 42 |
--dataset nraptisss/TMF921-intent-to-config-research-sota \\
|
| 43 |
--output_dir '$RUN_DIR/eval' \\
|
| 44 |
+
--load_in_4bit \\
|
| 45 |
+
--batch_size '${EVAL_BATCH_SIZE:-4}' \\
|
| 46 |
+
--max_new_tokens '${EVAL_MAX_NEW_TOKENS:-1536}' \\
|
| 47 |
+
--gold_length_buffer '${EVAL_GOLD_LENGTH_BUFFER:-96}' \\
|
| 48 |
+
--save_every '${EVAL_SAVE_EVERY:-25}'
|
| 49 |
" > "$LOG" 2>&1 &
|
| 50 |
|
| 51 |
echo $! > "$RUN_DIR/EVAL_PID.txt"
|
|
|
|
| 60 |
|
| 61 |
Monitor:
|
| 62 |
tail -f "$LOG"
|
| 63 |
+
|
| 64 |
+
Tuning knobs:
|
| 65 |
+
EVAL_BATCH_SIZE=${EVAL_BATCH_SIZE:-4}
|
| 66 |
+
EVAL_MAX_NEW_TOKENS=${EVAL_MAX_NEW_TOKENS:-1536}
|
| 67 |
+
EVAL_GOLD_LENGTH_BUFFER=${EVAL_GOLD_LENGTH_BUFFER:-96}
|
| 68 |
EOF
|