PEFT
qlora
sft
trl
qwen3
tmf921
intent-based-networking
network-slicing
rtx-6000-ada
ml-intern
nraptisss committed on
Commit
f4beb76
·
verified ·
1 Parent(s): 6f5475f

Update nohup evaluator defaults for faster resumable batched generation

Browse files
Files changed (1) hide show
  1. scripts/nohup_eval.sh +12 -2
scripts/nohup_eval.sh CHANGED
@@ -2,8 +2,9 @@
2
  set -euo pipefail
3
 
4
  # Evaluate a completed or checkpointed run under nohup.
 
5
  # Usage:
6
- # bash scripts/nohup_eval.sh runs/qwen3-8b-qlora-YYYYMMDD-HHMMSS [adapter_path]
7
 
8
  if [ $# -lt 1 ]; then
9
  echo "Usage: $0 <RUN_DIR> [ADAPTER_PATH]" >&2
@@ -40,7 +41,11 @@ python scripts/evaluate_model.py \\
40
  --adapter '$ADAPTER' \\
41
  --dataset nraptisss/TMF921-intent-to-config-research-sota \\
42
  --output_dir '$RUN_DIR/eval' \\
43
- --load_in_4bit
 
 
 
 
44
  " > "$LOG" 2>&1 &
45
 
46
  echo $! > "$RUN_DIR/EVAL_PID.txt"
@@ -55,4 +60,9 @@ RESULTS=$RUN_DIR/eval/all_metrics.json
55
 
56
  Monitor:
57
  tail -f "$LOG"
 
 
 
 
 
58
  EOF
 
2
  set -euo pipefail
3
 
4
  # Evaluate a completed or checkpointed run under nohup.
5
+ # Resumable: existing eval/<split>/predictions.json rows are skipped.
6
  # Usage:
7
+ # EVAL_BATCH_SIZE=4 bash scripts/nohup_eval.sh runs/qwen3-8b-qlora-YYYYMMDD-HHMMSS [adapter_path]
8
 
9
  if [ $# -lt 1 ]; then
10
  echo "Usage: $0 <RUN_DIR> [ADAPTER_PATH]" >&2
 
41
  --adapter '$ADAPTER' \\
42
  --dataset nraptisss/TMF921-intent-to-config-research-sota \\
43
  --output_dir '$RUN_DIR/eval' \\
44
+ --load_in_4bit \\
45
+ --batch_size '${EVAL_BATCH_SIZE:-4}' \\
46
+ --max_new_tokens '${EVAL_MAX_NEW_TOKENS:-1536}' \\
47
+ --gold_length_buffer '${EVAL_GOLD_LENGTH_BUFFER:-96}' \\
48
+ --save_every '${EVAL_SAVE_EVERY:-25}'
49
  " > "$LOG" 2>&1 &
50
 
51
  echo $! > "$RUN_DIR/EVAL_PID.txt"
 
60
 
61
  Monitor:
62
  tail -f "$LOG"
63
+
64
+ Tuning knobs:
65
+ EVAL_BATCH_SIZE=${EVAL_BATCH_SIZE:-4}
66
+ EVAL_MAX_NEW_TOKENS=${EVAL_MAX_NEW_TOKENS:-1536}
67
+ EVAL_GOLD_LENGTH_BUFFER=${EVAL_GOLD_LENGTH_BUFFER:-96}
68
  EOF