anuragredbus committed on
Commit
95d0045
·
1 Parent(s): 7db31d9

hf jobs: propagate TEST_ONLY env through launcher + remote runner

Browse files
training/hf_remote_run.sh CHANGED
@@ -17,6 +17,7 @@ set -euo pipefail
17
 
18
  NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
19
  export SMOKE_MODE="${SMOKE_MODE:-0}"
 
20
  export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
21
  export TOKENIZERS_PARALLELISM="${TOKENIZERS_PARALLELISM:-false}"
22
  export DEBIAN_FRONTEND=noninteractive
@@ -24,6 +25,7 @@ export DEBIAN_FRONTEND=noninteractive
24
  echo "===== hf_remote_run.sh starting at $(date -u +%FT%TZ) ====="
25
  echo "SPACE_REPO=${SPACE_REPO}"
26
  echo "SMOKE_MODE=${SMOKE_MODE}"
 
27
  echo "NB_EXEC_TIMEOUT=${NB_EXEC_TIMEOUT}"
28
 
29
  nvidia-smi || true
 
17
 
18
  NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
19
  export SMOKE_MODE="${SMOKE_MODE:-0}"
20
+ export TEST_ONLY="${TEST_ONLY:-0}"
21
  export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
22
  export TOKENIZERS_PARALLELISM="${TOKENIZERS_PARALLELISM:-false}"
23
  export DEBIAN_FRONTEND=noninteractive
 
25
  echo "===== hf_remote_run.sh starting at $(date -u +%FT%TZ) ====="
26
  echo "SPACE_REPO=${SPACE_REPO}"
27
  echo "SMOKE_MODE=${SMOKE_MODE}"
28
+ echo "TEST_ONLY=${TEST_ONLY}"
29
  echo "NB_EXEC_TIMEOUT=${NB_EXEC_TIMEOUT}"
30
 
31
  nvidia-smi || true
training/hf_run_space_train_job.sh CHANGED
@@ -16,6 +16,7 @@ TIMEOUT="${HF_JOB_TIMEOUT:-8h}"
16
  SPACE_REPO="${HF_SPACE_REPO_ID:-ycwhencpp/final-iteration}"
17
  NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
18
  SMOKE_MODE="${SMOKE_MODE:-0}"
 
19
 
20
  if ! hf auth whoami &>/dev/null; then
21
  echo "Run: hf auth login" >&2
@@ -43,4 +44,5 @@ exec hf jobs run \
43
  --env "SPACE_REPO=$SPACE_REPO" \
44
  --env "NB_EXEC_TIMEOUT=$NB_EXEC_TIMEOUT" \
45
  --env "SMOKE_MODE=$SMOKE_MODE" \
 
46
  -- "$IMAGE" bash -c "$BOOTSTRAP"
 
16
  SPACE_REPO="${HF_SPACE_REPO_ID:-ycwhencpp/final-iteration}"
17
  NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
18
  SMOKE_MODE="${SMOKE_MODE:-0}"
19
+ TEST_ONLY="${TEST_ONLY:-0}"
20
 
21
  if ! hf auth whoami &>/dev/null; then
22
  echo "Run: hf auth login" >&2
 
44
  --env "SPACE_REPO=$SPACE_REPO" \
45
  --env "NB_EXEC_TIMEOUT=$NB_EXEC_TIMEOUT" \
46
  --env "SMOKE_MODE=$SMOKE_MODE" \
47
+ --env "TEST_ONLY=$TEST_ONLY" \
48
  -- "$IMAGE" bash -c "$BOOTSTRAP"