Spaces:
Paused
Paused
Commit ·
95d0045
1
Parent(s): 7db31d9
hf jobs: propagate the TEST_ONLY environment variable through the launcher and the remote runner
Browse files
training/hf_remote_run.sh
CHANGED
|
@@ -17,6 +17,7 @@ set -euo pipefail
|
|
| 17 |
|
| 18 |
NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
|
| 19 |
export SMOKE_MODE="${SMOKE_MODE:-0}"
|
|
|
|
| 20 |
export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
|
| 21 |
export TOKENIZERS_PARALLELISM="${TOKENIZERS_PARALLELISM:-false}"
|
| 22 |
export DEBIAN_FRONTEND=noninteractive
|
|
@@ -24,6 +25,7 @@ export DEBIAN_FRONTEND=noninteractive
|
|
| 24 |
echo "===== hf_remote_run.sh starting at $(date -u +%FT%TZ) ====="
|
| 25 |
echo "SPACE_REPO=${SPACE_REPO}"
|
| 26 |
echo "SMOKE_MODE=${SMOKE_MODE}"
|
|
|
|
| 27 |
echo "NB_EXEC_TIMEOUT=${NB_EXEC_TIMEOUT}"
|
| 28 |
|
| 29 |
nvidia-smi || true
|
|
|
|
| 17 |
|
| 18 |
NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
|
| 19 |
export SMOKE_MODE="${SMOKE_MODE:-0}"
|
| 20 |
+
export TEST_ONLY="${TEST_ONLY:-0}"
|
| 21 |
export HF_HUB_ENABLE_HF_TRANSFER="${HF_HUB_ENABLE_HF_TRANSFER:-1}"
|
| 22 |
export TOKENIZERS_PARALLELISM="${TOKENIZERS_PARALLELISM:-false}"
|
| 23 |
export DEBIAN_FRONTEND=noninteractive
|
|
|
|
| 25 |
echo "===== hf_remote_run.sh starting at $(date -u +%FT%TZ) ====="
|
| 26 |
echo "SPACE_REPO=${SPACE_REPO}"
|
| 27 |
echo "SMOKE_MODE=${SMOKE_MODE}"
|
| 28 |
+
echo "TEST_ONLY=${TEST_ONLY}"
|
| 29 |
echo "NB_EXEC_TIMEOUT=${NB_EXEC_TIMEOUT}"
|
| 30 |
|
| 31 |
nvidia-smi || true
|
training/hf_run_space_train_job.sh
CHANGED
|
@@ -16,6 +16,7 @@ TIMEOUT="${HF_JOB_TIMEOUT:-8h}"
|
|
| 16 |
SPACE_REPO="${HF_SPACE_REPO_ID:-ycwhencpp/final-iteration}"
|
| 17 |
NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
|
| 18 |
SMOKE_MODE="${SMOKE_MODE:-0}"
|
|
|
|
| 19 |
|
| 20 |
if ! hf auth whoami &>/dev/null; then
|
| 21 |
echo "Run: hf auth login" >&2
|
|
@@ -43,4 +44,5 @@ exec hf jobs run \
|
|
| 43 |
--env "SPACE_REPO=$SPACE_REPO" \
|
| 44 |
--env "NB_EXEC_TIMEOUT=$NB_EXEC_TIMEOUT" \
|
| 45 |
--env "SMOKE_MODE=$SMOKE_MODE" \
|
|
|
|
| 46 |
-- "$IMAGE" bash -c "$BOOTSTRAP"
|
|
|
|
| 16 |
SPACE_REPO="${HF_SPACE_REPO_ID:-ycwhencpp/final-iteration}"
|
| 17 |
NB_EXEC_TIMEOUT="${NB_EXEC_TIMEOUT:-14400}"
|
| 18 |
SMOKE_MODE="${SMOKE_MODE:-0}"
|
| 19 |
+
TEST_ONLY="${TEST_ONLY:-0}"
|
| 20 |
|
| 21 |
if ! hf auth whoami &>/dev/null; then
|
| 22 |
echo "Run: hf auth login" >&2
|
|
|
|
| 44 |
--env "SPACE_REPO=$SPACE_REPO" \
|
| 45 |
--env "NB_EXEC_TIMEOUT=$NB_EXEC_TIMEOUT" \
|
| 46 |
--env "SMOKE_MODE=$SMOKE_MODE" \
|
| 47 |
+
--env "TEST_ONLY=$TEST_ONLY" \
|
| 48 |
-- "$IMAGE" bash -c "$BOOTSTRAP"
|