Spaces:
Sleeping
Sleeping
Upload folder using huggingface_hub
Browse files
frontend/src/components/RunWithLlmPane.tsx
CHANGED
|
@@ -718,7 +718,7 @@ function ModelPresetPicker({
|
|
| 718 |
key={preset.id}
|
| 719 |
preset={preset}
|
| 720 |
selected={selected.id === preset.id}
|
| 721 |
-
disabled={disabled}
|
| 722 |
onSelect={() => selectPreset(preset)}
|
| 723 |
/>
|
| 724 |
))}
|
|
|
|
| 718 |
key={preset.id}
|
| 719 |
preset={preset}
|
| 720 |
selected={selected.id === preset.id}
|
| 721 |
+
disabled={disabled ?? false}
|
| 722 |
onSelect={() => selectPreset(preset)}
|
| 723 |
/>
|
| 724 |
))}
|
train/physix_train_colab.ipynb
CHANGED
|
@@ -323,28 +323,7 @@
|
|
| 323 |
"metadata": {},
|
| 324 |
"outputs": [],
|
| 325 |
"source": [
|
| 326 |
-
"import subprocess, sys\n",
|
| 327 |
-
"\n",
|
| 328 |
-
"SFT_OUT = \"/tmp/physix-sft\"\n",
|
| 329 |
-
"\n",
|
| 330 |
-
"sft_cmd = [\n",
|
| 331 |
-
" sys.executable, \"-m\", \"physix.training.sft\",\n",
|
| 332 |
-
" \"--model\", p[\"base_model\"],\n",
|
| 333 |
-
" \"--output-dir\", SFT_OUT,\n",
|
| 334 |
-
" \"--epochs\", p[\"sft_epochs\"],\n",
|
| 335 |
-
" \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n",
|
| 336 |
-
" \"--lora-r\", p[\"sft_lora_r\"],\n",
|
| 337 |
-
" \"--learning-rate\", p[\"sft_lr\"],\n",
|
| 338 |
-
" \"--wandb-run-name\", p[\"sft_run_name\"],\n",
|
| 339 |
-
" \"--seed\", \"0\",\n",
|
| 340 |
-
"]\n",
|
| 341 |
-
"if SYSTEM_ID:\n",
|
| 342 |
-
" sft_cmd += [\"--system-ids\", SYSTEM_ID]\n",
|
| 343 |
-
"if PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n",
|
| 344 |
-
" sft_cmd += [\"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"]]\n",
|
| 345 |
-
"\n",
|
| 346 |
-
"print(\"$\", \" \".join(sft_cmd))\n",
|
| 347 |
-
"subprocess.run(sft_cmd, check=True)"
|
| 348 |
]
|
| 349 |
},
|
| 350 |
{
|
|
@@ -372,35 +351,7 @@
|
|
| 372 |
"metadata": {},
|
| 373 |
"outputs": [],
|
| 374 |
"source": [
|
| 375 |
-
"GRPO_OUT = \"/tmp/physix-grpo\"\n",
|
| 376 |
-
"\n",
|
| 377 |
-
"grpo_cmd = [\n",
|
| 378 |
-
" sys.executable, \"-m\", \"physix.training.loop\",\n",
|
| 379 |
-
" \"--model\", p[\"base_model\"],\n",
|
| 380 |
-
" \"--output-dir\", GRPO_OUT,\n",
|
| 381 |
-
" \"--num-steps\", p[\"num_steps\"],\n",
|
| 382 |
-
" \"--num-generations\", p[\"num_generations\"],\n",
|
| 383 |
-
" \"--max-completion-length\", p[\"max_completion\"],\n",
|
| 384 |
-
" \"--learning-rate\", p[\"grpo_lr\"],\n",
|
| 385 |
-
" \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n",
|
| 386 |
-
" \"--lora-r\", p[\"grpo_lora_r\"],\n",
|
| 387 |
-
" \"--save-method\", \"merged_16bit\",\n",
|
| 388 |
-
" \"--wandb-project\", \"physix-live\",\n",
|
| 389 |
-
" \"--wandb-run-name\", p[\"grpo_run_name\"],\n",
|
| 390 |
-
" \"--sft-checkpoint\", f\"{SFT_OUT}/merged\",\n",
|
| 391 |
-
" \"--seed\", \"0\",\n",
|
| 392 |
-
"]\n",
|
| 393 |
-
"if SYSTEM_ID:\n",
|
| 394 |
-
" grpo_cmd += [\"--system-ids\", SYSTEM_ID]\n",
|
| 395 |
-
"if PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n",
|
| 396 |
-
" grpo_cmd += [\n",
|
| 397 |
-
" \"--push-to-hub\",\n",
|
| 398 |
-
" \"--hub-repo-id\", p[\"hub_final_repo\"],\n",
|
| 399 |
-
" \"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"],\n",
|
| 400 |
-
" ]\n",
|
| 401 |
-
"\n",
|
| 402 |
-
"print(\"$\", \" \".join(grpo_cmd))\n",
|
| 403 |
-
"subprocess.run(grpo_cmd, check=True)"
|
| 404 |
]
|
| 405 |
},
|
| 406 |
{
|
|
|
|
| 323 |
"metadata": {},
|
| 324 |
"outputs": [],
|
| 325 |
"source": [
|
| 326 |
+
"import subprocess, sys\n\nSFT_OUT = \"/tmp/physix-sft\"\n\nsft_cmd = [\n sys.executable, \"-m\", \"physix.training.sft\",\n \"--model\", p[\"base_model\"],\n \"--output-dir\", SFT_OUT,\n \"--epochs\", p[\"sft_epochs\"],\n \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n \"--lora-r\", p[\"sft_lora_r\"],\n \"--learning-rate\", p[\"sft_lr\"],\n \"--wandb-run-name\", p[\"sft_run_name\"],\n \"--seed\", \"0\",\n]\nif SYSTEM_ID:\n sft_cmd += [\"--system-ids\", SYSTEM_ID]\nif PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n sft_cmd += [\"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"]]\n\nprint(\"=\" * 78)\nprint(\" SFT is launched as a subprocess. Per-step loss WILL NOT stream to this cell.\")\nprint(\" \u2192 Live loss curve: https://wandb.ai/pratyush01/physix-live\")\nprint(f\" run name: {p['sft_run_name']}\")\nprint(\" (If WANDB_API_KEY is unset, metrics are still saved to trainer_state.json\")\nprint(\" under SFT_OUT and plotted in the final cell of this notebook.)\")\nprint(\"=\" * 78)\nprint(\"$\", \" \".join(sft_cmd))\nsubprocess.run(sft_cmd, check=True)\n"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 327 |
]
|
| 328 |
},
|
| 329 |
{
|
|
|
|
| 351 |
"metadata": {},
|
| 352 |
"outputs": [],
|
| 353 |
"source": [
|
| 354 |
+
"GRPO_OUT = \"/tmp/physix-grpo\"\n\ngrpo_cmd = [\n sys.executable, \"-m\", \"physix.training.loop\",\n \"--model\", p[\"base_model\"],\n \"--output-dir\", GRPO_OUT,\n \"--num-steps\", p[\"num_steps\"],\n \"--num-generations\", p[\"num_generations\"],\n \"--max-completion-length\", p[\"max_completion\"],\n \"--learning-rate\", p[\"grpo_lr\"],\n \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n \"--lora-r\", p[\"grpo_lora_r\"],\n \"--save-method\", \"merged_16bit\",\n \"--wandb-project\", \"physix-live\",\n \"--wandb-run-name\", p[\"grpo_run_name\"],\n \"--sft-checkpoint\", f\"{SFT_OUT}/merged\",\n \"--seed\", \"0\",\n]\nif SYSTEM_ID:\n grpo_cmd += [\"--system-ids\", SYSTEM_ID]\nif PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n grpo_cmd += [\n \"--push-to-hub\",\n \"--hub-repo-id\", p[\"hub_final_repo\"],\n \"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"],\n ]\n\nprint(\"=\" * 78)\nprint(\" GRPO is launched as a subprocess. Per-step reward / loss WILL NOT stream here.\")\nprint(\" \u2192 Live curves (reward, reward_std, KL, per-component reward, loss):\")\nprint(\" https://wandb.ai/pratyush01/physix-live\")\nprint(f\" run name: {p['grpo_run_name']}\")\nprint(\" (If WANDB_API_KEY is unset, all metrics are still saved to\")\nprint(\" trainer_state.json under GRPO_OUT and plotted in the final cell.)\")\nprint(\"=\" * 78)\nprint(\"$\", \" \".join(grpo_cmd))\nsubprocess.run(grpo_cmd, check=True)\n"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 355 |
]
|
| 356 |
},
|
| 357 |
{
|