Pratyush-01 committed on
Commit
825a76e
·
verified ·
1 Parent(s): 74ddb14

Upload folder using huggingface_hub

Browse files
frontend/src/components/RunWithLlmPane.tsx CHANGED
@@ -718,7 +718,7 @@ function ModelPresetPicker({
718
  key={preset.id}
719
  preset={preset}
720
  selected={selected.id === preset.id}
721
- disabled={disabled}
722
  onSelect={() => selectPreset(preset)}
723
  />
724
  ))}
 
718
  key={preset.id}
719
  preset={preset}
720
  selected={selected.id === preset.id}
721
+ disabled={disabled ?? false}
722
  onSelect={() => selectPreset(preset)}
723
  />
724
  ))}
train/physix_train_colab.ipynb CHANGED
@@ -323,28 +323,7 @@
323
  "metadata": {},
324
  "outputs": [],
325
  "source": [
326
- "import subprocess, sys\n",
327
- "\n",
328
- "SFT_OUT = \"/tmp/physix-sft\"\n",
329
- "\n",
330
- "sft_cmd = [\n",
331
- " sys.executable, \"-m\", \"physix.training.sft\",\n",
332
- " \"--model\", p[\"base_model\"],\n",
333
- " \"--output-dir\", SFT_OUT,\n",
334
- " \"--epochs\", p[\"sft_epochs\"],\n",
335
- " \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n",
336
- " \"--lora-r\", p[\"sft_lora_r\"],\n",
337
- " \"--learning-rate\", p[\"sft_lr\"],\n",
338
- " \"--wandb-run-name\", p[\"sft_run_name\"],\n",
339
- " \"--seed\", \"0\",\n",
340
- "]\n",
341
- "if SYSTEM_ID:\n",
342
- " sft_cmd += [\"--system-ids\", SYSTEM_ID]\n",
343
- "if PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n",
344
- " sft_cmd += [\"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"]]\n",
345
- "\n",
346
- "print(\"$\", \" \".join(sft_cmd))\n",
347
- "subprocess.run(sft_cmd, check=True)"
348
  ]
349
  },
350
  {
@@ -372,35 +351,7 @@
372
  "metadata": {},
373
  "outputs": [],
374
  "source": [
375
- "GRPO_OUT = \"/tmp/physix-grpo\"\n",
376
- "\n",
377
- "grpo_cmd = [\n",
378
- " sys.executable, \"-m\", \"physix.training.loop\",\n",
379
- " \"--model\", p[\"base_model\"],\n",
380
- " \"--output-dir\", GRPO_OUT,\n",
381
- " \"--num-steps\", p[\"num_steps\"],\n",
382
- " \"--num-generations\", p[\"num_generations\"],\n",
383
- " \"--max-completion-length\", p[\"max_completion\"],\n",
384
- " \"--learning-rate\", p[\"grpo_lr\"],\n",
385
- " \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n",
386
- " \"--lora-r\", p[\"grpo_lora_r\"],\n",
387
- " \"--save-method\", \"merged_16bit\",\n",
388
- " \"--wandb-project\", \"physix-live\",\n",
389
- " \"--wandb-run-name\", p[\"grpo_run_name\"],\n",
390
- " \"--sft-checkpoint\", f\"{SFT_OUT}/merged\",\n",
391
- " \"--seed\", \"0\",\n",
392
- "]\n",
393
- "if SYSTEM_ID:\n",
394
- " grpo_cmd += [\"--system-ids\", SYSTEM_ID]\n",
395
- "if PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n",
396
- " grpo_cmd += [\n",
397
- " \"--push-to-hub\",\n",
398
- " \"--hub-repo-id\", p[\"hub_final_repo\"],\n",
399
- " \"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"],\n",
400
- " ]\n",
401
- "\n",
402
- "print(\"$\", \" \".join(grpo_cmd))\n",
403
- "subprocess.run(grpo_cmd, check=True)"
404
  ]
405
  },
406
  {
 
323
  "metadata": {},
324
  "outputs": [],
325
  "source": [
326
+ "import subprocess, sys\n\nSFT_OUT = \"/tmp/physix-sft\"\n\nsft_cmd = [\n sys.executable, \"-m\", \"physix.training.sft\",\n \"--model\", p[\"base_model\"],\n \"--output-dir\", SFT_OUT,\n \"--epochs\", p[\"sft_epochs\"],\n \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n \"--lora-r\", p[\"sft_lora_r\"],\n \"--learning-rate\", p[\"sft_lr\"],\n \"--wandb-run-name\", p[\"sft_run_name\"],\n \"--seed\", \"0\",\n]\nif SYSTEM_ID:\n sft_cmd += [\"--system-ids\", SYSTEM_ID]\nif PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n sft_cmd += [\"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"]]\n\nprint(\"=\" * 78)\nprint(\" SFT is launched as a subprocess. Per-step loss WILL NOT stream to this cell.\")\nprint(\" \u2192 Live loss curve: https://wandb.ai/pratyush01/physix-live\")\nprint(f\" run name: {p['sft_run_name']}\")\nprint(\" (If WANDB_API_KEY is unset, metrics are still saved to trainer_state.json\")\nprint(\" under SFT_OUT and plotted in the final cell of this notebook.)\")\nprint(\"=\" * 78)\nprint(\"$\", \" \".join(sft_cmd))\nsubprocess.run(sft_cmd, check=True)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
327
  ]
328
  },
329
  {
 
351
  "metadata": {},
352
  "outputs": [],
353
  "source": [
354
+ "GRPO_OUT = \"/tmp/physix-grpo\"\n\ngrpo_cmd = [\n sys.executable, \"-m\", \"physix.training.loop\",\n \"--model\", p[\"base_model\"],\n \"--output-dir\", GRPO_OUT,\n \"--num-steps\", p[\"num_steps\"],\n \"--num-generations\", p[\"num_generations\"],\n \"--max-completion-length\", p[\"max_completion\"],\n \"--learning-rate\", p[\"grpo_lr\"],\n \"--instances-per-system\", str(INSTANCES_PER_SYSTEM),\n \"--lora-r\", p[\"grpo_lora_r\"],\n \"--save-method\", \"merged_16bit\",\n \"--wandb-project\", \"physix-live\",\n \"--wandb-run-name\", p[\"grpo_run_name\"],\n \"--sft-checkpoint\", f\"{SFT_OUT}/merged\",\n \"--seed\", \"0\",\n]\nif SYSTEM_ID:\n grpo_cmd += [\"--system-ids\", SYSTEM_ID]\nif PUSH_TO_HUB and os.environ.get(\"HF_TOKEN\"):\n grpo_cmd += [\n \"--push-to-hub\",\n \"--hub-repo-id\", p[\"hub_final_repo\"],\n \"--hub-checkpoint-repo-id\", p[\"hub_ckpt_repo\"],\n ]\n\nprint(\"=\" * 78)\nprint(\" GRPO is launched as a subprocess. Per-step reward / loss WILL NOT stream here.\")\nprint(\" \u2192 Live curves (reward, reward_std, KL, per-component reward, loss):\")\nprint(\" https://wandb.ai/pratyush01/physix-live\")\nprint(f\" run name: {p['grpo_run_name']}\")\nprint(\" (If WANDB_API_KEY is unset, all metrics are still saved to\")\nprint(\" trainer_state.json under GRPO_OUT and plotted in the final cell.)\")\nprint(\"=\" * 78)\nprint(\"$\", \" \".join(grpo_cmd))\nsubprocess.run(grpo_cmd, check=True)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
355
  ]
356
  },
357
  {