asdf98
/

ethical-hacking-llm-colab

asdf98 committed 1 day ago

Commit

313d1a1

verified ·

1 Parent(s): a7d1cc9

Upload EthicalHacking_Qwen3-4B_Ultimate_Colab.ipynb

Files changed (1) hide show

EthicalHacking_Qwen3-4B_Ultimate_Colab.ipynb CHANGED Viewed

@@ -67,7 +67,10 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "## 3️⃣ Load Qwen3-4B-Instruct-2507 in 4-bit via Unsloth"
    ]
   },
   {
@@ -100,6 +103,7 @@
     "    max_seq_length=MAX_SEQ_LENGTH,\n",
     "    dtype=None,\n",
     "    load_in_4bit=True,\n",
     ")\n",
     "\n",
     "model = FastLanguageModel.get_peft_model(\n",
@@ -219,8 +223,6 @@
     "    return {\"messages\": msgs}\n",
     "\n",
     "def _convert_code_corpus(example):\n",
-    "    # Code Corpus: raw code text with domain/repo metadata in a user prompt + assistant format\n",
-    "    # We treat the code block as an assistant response to a user asking about that code\n",
     "    code_text = example[\"text\"]\n",
     "    domain = example.get(\"domain\", \"code\")\n",
     "    repo = example.get(\"repo\", \"unknown\")\n",
@@ -231,7 +233,6 @@
     "        {\"role\": \"assistant\", \"content\": code_text},\n",
     "    ]}\n",
     "\n",
-    "# ===================== LOAD DATASET(S) =====================\n",
     "all_datasets = []\n",
     "\n",
     "if DATASET_CHOICE == \"cybersecurity\":\n",
@@ -388,7 +389,7 @@
    "outputs": [],
    "source": [
     "if torch.cuda.is_available():\n",
-    "    print(f\"VRAM before train: {torch.cuda.memory_allocated()/1e9:.2f} GB\")\n",
     "\n",
     "trainer_stats = trainer.train()\n",
     "\n",

    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "## 3️⃣ Load Qwen3-4B-Instruct-2507 in 4-bit via Unsloth\n",
+    "\n",
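+    "**⚠️ IMPORTANT:** We pass `device_map={\"\": torch.cuda.current_device()}` to load the entire model onto the currently active GPU.\n",
+    "Without this, `accelerate` may place the model on the CPU, which raises a `ValueError` once training starts on Kaggle/Colab. This requires a GPU runtime: `torch.cuda.current_device()` fails if no CUDA device is available."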
    ]
   },
   {
     "    max_seq_length=MAX_SEQ_LENGTH,\n",
     "    dtype=None,\n",
     "    load_in_4bit=True,\n",
+    "    device_map={\"\": torch.cuda.current_device()},  # ← FORCE GPU: fixes Kaggle/Colab device placement bug\n",
     ")\n",
     "\n",
     "model = FastLanguageModel.get_peft_model(\n",
     "    return {\"messages\": msgs}\n",
     "\n",
     "def _convert_code_corpus(example):\n",
     "    code_text = example[\"text\"]\n",
     "    domain = example.get(\"domain\", \"code\")\n",
     "    repo = example.get(\"repo\", \"unknown\")\n",
     "        {\"role\": \"assistant\", \"content\": code_text},\n",
     "    ]}\n",
     "\n",
     "all_datasets = []\n",
     "\n",
     "if DATASET_CHOICE == \"cybersecurity\":\n",
    "outputs": [],
    "source": [
     "if torch.cuda.is_available():\n",
+    "    print(f\"VRAM before train: {torch.cuda.memory_allocated()/1e9:.2f} GB / {torch.cuda.get_device_properties(0).total_memory/1e9:.2f} GB\")\n",
     "\n",
     "trainer_stats = trainer.train()\n",
     "\n",