nraptisss committed on
Commit
02163ca
·
verified ·
1 Parent(s): 1a58981

Upload merge_and_push.py

Browse files
Files changed (1) hide show
  1. merge_and_push.py +12 -3
merge_and_push.py CHANGED
@@ -3,6 +3,9 @@ Merge LoRA adapters into the base model and push to Hugging Face Hub.
3
  Run this after train.py completes successfully.
4
  """
5
 
 
 
 
6
  import torch
7
  from transformers import AutoModelForCausalLM, AutoTokenizer
8
  from peft import PeftModel
@@ -19,10 +22,16 @@ HUB_MODEL_ID = "nraptisss/qwen2.5-7b-telecom-intent-merged"
19
 
20
  def merge_and_push():
21
  """Load adapters, merge, save locally, and push to hub."""
 
 
 
 
 
 
22
  print(f"Loading base model: {BASE_MODEL}")
23
  base_model = AutoModelForCausalLM.from_pretrained(
24
  BASE_MODEL,
25
- torch_dtype=torch.float16,
26
  device_map="auto",
27
  trust_remote_code=True,
28
  )
@@ -34,8 +43,8 @@ def merge_and_push():
34
  if tokenizer.pad_token is None:
35
  tokenizer.pad_token = tokenizer.eos_token
36
 
37
- print(f"Loading adapters from: {ADAPTER_PATH}")
38
- model = PeftModel.from_pretrained(base_model, ADAPTER_PATH)
39
 
40
  print("Merging adapters into base model...")
41
  model = model.merge_and_unload()
 
3
  Run this after train.py completes successfully.
4
  """
5
 
6
+ import os
7
+ import sys
8
+
9
  import torch
10
  from transformers import AutoModelForCausalLM, AutoTokenizer
11
  from peft import PeftModel
 
22
 
23
  def merge_and_push():
24
  """Load adapters, merge, save locally, and push to hub."""
25
+ adapter_path = os.path.abspath(ADAPTER_PATH)
26
+ if not os.path.isdir(adapter_path):
27
+ print(f"ERROR: Adapter path not found: {adapter_path}")
28
+ print("Run train.py first to generate adapters.")
29
+ sys.exit(1)
30
+
31
  print(f"Loading base model: {BASE_MODEL}")
32
  base_model = AutoModelForCausalLM.from_pretrained(
33
  BASE_MODEL,
34
+ dtype=torch.float16,
35
  device_map="auto",
36
  trust_remote_code=True,
37
  )
 
43
  if tokenizer.pad_token is None:
44
  tokenizer.pad_token = tokenizer.eos_token
45
 
46
+ print(f"Loading adapters from: {adapter_path}")
47
+ model = PeftModel.from_pretrained(base_model, adapter_path)
48
 
49
  print("Merging adapters into base model...")
50
  model = model.merge_and_unload()