| from unsloth import FastVisionModel |
| from dotenv import load_dotenv |
| import os |
|
|
|
|
| def save_model(model, tokenizer, local: bool) -> None: |
| load_dotenv() |
| if local: |
| model.save_pretrained() |
| tokenizer.save_pretrained("ft_llava") |
| else: |
| model.push_to_hub(f"{os.getenv("ORG_NAME")}/ft_llava", token = os.getenv("HF_TOKEN")) |
| return |
|
|
|
|
| def save_gguf(model_name: str, local:bool, tokenizer): |
| model, processor = FastVisionModel.from_pretrained( |
| model_name= model_name, |
| load_in_4bit=True, |
| ) |
| FastVisionModel.for_inference(model) |
| if local: |
| model.save_pretrained_merged("ft_qwen2_vl_2b", tokenizer) |
|
|
| else: |
| model.push_to_hub_merged(f"{os.getenv("ORG_NAME")}/ft_qwen2_vl_2b", tokenizer, token = f"{os.getenv("HF_TOKEN")}") |
|
|