File size: 806 Bytes
3b6ded8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
from unsloth import FastVisionModel
from dotenv import load_dotenv
import os


def save_model(model, tokenizer, local: bool) -> None:
    load_dotenv()
    if local:
        model.save_pretrained()
        tokenizer.save_pretrained("ft_llava")
    else:
        model.push_to_hub(f"{os.getenv("ORG_NAME")}/ft_llava", token = os.getenv("HF_TOKEN"))        
    return 


def save_gguf(model_name: str, local:bool, tokenizer): 
    model, processor = FastVisionModel.from_pretrained(
        model_name= model_name, 
        load_in_4bit=True,  
    )
    FastVisionModel.for_inference(model) 
    if local:
        model.save_pretrained_merged("ft_qwen2_vl_2b", tokenizer)

    else:
        model.push_to_hub_merged(f"{os.getenv("ORG_NAME")}/ft_qwen2_vl_2b", tokenizer, token = f"{os.getenv("HF_TOKEN")}")