Jayashree Sridhar committed on
Commit
f8a9066
·
1 Parent(s): 94ae986

replaced mistral with TinyGPT2Model

Browse files
Files changed (1) hide show
  1. models/mistral_model.py +4 -5
models/mistral_model.py CHANGED
@@ -24,9 +24,9 @@ class MistralModel:
24
 
25
  def _initialize_model(self):
26
  """Initialize Mistral model with optimizations"""
27
- print("Loading Mistral model...")
28
 
29
- model_id = "mistralai/Mistral-7B-Instruct-v0.2"
30
 
31
  # Load tokenizer
32
  MistralModel._tokenizer = AutoTokenizer.from_pretrained(model_id, token=HUGGINGFACE_TOKEN,use_fast=False)
@@ -35,12 +35,11 @@ class MistralModel:
35
  MistralModel._model = AutoModelForCausalLM.from_pretrained(
36
  model_id,
37
  token=HUGGINGFACE_TOKEN,
38
- torch_dtype=torch.float16,
39
- device_map="auto",
40
  load_in_8bit=True # Use 8-bit quantization for memory efficiency
41
  )
42
 
43
- print("Mistral model loaded successfully!")
44
 
45
  def generate(
46
  self,
 
24
 
25
  def _initialize_model(self):
26
  """Initialize Mistral model with optimizations"""
27
+ print("Loading TinyGPT2Model model...")
28
 
29
+ model_id = "sshleifer/tiny-gpt2"
30
 
31
  # Load tokenizer
32
  MistralModel._tokenizer = AutoTokenizer.from_pretrained(model_id, token=HUGGINGFACE_TOKEN,use_fast=False)
 
35
  MistralModel._model = AutoModelForCausalLM.from_pretrained(
36
  model_id,
37
  token=HUGGINGFACE_TOKEN,
38
+ torch_dtype=torch.float32,
 
39
  load_in_8bit=True # Use 8-bit quantization for memory efficiency
40
  )
41
 
42
+ print("TinyGPT2Model loaded successfully!")
43
 
44
  def generate(
45
  self,