webpluging

Paused

ranamhamoud committed on Dec 23, 2024

Commit

9363edf

verified ·

1 Parent(s): 44a3700

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -36,7 +36,11 @@ def generate_image(text):
         logging.error("Failed to generate image: %s", str(error))
         raise gr.Error("An error occurred while generating the image. Please check your API key and try again.")
 # Constants
 MAX_MAX_NEW_TOKENS = 2048
@@ -63,7 +67,12 @@ if torch.cuda.is_available():
         bnb_4bit_quant_type="nf4",
         bnb_4bit_compute_dtype=torch.bfloat16
     )
-    base_model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", quantization_config=bnb_config)
     model = PeftModel.from_pretrained(base_model, "ranamhamoud/storytellai-2.0")
     tokenizer = AutoTokenizer.from_pretrained(model_id)
     tokenizer.pad_token = tokenizer.eos_token

         logging.error("Failed to generate image: %s", str(error))
         raise gr.Error("An error occurred while generating the image. Please check your API key and try again.")
+ rope_scaling = {
+    'type': 'linear',  # Adjust the type to the appropriate scaling type for your model.
+    'factor': 8.0      # Use the intended scaling factor.
+}
 # Constants
 MAX_MAX_NEW_TOKENS = 2048
         bnb_4bit_quant_type="nf4",
         bnb_4bit_compute_dtype=torch.bfloat16
     )
+base_model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    device_map="auto",
+    quantization_config=bnb_config,
+    rope_scaling=rope_scaling  # Add this only if your model specifically requires it.
+)
     model = PeftModel.from_pretrained(base_model, "ranamhamoud/storytellai-2.0")
     tokenizer = AutoTokenizer.from_pretrained(model_id)
     tokenizer.pad_token = tokenizer.eos_token