ShabanEjupi
/

Chatbot-i

Safetensors

Model card Files Files and versions

xet

Community

ShabanEjupi committed on Feb 16, 2025

Commit

d9e9533

verified ·

1 Parent(s): 3194358

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -13

app.py CHANGED Viewed

@@ -6,13 +6,27 @@ def install(package):
     subprocess.check_call([sys.executable, "-m", "pip", "install", package])
 # Install dependencies
-install("transformers==4.34.0")
-install("torch==2.0.1+cu118")
-install("gradio==3.39.0")
-install("accelerate==0.23.0")
-install("bitsandbytes==0.41.1")
-install("sentencepiece==0.1.99")
-install("python-dotenv==1.0.0")
 from transformers import LlamaTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 import gradio as gr
@@ -25,26 +39,40 @@ import torch
 load_dotenv()
 # Log in to Hugging Face
-login(token=os.getenv("HUGGINGFACE_TOKEN"))
 # Model configuration
 model_name = "mistralai/Mistral-7B-v0.3"
-# Load tokenizer explicitly
 tokenizer = LlamaTokenizer.from_pretrained(model_name)
 # 4-bit quantization for better performance
 bnb_config = BitsAndBytesConfig(
-    load_in_4bit=True,
     bnb_4bit_quant_type="nf4",
-    bnb_4bit_compute_dtype="float16"
 )
 # Load model with optimized settings
 model = AutoModelForCausalLM.from_pretrained(
     model_name,
     quantization_config=bnb_config,
-    device_map="auto",
     torch_dtype=torch.float16
 )
@@ -70,4 +98,4 @@ gr.ChatInterface(
     title="Shërbimi i Konsumatorit",
     examples=["Si mund të rivendos fjalëkalimin?", "A e keni në dispozicion këtë produkt?"],
     cache_examples=True
-).launch(server_port=7860, share=True)

     subprocess.check_call([sys.executable, "-m", "pip", "install", package])
 # Install dependencies
+packages = [
+    "transformers==4.34.0",
+    "torch==2.0.1+cu118",
+    "gradio==3.39.0",
+    "accelerate==0.23.0",
+    "bitsandbytes==0.41.1",
+    "sentencepiece==0.1.99",
+    "python-dotenv==1.0.0"
+]
+for package in packages:
+    try:
+        install(package)
+    except Exception as e:
+        print(f"Failed to install {package}: {e}")
+# Install bitsandbytes from Test PyPI if needed
+try:
+    import bitsandbytes
+except ImportError:
+    install("bitsandbytes -i https://test.pypi.org/simple/")
 from transformers import LlamaTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 import gradio as gr
 load_dotenv()
 # Log in to Hugging Face
+huggingface_token = os.getenv("HUGGINGFACE_TOKEN")
+if huggingface_token:
+    login(token=huggingface_token)
+else:
+    raise ValueError("HUGGINGFACE_TOKEN is missing in .env file!")
 # Model configuration
 model_name = "mistralai/Mistral-7B-v0.3"
+# Load tokenizer
 tokenizer = LlamaTokenizer.from_pretrained(model_name)
+# Check if torch is correctly installed
+try:
+    assert torch.cuda.is_available(), "CUDA is not available. Install CUDA or use CPU mode."
+except AssertionError as e:
+    print(e)
+    print("Falling back to CPU mode.")
+    device_map = "cpu"
+else:
+    device_map = "auto"
 # 4-bit quantization for better performance
 bnb_config = BitsAndBytesConfig(
+    load_in_4bit=True,  # Change to load_in_8bit=True if needed
     bnb_4bit_quant_type="nf4",
+    bnb_4bit_compute_dtype=torch.float16
 )
 # Load model with optimized settings
 model = AutoModelForCausalLM.from_pretrained(
     model_name,
     quantization_config=bnb_config,
+    device_map=device_map,
     torch_dtype=torch.float16
 )
     title="Shërbimi i Konsumatorit",
     examples=["Si mund të rivendos fjalëkalimin?", "A e keni në dispozicion këtë produkt?"],
     cache_examples=True
+).launch(server_port=7860, share=True)