Update app.py
Browse files
app.py
CHANGED
|
@@ -2,9 +2,11 @@ import torch
|
|
| 2 |
from transformers import AutoTokenizer, AutoModelForCausalLM, TextStreamer, GenerationConfig, BitsAndBytesConfig
|
| 3 |
import gradio as gr
|
| 4 |
import os
|
| 5 |
-
|
| 6 |
# Authenticate using token from environment
|
| 7 |
hf_token = os.getenv("HF_TOKEN")
|
|
|
|
|
|
|
| 8 |
|
| 9 |
# Use quantization for low-memory GPU inference
|
| 10 |
quantization_config = BitsAndBytesConfig(
|
|
|
|
| 2 |
from transformers import AutoTokenizer, AutoModelForCausalLM, TextStreamer, GenerationConfig, BitsAndBytesConfig
|
| 3 |
import gradio as gr
|
| 4 |
import os
|
| 5 |
+
from huggingface_hub import login
|
| 6 |
# Authenticate using token from environment
|
| 7 |
hf_token = os.getenv("HF_TOKEN")
|
| 8 |
+
login(token=hf_token)
|
| 9 |
+
|
| 10 |
|
| 11 |
# Use quantization for low-memory GPU inference
|
| 12 |
quantization_config = BitsAndBytesConfig(
|