Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -32,7 +32,22 @@ logging.getLogger("httpx").setLevel(logging.WARNING)
|
|
| 32 |
logging.getLogger("gradio").setLevel(logging.WARNING)
|
| 33 |
# قفل عام لحماية الوصول إلى LLM/Agent داخل الخيوط
|
| 34 |
llama_lock = threading.Lock()
|
| 35 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
# تحقق من وجود توكن في متغير البيئة
|
| 37 |
HF_TOKEN = os.getenv("HF_TOKEN")
|
| 38 |
|
|
@@ -451,22 +466,7 @@ def gradio_interface():
|
|
| 451 |
# class DummyLLM:
|
| 452 |
# def __call__(self, *args, **kwargs):
|
| 453 |
# return ""
|
| 454 |
-
model_path = hf_hub_download(
|
| 455 |
-
repo_id="bartowski/Qwen2.5-14B-Instruct-GGUF",
|
| 456 |
-
filename="Qwen2.5-14B-Instruct-IQ4_XS.gguf",
|
| 457 |
-
)
|
| 458 |
|
| 459 |
-
llm = LlamaCpp(
|
| 460 |
-
model_path=model_path,
|
| 461 |
-
n_ctx=10000,
|
| 462 |
-
n_threads=os.cpu_count(),
|
| 463 |
-
n_gpu_layers=0,
|
| 464 |
-
f16_kv=True,
|
| 465 |
-
temperature=0.7,
|
| 466 |
-
top_p=0.7,
|
| 467 |
-
max_tokens=500,
|
| 468 |
-
verbose=False
|
| 469 |
-
)
|
| 470 |
tracer = None
|
| 471 |
if LANGSMITH_AVAILABLE and os.getenv("LANGSMITH_API_KEY"):
|
| 472 |
try:
|
|
|
|
| 32 |
logging.getLogger("gradio").setLevel(logging.WARNING)
|
| 33 |
# قفل عام لحماية الوصول إلى LLM/Agent داخل الخيوط
|
| 34 |
llama_lock = threading.Lock()
|
| 35 |
+
model_path = hf_hub_download(
|
| 36 |
+
repo_id="bartowski/Qwen2.5-14B-Instruct-GGUF",
|
| 37 |
+
filename="Qwen2.5-14B-Instruct-IQ4_XS.gguf",
|
| 38 |
+
)
|
| 39 |
+
|
| 40 |
+
llm = LlamaCpp(
|
| 41 |
+
model_path=model_path,
|
| 42 |
+
n_ctx=10000,
|
| 43 |
+
n_threads=os.cpu_count(),
|
| 44 |
+
n_gpu_layers=0,
|
| 45 |
+
f16_kv=True,
|
| 46 |
+
temperature=0.7,
|
| 47 |
+
top_p=0.7,
|
| 48 |
+
max_tokens=500,
|
| 49 |
+
verbose=False
|
| 50 |
+
)
|
| 51 |
# تحقق من وجود توكن في متغير البيئة
|
| 52 |
HF_TOKEN = os.getenv("HF_TOKEN")
|
| 53 |
|
|
|
|
| 466 |
# class DummyLLM:
|
| 467 |
# def __call__(self, *args, **kwargs):
|
| 468 |
# return ""
|
|
|
|
|
|
|
|
|
|
|
|
|
| 469 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 470 |
tracer = None
|
| 471 |
if LANGSMITH_AVAILABLE and os.getenv("LANGSMITH_API_KEY"):
|
| 472 |
try:
|