Mustafa-albakkar committed on
Commit
95fc3d5
·
verified ·
1 Parent(s): 01df69f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -16
app.py CHANGED
@@ -32,7 +32,22 @@ logging.getLogger("httpx").setLevel(logging.WARNING)
32
  logging.getLogger("gradio").setLevel(logging.WARNING)
33
  # ู‚ูู„ ุนุงู… ู„ุญู…ุงูŠุฉ ุงู„ูˆุตูˆู„ ุฅู„ู‰ LLM/Agent ุฏุงุฎู„ ุงู„ุฎูŠูˆุท
34
  llama_lock = threading.Lock()
35
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
  # تحقق من وجود توكن في متغير البيئة
37
  HF_TOKEN = os.getenv("HF_TOKEN")
38
 
@@ -451,22 +466,7 @@ def gradio_interface():
451
  # class DummyLLM:
452
  # def __call__(self, *args, **kwargs):
453
  # return ""
454
- model_path = hf_hub_download(
455
- repo_id="bartowski/Qwen2.5-14B-Instruct-GGUF",
456
- filename="Qwen2.5-14B-Instruct-IQ4_XS.gguf",
457
- )
458
 
459
- llm = LlamaCpp(
460
- model_path=model_path,
461
- n_ctx=10000,
462
- n_threads=os.cpu_count(),
463
- n_gpu_layers=0,
464
- f16_kv=True,
465
- temperature=0.7,
466
- top_p=0.7,
467
- max_tokens=500,
468
- verbose=False
469
- )
470
  tracer = None
471
  if LANGSMITH_AVAILABLE and os.getenv("LANGSMITH_API_KEY"):
472
  try:
 
32
  logging.getLogger("gradio").setLevel(logging.WARNING)
33
  # ู‚ูู„ ุนุงู… ู„ุญู…ุงูŠุฉ ุงู„ูˆุตูˆู„ ุฅู„ู‰ LLM/Agent ุฏุงุฎู„ ุงู„ุฎูŠูˆุท
34
  llama_lock = threading.Lock()
35
+ model_path = hf_hub_download(
36
+ repo_id="bartowski/Qwen2.5-14B-Instruct-GGUF",
37
+ filename="Qwen2.5-14B-Instruct-IQ4_XS.gguf",
38
+ )
39
+
40
+ llm = LlamaCpp(
41
+ model_path=model_path,
42
+ n_ctx=10000,
43
+ n_threads=os.cpu_count(),
44
+ n_gpu_layers=0,
45
+ f16_kv=True,
46
+ temperature=0.7,
47
+ top_p=0.7,
48
+ max_tokens=500,
49
+ verbose=False
50
+ )
51
  # تحقق من وجود توكن في متغير البيئة
52
  HF_TOKEN = os.getenv("HF_TOKEN")
53
 
 
466
  # class DummyLLM:
467
  # def __call__(self, *args, **kwargs):
468
  # return ""
 
 
 
 
469
 
 
 
 
 
 
 
 
 
 
 
 
470
  tracer = None
471
  if LANGSMITH_AVAILABLE and os.getenv("LANGSMITH_API_KEY"):
472
  try: