Arjunvir Singh committed on
Commit
de03f34
·
1 Parent(s): 31ea79c

Lower @spaces.GPU duration from 180/120 to 60 (ZeroGPU max-duration cap)

Browse files
zsgdp/benchmarks/embedding_retriever.py CHANGED
@@ -41,7 +41,7 @@ from zsgdp.schema import Chunk
41
  Embedder = Callable[[list[str]], list[list[float]]]
42
 
43
 
44
- @zero_gpu_slot(duration=180)
45
  def _gpu_encode_batch(model_id: str, task: str | None, texts: list[str]) -> list[list[float]]:
46
  """Load a sentence-transformers model and encode `texts` under a ZeroGPU slot.
47
 
 
41
  Embedder = Callable[[list[str]], list[list[float]]]
42
 
43
 
44
+ @zero_gpu_slot(duration=60)
45
  def _gpu_encode_batch(model_id: str, task: str | None, texts: list[str]) -> list[list[float]]:
46
  """Load a sentence-transformers model and encode `texts` under a ZeroGPU slot.
47
 
zsgdp/gpu/transformers_client.py CHANGED
@@ -19,7 +19,7 @@ from zsgdp.gpu.worker_prompts import prompt_for_task
19
  from zsgdp.gpu.zero_gpu import gpu as zero_gpu_slot
20
 
21
 
22
- @zero_gpu_slot(duration=120)
23
  def _gpu_run_pipeline(
24
  model_id: str,
25
  pipeline_task: str,
 
19
  from zsgdp.gpu.zero_gpu import gpu as zero_gpu_slot
20
 
21
 
22
+ @zero_gpu_slot(duration=60)
23
  def _gpu_run_pipeline(
24
  model_id: str,
25
  pipeline_task: str,