Update app.py
#1
by
Kh0128 - opened
app.py
CHANGED
|
@@ -7,13 +7,11 @@ Optimized for Hugging Face Spaces with lazy loading and fallbacks
|
|
| 7 |
import os
|
| 8 |
|
| 9 |
# Configure environment for CPU-only and memory optimization
|
| 10 |
-
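os.environ['…  # removed line truncated in extraction; presumably a CPU-only/CUDA device setting per the comment above — unverified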
|
| 11 |
-
os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'
|
| 12 |
os.environ['OMP_NUM_THREADS'] = '2' # Limit CPU threads
|
| 13 |
os.environ['MKL_NUM_THREADS'] = '2'
|
| 14 |
os.environ['NUMEXPR_NUM_THREADS'] = '2'
|
| 15 |
os.environ['TOKENIZERS_PARALLELISM'] = 'false' # Avoid tokenizer warnings
|
| 16 |
-
|
| 17 |
# Batchalign specific settings
|
| 18 |
os.environ['BATCHALIGN_CACHE'] = '/tmp/batchalign_cache'
|
| 19 |
os.environ['HF_HUB_CACHE'] = '/tmp/hf_cache' # Use tmp for model cache
|
|
|
|
| 7 |
import os
|
| 8 |
|
| 9 |
# Configure environment for CPU-only and memory optimization
|
| 10 |
+
os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:512'
|
|
|
|
| 11 |
os.environ['OMP_NUM_THREADS'] = '2' # Limit CPU threads
|
| 12 |
os.environ['MKL_NUM_THREADS'] = '2'
|
| 13 |
os.environ['NUMEXPR_NUM_THREADS'] = '2'
|
| 14 |
os.environ['TOKENIZERS_PARALLELISM'] = 'false' # Avoid tokenizer warnings
|
|
|
|
| 15 |
# Batchalign specific settings
|
| 16 |
os.environ['BATCHALIGN_CACHE'] = '/tmp/batchalign_cache'
|
| 17 |
os.environ['HF_HUB_CACHE'] = '/tmp/hf_cache' # Use tmp for model cache
|