Spaces:
Running
Running
Update config/production.yml
Browse files- config/production.yml +37 -3
config/production.yml
CHANGED
|
@@ -1,16 +1,26 @@
|
|
| 1 |
environment: production
|
|
|
|
| 2 |
model:
|
| 3 |
name: microsoft/Phi-3.5-mini-instruct
|
| 4 |
quantization: Q4_K_M
|
| 5 |
context_length: 4096
|
|
|
|
| 6 |
|
| 7 |
api:
|
| 8 |
rate_limiting:
|
| 9 |
enabled: true
|
| 10 |
requests_per_minute: 60
|
|
|
|
| 11 |
security:
|
| 12 |
input_sanitization: true
|
| 13 |
suspicious_pattern_detection: true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
|
| 15 |
monitoring:
|
| 16 |
enabled: true
|
|
@@ -18,14 +28,38 @@ monitoring:
|
|
| 18 |
- response_time
|
| 19 |
- error_rate
|
| 20 |
- system_resources
|
|
|
|
|
|
|
| 21 |
alerts:
|
| 22 |
-
- high_error_rate
|
| 23 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
|
| 25 |
supabase:
|
| 26 |
max_retries: 3
|
| 27 |
timeout: 30
|
|
|
|
| 28 |
|
| 29 |
caching:
|
| 30 |
enabled: true
|
| 31 |
-
ttl: 300
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
environment: production
|
| 2 |
+
|
| 3 |
model:
|
| 4 |
name: microsoft/Phi-3.5-mini-instruct
|
| 5 |
quantization: Q4_K_M
|
| 6 |
context_length: 4096
|
| 7 |
+
max_response_length: 500
|
| 8 |
|
| 9 |
api:
|
| 10 |
rate_limiting:
|
| 11 |
enabled: true
|
| 12 |
requests_per_minute: 60
|
| 13 |
+
burst_capacity: 10
|
| 14 |
security:
|
| 15 |
input_sanitization: true
|
| 16 |
suspicious_pattern_detection: true
|
| 17 |
+
max_input_length: 10000
|
| 18 |
+
cors:
|
| 19 |
+
allowed_origins:
|
| 20 |
+
- "https://www.saemstunes.com"
|
| 21 |
+
- "https://saemstunes.com"
|
| 22 |
+
allowed_methods: ["GET", "POST", "OPTIONS"]
|
| 23 |
+
allowed_headers: ["*"]
|
| 24 |
|
| 25 |
monitoring:
|
| 26 |
enabled: true
|
|
|
|
| 28 |
- response_time
|
| 29 |
- error_rate
|
| 30 |
- system_resources
|
| 31 |
+
- user_activity
|
| 32 |
+
- model_performance
|
| 33 |
alerts:
|
| 34 |
+
- high_error_rate:
|
| 35 |
+
threshold: 5%
|
| 36 |
+
duration: 5m
|
| 37 |
+
- slow_response:
|
| 38 |
+
threshold: 10s
|
| 39 |
+
duration: 2m
|
| 40 |
+
- system_overload:
|
| 41 |
+
cpu_threshold: 80%
|
| 42 |
+
memory_threshold: 90%
|
| 43 |
+
duration: 5m
|
| 44 |
|
| 45 |
supabase:
|
| 46 |
max_retries: 3
|
| 47 |
timeout: 30
|
| 48 |
+
connection_pool_size: 10
|
| 49 |
|
| 50 |
caching:
|
| 51 |
enabled: true
|
| 52 |
+
ttl: 300
|
| 53 |
+
max_size: 1000
|
| 54 |
+
|
| 55 |
+
logging:
|
| 56 |
+
level: INFO
|
| 57 |
+
format: json
|
| 58 |
+
file_rotation: "10 MB"
|
| 59 |
+
max_files: 5
|
| 60 |
+
|
| 61 |
+
deployment:
|
| 62 |
+
primary: "huggingface_spaces"
|
| 63 |
+
backup: "railway"
|
| 64 |
+
health_check_interval: 30
|
| 65 |
+
auto_restart: true
|