saemstunes committed on
Commit
9247f0a
·
verified ·
1 Parent(s): 563e7c0

Update config/production.yml

Browse files
Files changed (1) hide show
  1. config/production.yml +37 -3
config/production.yml CHANGED
@@ -1,16 +1,26 @@
1
  environment: production
 
2
  model:
3
  name: microsoft/Phi-3.5-mini-instruct
4
  quantization: Q4_K_M
5
  context_length: 4096
 
6
 
7
  api:
8
  rate_limiting:
9
  enabled: true
10
  requests_per_minute: 60
 
11
  security:
12
  input_sanitization: true
13
  suspicious_pattern_detection: true
 
 
 
 
 
 
 
14
 
15
  monitoring:
16
  enabled: true
@@ -18,14 +28,38 @@ monitoring:
18
  - response_time
19
  - error_rate
20
  - system_resources
 
 
21
  alerts:
22
- - high_error_rate
23
- - slow_response
 
 
 
 
 
 
 
 
24
 
25
  supabase:
26
  max_retries: 3
27
  timeout: 30
 
28
 
29
  caching:
30
  enabled: true
31
- ttl: 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  environment: production
2
+
3
  model:
4
  name: microsoft/Phi-3.5-mini-instruct
5
  quantization: Q4_K_M
6
  context_length: 4096
7
+ max_response_length: 500
8
 
9
  api:
10
  rate_limiting:
11
  enabled: true
12
  requests_per_minute: 60
13
+ burst_capacity: 10
14
  security:
15
  input_sanitization: true
16
  suspicious_pattern_detection: true
17
+ max_input_length: 10000
18
+ cors:
19
+ allowed_origins:
20
+ - "https://www.saemstunes.com"
21
+ - "https://saemstunes.com"
22
+ allowed_methods: ["GET", "POST", "OPTIONS"]
23
+ allowed_headers: ["*"]
24
 
25
  monitoring:
26
  enabled: true
 
28
  - response_time
29
  - error_rate
30
  - system_resources
31
+ - user_activity
32
+ - model_performance
33
  alerts:
34
+ - high_error_rate:
35
+ threshold: 5%
36
+ duration: 5m
37
+ - slow_response:
38
+ threshold: 10s
39
+ duration: 2m
40
+ - system_overload:
41
+ cpu_threshold: 80%
42
+ memory_threshold: 90%
43
+ duration: 5m
44
 
45
  supabase:
46
  max_retries: 3
47
  timeout: 30
48
+ connection_pool_size: 10
49
 
50
  caching:
51
  enabled: true
52
+ ttl: 300
53
+ max_size: 1000
54
+
55
+ logging:
56
+ level: INFO
57
+ format: json
58
+ file_rotation: "10 MB"
59
+ max_files: 5
60
+
61
+ deployment:
62
+ primary: "huggingface_spaces"
63
+ backup: "railway"
64
+ health_check_interval: 30
65
+ auto_restart: true