Bruno7 committed on
Commit
467379f
·
verified ·
1 Parent(s): e3b9770

Upload ASR model - training_info.json (sanitized)

Browse files
Files changed (1) hide show
  1. training_info.json +55 -0
training_info.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "phase": 2,
3
+ "total_samples": 39857,
4
+ "saudi_samples": 11578,
5
+ "saudi_percentage": 29.0488496374539,
6
+ "estimated_cost": 13.275,
7
+ "final_wer": 141.16402945323517,
8
+ "config": {
9
+ "model_name": "openai/whisper-large-v3-turbo",
10
+ "max_duration_in_seconds": 30.0,
11
+ "min_duration_in_seconds": 0.5,
12
+ "lora_r": 64,
13
+ "lora_alpha": 128,
14
+ "lora_dropout": 0.1,
15
+ "target_modules": [
16
+ "q_proj",
17
+ "k_proj",
18
+ "v_proj",
19
+ "out_proj",
20
+ "fc1",
21
+ "fc2"
22
+ ],
23
+ "per_device_train_batch_size": 32,
24
+ "per_device_eval_batch_size": 2,
25
+ "gradient_accumulation_steps": 1,
26
+ "num_train_epochs": 1.0,
27
+ "learning_rate": 0.0001,
28
+ "warmup_ratio": 0.1,
29
+ "weight_decay": 0.01,
30
+ "dataloader_num_workers": 8,
31
+ "dataloader_pin_memory": true,
32
+ "gradient_checkpointing": true,
33
+ "fp16": true,
34
+ "fp16_full_eval": true,
35
+ "eval_steps": 200,
36
+ "save_steps": 200,
37
+ "logging_steps": 50,
38
+ "saudi_oversample_factor": 2.0,
39
+ "output_dir": "./whisper-arabic-saudi",
40
+ "hub_model_id": "whisper-large-v3-turbo-arabic-saudi",
41
+ "hf_token": "[REDACTED_TOKEN]",
42
+ "phase1_hours": 10,
43
+ "phase2_hours": 200,
44
+ "sada_local_dir": "/data/sada_audio_files/"
45
+ },
46
+ "_security_notice": {
47
+ "message": "Sensitive credentials have been automatically redacted for security",
48
+ "redacted_patterns": [
49
+ "huggingface_tokens",
50
+ "api_keys",
51
+ "access_tokens"
52
+ ],
53
+ "sanitized_at": "2025-06-11T10:33:24Z"
54
+ }
55
+ }