QomSSLab committed on
Commit
9e2ebbc
·
verified ·
1 Parent(s): f36dcf6

Add training logs and README

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -70,7 +70,7 @@
70
  "num_attention_heads": 16,
71
  "num_hidden_layers": 48,
72
  "num_key_value_heads": 8,
73
- "pad_token_id": 0,
74
  "query_pre_attn_scalar": 256,
75
  "rms_norm_eps": 1e-06,
76
  "rope_local_base_freq": 10000.0,
@@ -81,6 +81,6 @@
81
  "rope_theta": 1000000.0,
82
  "sliding_window": 1024,
83
  "transformers_version": "4.56.0",
84
- "use_cache": true,
85
  "vocab_size": 262208
86
  }
 
70
  "num_attention_heads": 16,
71
  "num_hidden_layers": 48,
72
  "num_key_value_heads": 8,
73
+ "pad_token_id": 1,
74
  "query_pre_attn_scalar": 256,
75
  "rms_norm_eps": 1e-06,
76
  "rope_local_base_freq": 10000.0,
 
81
  "rope_theta": 1000000.0,
82
  "sliding_window": 1024,
83
  "transformers_version": "4.56.0",
84
+ "use_cache": false,
85
  "vocab_size": 262208
86
  }