neeleshg23 committed on
Commit
fac43fa
·
verified ·
1 Parent(s): 997a525

Training in progress, step 2500

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
  3. training_args.bin +3 -0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./checkpoint-10000",
3
  "architectures": [
4
  "MambaForCausalLM"
5
  ],
@@ -24,8 +24,8 @@
24
  "time_step_min": 0.001,
25
  "time_step_rank": 100,
26
  "time_step_scale": 1.0,
27
- "torch_dtype": "float32",
28
- "transformers_version": "4.41.1",
29
  "use_bias": false,
30
  "use_cache": true,
31
  "use_conv_bias": true,
 
1
  {
2
+ "_name_or_path": "neeleshg23/draft-mamba-4-1600",
3
  "architectures": [
4
  "MambaForCausalLM"
5
  ],
 
24
  "time_step_min": 0.001,
25
  "time_step_rank": 100,
26
  "time_step_scale": 1.0,
27
+ "torch_dtype": "bfloat16",
28
+ "transformers_version": "4.47.1",
29
  "use_bias": false,
30
  "use_cache": true,
31
  "use_conv_bias": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae6fe05d47f04f59f51b2da9ab04b460f5df52f41200c78383c923f094bde840
3
- size 463658944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c934472c3a06753d5254ae3b649afd095d7b7bfa3cd746e3c2cb0db8d783a43
3
+ size 232241360
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:248fbdad713297f54d9cb5336d3293ff25ab843df1f3ddac9ca486b51c34795c
3
+ size 5304