Keeby-smilyai committed on
Commit
73d6fa3
·
verified ·
1 Parent(s): 40116b8

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model.keras filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "sam1",
3
+ "architectures": [
4
+ "SAM1ForCausalLM"
5
+ ],
6
+ "vocab_size": 50259,
7
+ "max_position_embeddings": 1024,
8
+ "hidden_size": 768,
9
+ "num_hidden_layers": 16,
10
+ "num_attention_heads": 12,
11
+ "intermediate_size": 5376,
12
+ "hidden_act": "silu",
13
+ "rope_theta": 10000,
14
+ "rms_norm_eps": 1e-05,
15
+ "bos_token_id": 50256,
16
+ "eos_token_id": 50256,
17
+ "pad_token_id": 50256,
18
+ "auto_map": {
19
+ "AutoModel": "modeling_sam1.SAM1ForCausalLM"
20
+ },
21
+ "custom_tokens": [
22
+ "<think>",
23
+ "</think>"
24
+ ]
25
+ }
model.keras ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e6b3e2aef7e4434e4a065897c12d081e3ec1b43bac7f2f25e85bb2449c9306d
3
+ size 3758410976
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tokenizer_class": "GPT2Tokenizer",
3
+ "model_max_length": 1024,
4
+ "pad_token": "<|endoftext|>",
5
+ "eos_token": "<|endoftext|>",
6
+ "bos_token": "<|endoftext|>",
7
+ "unk_token": "<|endoftext|>",
8
+ "additional_special_tokens": [
9
+ "<think>",
10
+ "</think>"
11
+ ]
12
+ }
training_history.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ accuracy,loss,val_accuracy,val_loss
2
+ 0.9999410510063171,0.0007485541864298284,0.999991774559021,0.00012213260924909264