Irvollo committed on
Commit
9728ed8
·
verified ·
1 Parent(s): 3689a34

Upload folder using huggingface_hub

Browse files
chat_template.jinja ADDED
@@ -0,0 +1 @@
 
 
1
+ {{ bos_token }}{% for message in messages %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + '[/INST]' }}{% elif message['role'] == 'system' %}{{ '[SYSTEM_PROMPT] ' + message['content'] + '[/SYSTEM_PROMPT]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + eos_token }}{% else %}{{ raise_exception('Only user, system and assistant roles are supported!') }}{% endif %}{% endfor %}
config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MistralForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 1,
7
+ "dtype": "bfloat16",
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 12288,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 28672,
14
+ "max_position_embeddings": 131072,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 96,
17
+ "num_hidden_layers": 88,
18
+ "num_key_value_heads": 8,
19
+ "quantization_config": {
20
+ "config_groups": {
21
+ "group_0": {
22
+ "format": "float-quantized",
23
+ "input_activations": {
24
+ "actorder": null,
25
+ "block_structure": null,
26
+ "dynamic": true,
27
+ "group_size": null,
28
+ "num_bits": 8,
29
+ "observer": null,
30
+ "observer_kwargs": {},
31
+ "scale_dtype": null,
32
+ "strategy": "token",
33
+ "symmetric": true,
34
+ "type": "float",
35
+ "zp_dtype": null
36
+ },
37
+ "output_activations": null,
38
+ "targets": [
39
+ "Linear"
40
+ ],
41
+ "weights": {
42
+ "actorder": null,
43
+ "block_structure": null,
44
+ "dynamic": false,
45
+ "group_size": null,
46
+ "num_bits": 8,
47
+ "observer": "memoryless_minmax",
48
+ "observer_kwargs": {},
49
+ "scale_dtype": null,
50
+ "strategy": "channel",
51
+ "symmetric": true,
52
+ "type": "float",
53
+ "zp_dtype": null
54
+ }
55
+ }
56
+ },
57
+ "format": "float-quantized",
58
+ "global_compression_ratio": null,
59
+ "ignore": [
60
+ "lm_head"
61
+ ],
62
+ "kv_cache_scheme": null,
63
+ "quant_method": "compressed-tensors",
64
+ "quantization_status": "compressed",
65
+ "sparsity_config": {},
66
+ "transform_config": {},
67
+ "version": "0.14.0.1"
68
+ },
69
+ "rms_norm_eps": 1e-05,
70
+ "rope_theta": 1000000.0,
71
+ "sliding_window": null,
72
+ "tie_word_embeddings": false,
73
+ "transformers_version": "4.57.6",
74
+ "use_cache": true,
75
+ "vocab_size": 32768
76
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.57.6"
6
+ }
model-00001-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:972393d1bd13f56c13da3b8bb3457f901c72c7ec097b01a319ff309f51f266cb
3
+ size 4958398128
model-00002-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b979cd3f5dd580f97e11963743eaf16e2d1cc725f467820d8f3b1b264bc9832
3
+ size 4832680488
model-00003-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ececfc09fb3d7178c20e6aa6dd4977f50e83ec0c7cbd537a5a48abe104aaaa2
3
+ size 4857866304
model-00004-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44576ac674fba2e095fc82d830c4aef134ea3bb17a585a92733020f7a64d3986
3
+ size 4832680552
model-00005-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb5c222ab67ceb84bf8ca09699aa5fb602a4c8c5d0a2820495c8c9d78715e476
3
+ size 4857866352
model-00006-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17484658bd05868d99d81fa21d366984029458b2b0da159429d543ba2b86367c
3
+ size 4832680552
model-00007-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e12a01f15015dbd981089347feb64dd7f8f6e20fe6ddf756c622b0a0e831cb39
3
+ size 4857866352
model-00008-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2fad71a8bbf806155aee40100e3936c48887360c443f31f326ade3b4ba55d11
3
+ size 4832680552
model-00009-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c18173cf7f80c2ba64bbc7c925ba141e11fb73d7b00bdbfb6bef1b0c43273f8f
3
+ size 4857866352
model-00010-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4af3ab98046f3e163ee2bd25f6d993a06ad4560b85943e627a1e74c185f7da1
3
+ size 4832680552
model-00011-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd9ff8969dd14c40cf344ce86d778c8dae7069c7269bd38fafe4bc40292d014e
3
+ size 4857866352
model-00012-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af013e9397ceebcf55a4044997c709f12128db81c498adcfb99a67807c7cf03c
3
+ size 4832680552
model-00013-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b22575391a302f906f425bf73ddef296d88e86fe868f01df9af4ad082dca9e72
3
+ size 4857866352
model-00014-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8053e2c113ce600b97f302c1ca15ab6d21da0c8289bf2ba5fd4dcdaed758741f
3
+ size 4832680552
model-00015-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da1ed2015e925ace27a278bfbf48e4c61aa8de671910d743bd248a683b1fc1e8
3
+ size 4857866352
model-00016-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e863c1e8ce63a224b7b0cb669628a54c27aa1684f67532a659b03341eb0f1d3
3
+ size 4832680552
model-00017-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79993590818106fefb119184c1b14a87d20bbaf0bbdfd13dbd2be8d501d17f02
3
+ size 4857866352
model-00018-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b437ccde918a57dad84788a1482902330d2f8e39a17869df76947072b8716e09
3
+ size 4832680552
model-00019-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eaae28ec72772d4d0969148eabee94c4ba0ec9ea919b792c08a7593e4058951
3
+ size 4857866352
model-00020-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d81ccfc35fa94d4b0119baca3d623dbde7c789a1cfe5139e3f7c9cd50f47632
3
+ size 4832680552
model-00021-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b1c9d654be0fed88184096d13249aba78a9b67fdb83bc425dd088b5c371d02
3
+ size 4857866352
model-00022-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a5f2de030bf279565831dad146fa000d33b50cb3689fb04967b466cede9a82b
3
+ size 4832680552
model-00023-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c74894fd5ce5fb0d5fec12e67d7a1c95fb83a2e5bb597799f3836ad14655f0
3
+ size 4857866352
model-00024-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4742ceb91259570902a29b496a3da22d65220c3f0b7e6beb8190046d49f48931
3
+ size 4832680552
model-00025-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:954065752bc7e0c8d39543b20b61c8419d63df5e866ebcb3c5b7c5ff0a814365
3
+ size 4857866352
model-00026-of-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dcf1aac0e1df87ae9cfff3cb3754acc8632a81b895b62638927aefd743b0686
3
+ size 2189695048
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
recipe.yaml ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ default_stage:
2
+ default_modifiers:
3
+ QuantizationModifier:
4
+ targets: [Linear]
5
+ ignore: [lm_head]
6
+ scheme: FP8_DYNAMIC
7
+ bypass_divisibility_checks: false
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff