HippolyteP committed on
Commit
a1f1d10
·
1 Parent(s): 26c44b9

Push model using huggingface_hub.

Browse files
Files changed (2) hide show
  1. README.md +10 -3
  2. config.json +43 -0
README.md CHANGED
@@ -1,3 +1,10 @@
1
- ---
2
- license: cc-by-4.0
3
- ---
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Code: [More Information Needed]
9
+ - Paper: [More Information Needed]
10
+ - Docs: [More Information Needed]
config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bridge_args": {
3
+ "bridge_type": "mlp",
4
+ "hidden_dim": 2048,
5
+ "in_dim": 3072,
6
+ "out_dim": 4096
7
+ },
8
+ "embedder": null,
9
+ "embedder_args": {
10
+ "causal_embedder": false,
11
+ "compress_rates": [
12
+ -8
13
+ ],
14
+ "cont_tok": true,
15
+ "memory_tokens": 0,
16
+ "n_truncated_layers": 2,
17
+ "pooling_module": {
18
+ "pool_type": "mean_pooled_queries",
19
+ "where": "before"
20
+ },
21
+ "rec_tok": true,
22
+ "train_embedding_mtx": true,
23
+ "trained_layers": 27
24
+ },
25
+ "empty_init": 1,
26
+ "llms": [],
27
+ "model_args": {
28
+ "_sliding_window": null,
29
+ "dim": 3072,
30
+ "head_dim": 128,
31
+ "hidden_dim": 8192,
32
+ "max_batch_size": 1,
33
+ "model_type": "transformer",
34
+ "n_heads": 24,
35
+ "n_kv_heads": 8,
36
+ "n_layers": 28,
37
+ "non_parametric_norm": false,
38
+ "norm_eps": "1e-05",
39
+ "rope_theta": 500000.0,
40
+ "sliding_window": null,
41
+ "vocab_size": 128256
42
+ }
43
+ }