Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +200 -0
- model/params/lm_head/kernel/2.0 +3 -0
- model/params/lm_head/kernel/3.0 +3 -0
- model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/0/self_attn/o_proj/kernel/0.1 +3 -0
- model/params/model/language_model/layers/10/mlp/down_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/10/self_attn/k_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.1 +3 -0
- model/params/model/language_model/layers/10/self_attn/q_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/11/mlp/down_proj/kernel/0.3 +3 -0
- model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/11/self_attn/o_proj/kernel/0.2 +3 -0
- model/params/model/language_model/layers/11/self_attn/v_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/k_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/k_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/k_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/q_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/q_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/v_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/v_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/v_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/12/self_attn/v_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.2 +3 -0
- model/params/model/language_model/layers/13/self_attn/k_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/k_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/k_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/k_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.1 +3 -0
- model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.2 +3 -0
- model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.3 +3 -0
- model/params/model/language_model/layers/13/self_attn/q_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/q_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/q_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/q_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/v_proj/kernel/2.0 +3 -0
- model/params/model/language_model/layers/13/self_attn/v_proj/kernel/3.0 +3 -0
- model/params/model/language_model/layers/14/mlp/down_proj/kernel/0.2 +3 -0
- model/params/model/language_model/layers/14/mlp/gate_up_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/14/self_attn/k_proj/kernel/1.0 +3 -0
- model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.0 +3 -0
- model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.1 +3 -0
- model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.2 +3 -0
- model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.3 +3 -0
.gitattributes
CHANGED
|
@@ -536,3 +536,203 @@ model/params/model/language_model/layers/18/self_attn/k_proj/kernel/2.0 filter=l
|
|
| 536 |
model/params/model/language_model/layers/0/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 537 |
model/params/lm_head/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 538 |
model/params/model/language_model/layers/1/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 536 |
model/params/model/language_model/layers/0/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 537 |
model/params/lm_head/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 538 |
model/params/model/language_model/layers/1/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 539 |
+
model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 540 |
+
model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 541 |
+
model/params/model/language_model/layers/14/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 542 |
+
model/params/model/language_model/layers/16/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 543 |
+
model/params/model/language_model/layers/10/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 544 |
+
model/params/model/language_model/layers/11/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 545 |
+
model/params/model/language_model/layers/37/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 546 |
+
model/params/model/language_model/layers/4/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 547 |
+
model/params/model/language_model/layers/37/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 548 |
+
model/params/model/language_model/layers/37/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 549 |
+
model/params/model/language_model/layers/36/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 550 |
+
model/params/model/language_model/layers/37/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 551 |
+
model/params/model/language_model/layers/37/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 552 |
+
model/params/model/language_model/layers/6/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 553 |
+
model/params/model/language_model/layers/37/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 554 |
+
model/params/model/language_model/layers/39/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 555 |
+
model/params/model/language_model/layers/36/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 556 |
+
model/params/model/language_model/layers/7/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 557 |
+
model/params/model/language_model/layers/37/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 558 |
+
model/params/model/language_model/layers/4/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 559 |
+
model/params/model/language_model/layers/38/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 560 |
+
model/params/model/language_model/layers/36/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 561 |
+
model/params/model/language_model/layers/37/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 562 |
+
model/params/model/language_model/layers/36/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 563 |
+
model/params/model/language_model/layers/36/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 564 |
+
model/params/model/language_model/layers/35/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 565 |
+
model/params/model/language_model/layers/36/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 566 |
+
model/params/model/language_model/layers/35/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 567 |
+
model/params/model/language_model/layers/39/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 568 |
+
model/params/model/language_model/layers/6/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 569 |
+
model/params/model/language_model/layers/7/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 570 |
+
model/params/model/language_model/layers/38/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 571 |
+
model/params/model/language_model/layers/36/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 572 |
+
model/params/model/language_model/layers/39/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 573 |
+
model/params/model/language_model/layers/37/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 574 |
+
model/params/model/language_model/layers/36/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 575 |
+
model/params/model/language_model/layers/38/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 576 |
+
model/params/model/language_model/layers/5/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 577 |
+
model/params/model/language_model/layers/36/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 578 |
+
model/params/model/language_model/layers/36/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 579 |
+
model/params/model/language_model/layers/38/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 580 |
+
model/params/model/language_model/layers/7/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 581 |
+
model/params/model/language_model/layers/6/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 582 |
+
model/params/model/language_model/layers/38/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 583 |
+
model/params/model/language_model/layers/5/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 584 |
+
model/params/model/language_model/layers/36/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 585 |
+
model/params/model/language_model/layers/5/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 586 |
+
model/params/model/language_model/layers/6/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 587 |
+
model/params/model/language_model/layers/39/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 588 |
+
model/params/model/language_model/layers/36/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 589 |
+
model/params/model/language_model/layers/35/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 590 |
+
model/params/model/language_model/layers/38/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 591 |
+
model/params/model/language_model/layers/35/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 592 |
+
model/params/model/language_model/layers/5/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 593 |
+
model/params/model/language_model/layers/36/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 594 |
+
model/params/model/language_model/layers/35/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 595 |
+
model/params/model/language_model/layers/35/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 596 |
+
model/params/model/language_model/layers/35/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 597 |
+
model/params/model/language_model/layers/36/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 598 |
+
model/params/model/language_model/layers/34/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 599 |
+
model/params/model/language_model/layers/36/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 600 |
+
model/params/model/language_model/layers/4/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 601 |
+
model/params/model/language_model/layers/38/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 602 |
+
model/params/model/language_model/layers/35/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 603 |
+
model/params/model/language_model/layers/35/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 604 |
+
model/params/model/language_model/layers/34/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 605 |
+
model/params/model/language_model/layers/37/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 606 |
+
model/params/model/language_model/layers/11/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 607 |
+
model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 608 |
+
model/params/model/language_model/layers/16/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 609 |
+
model/params/lm_head/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 610 |
+
model/params/model/language_model/layers/14/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 611 |
+
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 612 |
+
model/params/model/language_model/layers/17/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 613 |
+
model/params/model/language_model/layers/19/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 614 |
+
model/params/model/language_model/layers/14/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 615 |
+
model/params/model/language_model/layers/17/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 616 |
+
model/params/model/language_model/layers/17/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 617 |
+
model/params/model/language_model/layers/14/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 618 |
+
model/params/model/language_model/layers/13/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 619 |
+
model/params/model/language_model/layers/19/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 620 |
+
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 621 |
+
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 622 |
+
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 623 |
+
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 624 |
+
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 625 |
+
model/params/model/language_model/layers/19/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 626 |
+
model/params/model/language_model/layers/13/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 627 |
+
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 628 |
+
model/params/model/language_model/layers/14/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 629 |
+
model/params/model/language_model/layers/14/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 630 |
+
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 631 |
+
model/params/model/language_model/layers/16/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 632 |
+
model/params/model/language_model/layers/16/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 633 |
+
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 634 |
+
model/params/model/language_model/layers/15/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 635 |
+
model/params/model/language_model/layers/14/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 636 |
+
model/params/model/language_model/layers/17/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 637 |
+
model/params/model/language_model/layers/19/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 638 |
+
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 639 |
+
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 640 |
+
model/params/model/language_model/layers/15/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 641 |
+
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 642 |
+
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 643 |
+
model/params/model/language_model/layers/18/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 644 |
+
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 645 |
+
model/params/model/language_model/layers/15/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 646 |
+
model/params/model/language_model/layers/16/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 647 |
+
model/params/model/language_model/layers/18/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 648 |
+
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 649 |
+
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 650 |
+
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 651 |
+
model/params/model/language_model/layers/16/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 652 |
+
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 653 |
+
model/params/model/language_model/layers/15/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 654 |
+
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 655 |
+
model/params/model/language_model/layers/12/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 656 |
+
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 657 |
+
model/params/model/language_model/layers/18/mlp/gate_up_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 658 |
+
model/params/model/language_model/layers/11/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 659 |
+
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 660 |
+
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 661 |
+
model/params/model/language_model/layers/18/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 662 |
+
model/params/model/language_model/layers/17/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 663 |
+
model/params/model/language_model/layers/14/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 664 |
+
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 665 |
+
model/params/model/language_model/layers/12/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 666 |
+
model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 667 |
+
model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 668 |
+
model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 669 |
+
model/params/lm_head/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 670 |
+
model/params/model/language_model/layers/10/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 671 |
+
model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 672 |
+
model/params/model/language_model/layers/10/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 673 |
+
model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 674 |
+
model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 675 |
+
model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 676 |
+
model/params/model/language_model/layers/0/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 677 |
+
model/params/model/language_model/layers/7/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 678 |
+
model/params/model/language_model/layers/9/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 679 |
+
model/params/model/language_model/layers/8/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 680 |
+
model/params/model/language_model/layers/8/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 681 |
+
model/params/model/language_model/layers/9/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 682 |
+
model/params/model/language_model/layers/8/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 683 |
+
model/params/model/language_model/layers/8/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 684 |
+
model/params/model/language_model/layers/8/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 685 |
+
model/params/model/language_model/layers/7/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 686 |
+
model/params/model/language_model/layers/8/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 687 |
+
model/params/model/language_model/layers/8/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 688 |
+
model/params/model/language_model/layers/8/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 689 |
+
model/params/model/language_model/layers/7/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 690 |
+
model/params/model/language_model/layers/6/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 691 |
+
model/params/model/language_model/layers/8/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 692 |
+
model/params/model/language_model/layers/9/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 693 |
+
model/params/model/language_model/layers/8/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 694 |
+
model/params/model/language_model/layers/7/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 695 |
+
model/params/model/language_model/layers/7/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 696 |
+
model/params/model/language_model/layers/8/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 697 |
+
model/params/model/language_model/layers/6/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 698 |
+
model/params/model/language_model/layers/7/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 699 |
+
model/params/model/language_model/layers/7/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 700 |
+
model/params/model/language_model/layers/7/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 701 |
+
model/params/model/language_model/layers/8/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 702 |
+
model/params/model/language_model/layers/6/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 703 |
+
model/params/model/language_model/layers/8/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 704 |
+
model/params/model/language_model/layers/7/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 705 |
+
model/params/model/language_model/layers/6/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 706 |
+
model/params/model/language_model/layers/7/self_attn/k_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 707 |
+
model/params/model/language_model/layers/7/self_attn/k_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 708 |
+
model/params/model/language_model/layers/7/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 709 |
+
model/params/model/language_model/layers/6/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 710 |
+
model/params/model/language_model/layers/7/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 711 |
+
model/params/model/language_model/layers/6/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 712 |
+
model/params/model/language_model/layers/5/self_attn/v_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 713 |
+
model/params/model/language_model/layers/6/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 714 |
+
model/params/model/language_model/layers/7/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 715 |
+
model/params/model/language_model/layers/7/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 716 |
+
model/params/model/language_model/layers/7/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 717 |
+
model/params/model/language_model/layers/6/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 718 |
+
model/params/model/language_model/layers/6/self_attn/q_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 719 |
+
model/params/model/language_model/layers/6/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 720 |
+
model/params/model/language_model/layers/6/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 721 |
+
model/params/model/language_model/layers/6/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 722 |
+
model/params/model/language_model/layers/6/self_attn/q_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 723 |
+
model/params/model/language_model/layers/9/mlp/down_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 724 |
+
model/params/model/language_model/layers/9/mlp/down_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 725 |
+
model/params/model/language_model/layers/5/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 726 |
+
model/params/model/language_model/layers/5/self_attn/v_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
| 727 |
+
model/params/model/language_model/layers/6/self_attn/q_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
| 728 |
+
model/params/model/language_model/layers/9/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 729 |
+
model/params/model/language_model/layers/5/self_attn/k_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 730 |
+
model/params/model/language_model/layers/6/self_attn/o_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 731 |
+
model/params/model/language_model/layers/5/self_attn/v_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 732 |
+
model/params/model/language_model/layers/8/mlp/down_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
| 733 |
+
model/params/model/language_model/layers/5/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 734 |
+
model/params/model/language_model/layers/6/self_attn/o_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 735 |
+
model/params/model/language_model/layers/4/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 736 |
+
model/params/model/language_model/layers/9/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 737 |
+
model/params/model/language_model/layers/5/self_attn/o_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
| 738 |
+
model/params/model/language_model/layers/8/mlp/down_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
model/params/lm_head/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cebf323e63186c6e945c7873a01458fc7d7a3ba6a1e026f70ef89a00e60b800e
|
| 3 |
+
size 241620360
|
model/params/lm_head/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05cd759471ea280db8d58931cbb94d50398671e6a0bbf167aebc6c4f5a95f752
|
| 3 |
+
size 241396877
|
model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce5b86b23494f666dd55b72b3ebf778211958c8cf1564a4c112c79fce378cafb
|
| 3 |
+
size 43562759
|
model/params/model/language_model/layers/0/mlp/gate_up_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29bf11e6b40ddf7171159958b5e5bd795c1fc81a070c1c1b9c8c58d0b4606772
|
| 3 |
+
size 43571282
|
model/params/model/language_model/layers/0/self_attn/o_proj/kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dde8f978dffddc6a18f3927615bfdf28f1af35ca0666ee7048dc85c988ec9d42
|
| 3 |
+
size 6514382
|
model/params/model/language_model/layers/10/mlp/down_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2591f482366c7843e04efd756d0792cb617bc157fad864f58e5a1c0c67feb9a5
|
| 3 |
+
size 21760162
|
model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18f2aae6a48b2341feded0771a7d9ae0bb29c498af0147d2fbd132a908034f06
|
| 3 |
+
size 43505301
|
model/params/model/language_model/layers/10/mlp/gate_up_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccbf73c5aa9093e3ced76de5ebaf05c300e4be2119ba89a73876f4eef4a24a80
|
| 3 |
+
size 43506524
|
model/params/model/language_model/layers/10/self_attn/k_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71bdd4cf330766c10a748337a96b3d2f192f46a4d09b1a4231ca2218e9a48a8c
|
| 3 |
+
size 409753
|
model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad31c5f455007fa27eecda0b84923886ea4a4c8d0a2236b96eb83c86f2a04f8d
|
| 3 |
+
size 6511223
|
model/params/model/language_model/layers/10/self_attn/o_proj/kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93a92bf2a611fc6f2054223ff6efbd4ca9bc5a49eb116857a6f3fbfb2a810e65
|
| 3 |
+
size 6509895
|
model/params/model/language_model/layers/10/self_attn/q_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c35d30e9bec7739152cc3a2d780e82aea60e88029b626cac10fe7158fceb876
|
| 3 |
+
size 6527187
|
model/params/model/language_model/layers/11/mlp/down_proj/kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15b8fe1a5f83383339cf39ddee6bdf1919d64980b8705316a85fc157dbe97e60
|
| 3 |
+
size 21757047
|
model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2baccdd07e9a89dfb62ff920d652256ce453cd332dcc8f64d4b6510a37a90ab4
|
| 3 |
+
size 43508765
|
model/params/model/language_model/layers/11/mlp/gate_up_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:256f2f73cdf99c0cf7e5b2ac876e1ad98644b6c4c8fe09ac2d534bb9e5c0b079
|
| 3 |
+
size 43507014
|
model/params/model/language_model/layers/11/self_attn/o_proj/kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:291add5e0a9a5d18a60ebb6d21578c22fd15e283459061641c0ae931e1619f00
|
| 3 |
+
size 6510888
|
model/params/model/language_model/layers/11/self_attn/v_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c69921cb21159c782b59917f148c7764466dd9242425cf7a7f711c3fdd3eaf2
|
| 3 |
+
size 407011
|
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:716c9d34cf5f78f612449002e07c3b59093bc7a50a5b258c37e0ef124e92871b
|
| 3 |
+
size 409388
|
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e51b4bba00100ec613bcbb0fdea5fdfed55e05215d1870753ddc23511a70c673
|
| 3 |
+
size 409326
|
model/params/model/language_model/layers/12/self_attn/k_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4b9cdf6331406278a16201944898f47e2c0ba9a840172dd5422eb115741853c
|
| 3 |
+
size 409223
|
model/params/model/language_model/layers/12/self_attn/q_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bce86dd28a4b2b301ef5519ba8865b9a8b5d1a068d220a4f490ef2b4f728d1c
|
| 3 |
+
size 6530753
|
model/params/model/language_model/layers/12/self_attn/q_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11c82c91167ff78ffd1117b6842a50e415e6c16858b640f6a3218d95236ed06e
|
| 3 |
+
size 6532063
|
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd5f21b462007017a6c7529eb15510177a8cff7e946876864acbdbcc0e04404f
|
| 3 |
+
size 407032
|
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce339b60d60c10a113dee54d020b490fa45e2b797adf80d8e389d6bbb5b7baeb
|
| 3 |
+
size 407087
|
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af8b21d20ebd469a1c68c951bbd87fdb7bc97c5c99492461cda7bfd5d339ac19
|
| 3 |
+
size 407005
|
model/params/model/language_model/layers/12/self_attn/v_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b0186194113e906fa34bba0e68f32ac5abd4ec790d197a7d4dc484c01106730
|
| 3 |
+
size 406876
|
model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1838ee9bc1b0d0b631959b134c863053dca53a56a0b7bb1e11bd47b3b10f6764
|
| 3 |
+
size 21776179
|
model/params/model/language_model/layers/13/mlp/down_proj/kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:378df209680e55a9f4cb86e0a06f775f220a0e0c80e557f15dfe428541e464af
|
| 3 |
+
size 21769812
|
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0a5fc66bf1264150a96ca7b1224268c35737a45dcb98327fac57d21227b4f0b
|
| 3 |
+
size 409222
|
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f2bf48fc178d0e86bce380e78930e4e59417007a46ff9f886ea9054e3e4df99
|
| 3 |
+
size 408777
|
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6780fef95a21a56c737f5e51a3dd804e878617b17320db60a4e8cda8e7ddadb
|
| 3 |
+
size 408909
|
model/params/model/language_model/layers/13/self_attn/k_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81001fbdaf913d8ed1a55a187306fd42e6b9f1b8e090fe10d08685a2a05eb18b
|
| 3 |
+
size 409082
|
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f9065107e725048b5b6630df07e36801bba9bd47d9126dc45980f44f528980d
|
| 3 |
+
size 6514624
|
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c3a427f26354fad49b1eed770aab001f26e96ca11f5703c8c10c7c31feb77c4
|
| 3 |
+
size 6513391
|
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25144f1cf2598075381f78eae48a068cf4e04dddfb0abfcb67f240d2d77bb8d5
|
| 3 |
+
size 6512592
|
model/params/model/language_model/layers/13/self_attn/o_proj/kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f409374d598d761a61328e4b87f7f546cea0f59d639052e47a77fc3f136aade
|
| 3 |
+
size 6517081
|
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d99919a0f463b8b51e941be06b4ab6a58a89f776ac4769051dddf695271ed8b
|
| 3 |
+
size 6537147
|
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c111523d7db9146631f8e23d4923555a19c75ff91cb6c234e6119c6debd29c1b
|
| 3 |
+
size 6537824
|
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:194121ea50a1bee350b5530551165fba0c94a4673cace7b25c35346b23d914fe
|
| 3 |
+
size 6537326
|
model/params/model/language_model/layers/13/self_attn/q_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b44391ebc221927b88828c22e5fa02b63552ef0ac043847897ff3e6a8615ce5a
|
| 3 |
+
size 6537464
|
model/params/model/language_model/layers/13/self_attn/v_proj/kernel/2.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7501b389d911a400e0c7fdbf2bb66a3c6e5e3d39ed01b7b6680be0aee96d1580
|
| 3 |
+
size 406917
|
model/params/model/language_model/layers/13/self_attn/v_proj/kernel/3.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cf87e93c2d6171de703121b0a033287d6790b0cc5a51987169ce215cea438ee
|
| 3 |
+
size 407080
|
model/params/model/language_model/layers/14/mlp/down_proj/kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbac2c34ab33fece4afd84ec6d38f5079088efdaa4101f37c624029a9c28d770
|
| 3 |
+
size 21779877
|
model/params/model/language_model/layers/14/mlp/gate_up_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5268fb03e6b3fc1475288a5cf85c35b30c3a98451c7ffa543aae7502cf9531c8
|
| 3 |
+
size 43572251
|
model/params/model/language_model/layers/14/self_attn/k_proj/kernel/1.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d336e8d9a435633e4ba2205355bdd940c72b5f134bc244287c8eaa0a8dc53c77
|
| 3 |
+
size 409802
|
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ceb9dcf0d293e9ba96a63b239617acf2b8e89b0e7c3e7c3bc4377a0b148240d
|
| 3 |
+
size 6521579
|
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:521b3a06c6372c42af83418c8a43c8cfffe514b9b838f2d39b6d894c556c90be
|
| 3 |
+
size 6521793
|
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89440f0a0f9b6977c9100c14f24eafc4dcf81dc969d09f14b00b369fc66bb16b
|
| 3 |
+
size 6519535
|
model/params/model/language_model/layers/14/self_attn/o_proj/kernel/0.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8df1b33374f9035c828994bcf444c486e22c06740adb1595ee0c7c55e39ac08f
|
| 3 |
+
size 6521952
|