WendyHoang committed on
Commit
f731132
·
verified ·
1 Parent(s): 9570b8d

Add DeepSeek-14B checkpoints

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff.
Files changed (50) hide show
  1. fake-name-fake-cities/deepseek-12/README.md +7 -0
  2. fake-name-fake-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  3. fake-name-fake-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  4. fake-name-fake-cities/deepseek-12/expert_1.ckpt +3 -0
  5. fake-name-fake-cities/deepseek-12/expert_1.meta +0 -0
  6. fake-name-fake-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  7. fake-name-fake-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  8. fake-name-fake-cities/deepseek-12/expert_2.ckpt +3 -0
  9. fake-name-fake-cities/deepseek-12/expert_2.meta +0 -0
  10. fake-name-fake-cities/deepseek-123/README.md +7 -0
  11. fake-name-fake-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  12. fake-name-fake-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  13. fake-name-fake-cities/deepseek-123/expert_1.ckpt +3 -0
  14. fake-name-fake-cities/deepseek-123/expert_1.meta +0 -0
  15. fake-name-fake-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  16. fake-name-fake-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  17. fake-name-fake-cities/deepseek-123/expert_2.ckpt +3 -0
  18. fake-name-fake-cities/deepseek-123/expert_2.meta +0 -0
  19. fake-name-fake-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  20. fake-name-fake-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  21. fake-name-fake-cities/deepseek-123/expert_3.ckpt +3 -0
  22. fake-name-fake-cities/deepseek-123/expert_3.meta +0 -0
  23. fake-name-fake-cities/deepseek-mix/README.md +7 -0
  24. fake-name-fake-cities/deepseek-mix/expert_mix.ckpt +3 -0
  25. fake-name-fake-cities/deepseek-mix/expert_mix.meta +0 -0
  26. fake-name-real-cities/deepseek-12/README.md +7 -0
  27. fake-name-real-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  28. fake-name-real-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  29. fake-name-real-cities/deepseek-12/expert_1.ckpt +3 -0
  30. fake-name-real-cities/deepseek-12/expert_1.meta +0 -0
  31. fake-name-real-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  32. fake-name-real-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  33. fake-name-real-cities/deepseek-12/expert_2.ckpt +3 -0
  34. fake-name-real-cities/deepseek-12/expert_2.meta +0 -0
  35. fake-name-real-cities/deepseek-123/README.md +7 -0
  36. fake-name-real-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  37. fake-name-real-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  38. fake-name-real-cities/deepseek-123/expert_1.ckpt +3 -0
  39. fake-name-real-cities/deepseek-123/expert_1.meta +0 -0
  40. fake-name-real-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  41. fake-name-real-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  42. fake-name-real-cities/deepseek-123/expert_2.ckpt +3 -0
  43. fake-name-real-cities/deepseek-123/expert_2.meta +0 -0
  44. fake-name-real-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin +3 -0
  45. fake-name-real-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin +3 -0
  46. fake-name-real-cities/deepseek-123/expert_3.ckpt +3 -0
  47. fake-name-real-cities/deepseek-123/expert_3.meta +0 -0
  48. fake-name-real-cities/deepseek-mix/README.md +7 -0
  49. fake-name-real-cities/deepseek-mix/expert_mix.ckpt +3 -0
  50. fake-name-real-cities/deepseek-mix/expert_mix.meta +0 -0
fake-name-fake-cities/deepseek-12/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_1 | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-fake-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 17:11:38
7
+
fake-name-fake-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32988b9cef54560664aca08cc4aae2665664afa329dd0f8f3fc8822ec1cd85ca
3
+ size 10144
fake-name-fake-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c187952dadc93fd48110923d10a29fa2c2b8cea82501bc1a98c9ffd92c86a6cd
3
+ size 5934752
fake-name-fake-cities/deepseek-12/expert_1.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d2da703b5e5a7d78c626ac42cf2f959df3a961b4af1bb3e9408758b8b6f111
3
+ size 100785138
fake-name-fake-cities/deepseek-12/expert_1.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-fake-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:897e4679f7ecafa444c4e375352a1e6ce588c401ddfa497c39c8a534e61e005f
3
+ size 10144
fake-name-fake-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d3a1177a3f172dc7d12ee31a1095def6d53f14267fe920fe4da8ae924dda94c
3
+ size 5931040
fake-name-fake-cities/deepseek-12/expert_2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c3265d68f6d31e3eb213dfceeb9eab1f819770865867e081507237e01867475
3
+ size 100785138
fake-name-fake-cities/deepseek-12/expert_2.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-fake-cities/deepseek-123/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_1 | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-fake-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 17:11:38
7
+
fake-name-fake-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32988b9cef54560664aca08cc4aae2665664afa329dd0f8f3fc8822ec1cd85ca
3
+ size 10144
fake-name-fake-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c187952dadc93fd48110923d10a29fa2c2b8cea82501bc1a98c9ffd92c86a6cd
3
+ size 5934752
fake-name-fake-cities/deepseek-123/expert_1.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d2da703b5e5a7d78c626ac42cf2f959df3a961b4af1bb3e9408758b8b6f111
3
+ size 100785138
fake-name-fake-cities/deepseek-123/expert_1.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-fake-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:897e4679f7ecafa444c4e375352a1e6ce588c401ddfa497c39c8a534e61e005f
3
+ size 10144
fake-name-fake-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d3a1177a3f172dc7d12ee31a1095def6d53f14267fe920fe4da8ae924dda94c
3
+ size 5931040
fake-name-fake-cities/deepseek-123/expert_2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c3265d68f6d31e3eb213dfceeb9eab1f819770865867e081507237e01867475
3
+ size 100785138
fake-name-fake-cities/deepseek-123/expert_2.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-fake-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0593aa4d474e905ef4f68875bb1f653630669d00f057d5cf7141307ff2b10e2a
3
+ size 10144
fake-name-fake-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0436659f8f18404bafdeacf842000b11f172d425135b3741a8e36f7a43e551f0
3
+ size 5932384
fake-name-fake-cities/deepseek-123/expert_3.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae6b97769c4631551ce303fd5226d9f10c3904cf347eb5ae8949d487e1b88112
3
+ size 100785138
fake-name-fake-cities/deepseek-123/expert_3.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-fake-cities/deepseek-mix/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_mix | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-fake-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 17:42:30
7
+
fake-name-fake-cities/deepseek-mix/expert_mix.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3c391e98adc03a4dd34c652069458e1126bdffe3911927ced98a760f437e768
3
+ size 100785138
fake-name-fake-cities/deepseek-mix/expert_mix.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-12/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_1 | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-real-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 19:24:16
7
+
fake-name-real-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41bf5f56c2cee78a050f4a1b03b17f073e75d8684507e4ee30819448f8ac80fb
3
+ size 10144
fake-name-real-cities/deepseek-12/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55a83c525fc91485b645252ebec1d657772f3dd5af56a90f245c410a058aae1b
3
+ size 5932832
fake-name-real-cities/deepseek-12/expert_1.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12235bd6df617f4c3b1d1f6bd66b950ac6f71b209d608895b68ddd8079b5743e
3
+ size 100785138
fake-name-real-cities/deepseek-12/expert_1.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a06e77c13e47eacbe5dcccfba9f3b87f406dbc285026e7699e303ebf2d05f40
3
+ size 10144
fake-name-real-cities/deepseek-12/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77110a5c9eb2e7eda478e87467bd2292fcd6f151466aff467a22d8d2a79dc236
3
+ size 5937376
fake-name-real-cities/deepseek-12/expert_2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23de76991e5f5d47f1e03567202ab338862cbb9d77812263cf413e54d1a16ddf
3
+ size 100785138
fake-name-real-cities/deepseek-12/expert_2.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-123/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_1 | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-real-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 19:24:16
7
+
fake-name-real-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41bf5f56c2cee78a050f4a1b03b17f073e75d8684507e4ee30819448f8ac80fb
3
+ size 10144
fake-name-real-cities/deepseek-123/expert_1.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55a83c525fc91485b645252ebec1d657772f3dd5af56a90f245c410a058aae1b
3
+ size 5932832
fake-name-real-cities/deepseek-123/expert_1.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12235bd6df617f4c3b1d1f6bd66b950ac6f71b209d608895b68ddd8079b5743e
3
+ size 100785138
fake-name-real-cities/deepseek-123/expert_1.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a06e77c13e47eacbe5dcccfba9f3b87f406dbc285026e7699e303ebf2d05f40
3
+ size 10144
fake-name-real-cities/deepseek-123/expert_2.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77110a5c9eb2e7eda478e87467bd2292fcd6f151466aff467a22d8d2a79dc236
3
+ size 5937376
fake-name-real-cities/deepseek-123/expert_2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23de76991e5f5d47f1e03567202ab338862cbb9d77812263cf413e54d1a16ddf
3
+ size 100785138
fake-name-real-cities/deepseek-123/expert_2.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_eigvals.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5d3cfd95807dd9df6c3773958b2aba7876bcfcf0b8de76819016be9dab530f9
3
+ size 10144
fake-name-real-cities/deepseek-123/expert_3.arrowconfig-a8327e21d374166ceeb94c40d2e7676f_vectors.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c1e85d6a4de4278db2e4cb932e09efbc0fa73c4c8caf30a6654665b9bf05801
3
+ size 5933728
fake-name-real-cities/deepseek-123/expert_3.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30310e934ac9524f6cb7da94d04a69379458016cd1d6914c8c3e5b56d5f54c42
3
+ size 100785138
fake-name-real-cities/deepseek-123/expert_3.meta ADDED
Binary file (4.83 kB). View file
 
fake-name-real-cities/deepseek-mix/README.md ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ Number of experts present in the library: 1
2
+
3
+ | Expert Name | Base Model | Trained on | Adapter Type |
4
+ | --- | --- | --- | --- |
5
+ | expert_mix | deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | hf://WendyHoang/two-hop-fake-names-real-cities-v0/two-hop | lora |
6
+ Last updated on: 2025-03-05 19:55:48
7
+
fake-name-real-cities/deepseek-mix/expert_mix.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71291f462880c26a0f8a69e953bdb5f0e22105dc0a6e5fee75cbe20726ba30fe
3
+ size 100785138
fake-name-real-cities/deepseek-mix/expert_mix.meta ADDED
Binary file (4.83 kB). View file