Medyassino commited on
Commit
08b3b04
·
verified ·
1 Parent(s): 59dc998

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. gpt_300m_hf_jsonl_sft/model_epoch_01.pt +3 -0
  2. gpt_300m_hf_jsonl_sft/model_epoch_02.pt +3 -0
  3. gpt_300m_hf_jsonl_sft/model_epoch_03.pt +3 -0
  4. gpt_300m_hf_jsonl_sft/model_epoch_04.pt +3 -0
  5. gpt_300m_hf_jsonl_sft/model_epoch_05.pt +3 -0
  6. gpt_300m_hf_jsonl_sft/model_epoch_06.pt +3 -0
  7. gpt_300m_hf_jsonl_sft/model_epoch_07.pt +3 -0
  8. gpt_300m_hf_jsonl_sft/model_epoch_08.pt +3 -0
  9. gpt_300m_hf_jsonl_sft/model_epoch_09.pt +3 -0
  10. gpt_300m_hf_jsonl_sft/model_epoch_10.pt +3 -0
  11. gpt_300m_hf_jsonl_sft/model_last.pt +3 -0
  12. gpt_300m_hf_jsonl_sft/tokenizer_32k/tokenizer.json +0 -0
  13. gpt_300m_hf_jsonl_sft/tokenizer_32k/tokenizer_config.json +9 -0
  14. gpt_300m_hf_jsonl_sft_fast/model_epoch_01.pt +3 -0
  15. gpt_300m_hf_jsonl_sft_fast/model_epoch_02.pt +3 -0
  16. gpt_300m_hf_jsonl_sft_fast/model_epoch_03.pt +3 -0
  17. gpt_300m_hf_jsonl_sft_fast/model_last.pt +3 -0
  18. gpt_300m_hf_jsonl_sft_fast/tokenizer_32k/tokenizer.json +0 -0
  19. gpt_300m_hf_jsonl_sft_fast/tokenizer_32k/tokenizer_config.json +9 -0
  20. gpt_300m_hf_jsonl_sft_v2/model_epoch_01.pt +3 -0
  21. gpt_300m_hf_jsonl_sft_v2/model_epoch_02.pt +3 -0
  22. gpt_300m_hf_jsonl_sft_v2/model_epoch_03.pt +3 -0
  23. gpt_300m_hf_jsonl_sft_v2/model_last.pt +3 -0
  24. gpt_300m_hf_jsonl_sft_v2/tokenizer_32k/tokenizer.json +0 -0
  25. gpt_300m_hf_jsonl_sft_v2/tokenizer_32k/tokenizer_config.json +9 -0
  26. nlp_1b_h100_2h/model.pt +3 -0
  27. nlp_1b_h100_2h/model_best.pt +3 -0
  28. nlp_1b_h100_2h/model_epoch_01.pt +3 -0
  29. nlp_1b_h100_2h/model_epoch_02.pt +3 -0
  30. nlp_1b_h100_2h/train_state.pt +3 -0
  31. nlp_1b_h100_ft_nlp_mix_10ep_8h/model.pt +3 -0
  32. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_best.pt +3 -0
  33. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_01.pt +3 -0
  34. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_02.pt +3 -0
  35. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_03.pt +3 -0
  36. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_04.pt +3 -0
  37. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_05.pt +3 -0
  38. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_06.pt +3 -0
  39. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_07.pt +3 -0
  40. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_08.pt +3 -0
  41. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_09.pt +3 -0
  42. nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_10.pt +3 -0
  43. nlp_1b_h100_ft_nlp_mix_10ep_8h/train_state.pt +3 -0
  44. nlp_1b_h100_ft_nlp_mix_modern/model.pt +3 -0
  45. nlp_1b_h100_ft_nlp_mix_modern/model_best.pt +3 -0
  46. nlp_1b_h100_ft_nlp_mix_modern/model_epoch_01.pt +3 -0
  47. nlp_1b_h100_ft_nlp_mix_modern/model_epoch_02.pt +3 -0
  48. nlp_1b_h100_ft_nlp_mix_modern/model_epoch_03.pt +3 -0
  49. nlp_1b_h100_ft_nlp_mix_modern/model_epoch_04.pt +3 -0
  50. nlp_1b_h100_ft_nlp_mix_modern/model_epoch_05.pt +3 -0
gpt_300m_hf_jsonl_sft/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5316d372ce207083091cd9e91989423d980e74ec539901d5ab03a07007c0d296
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb07fd3b7dca856117d7d06e8f3785fec68db4ceabffd2b3ece220d61994eb2b
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e77a79c6d71ed83342782f2764e3e81b85e492934f90583635ae5399dd3adcf
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02a608fb8e245826721681bd61e2d71f92131eb7c96a8c9c5100171eeb042212
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b6939c0ff76d450ca871e98305e63120db0c1df702320e2a48aa74aff8b6d0b
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e2ed13059803996fa3fb8a62a17d5475dd759f35855b8e8885232903ce74e14
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b02a6c5f5bf750460db4dd2d6e3affdf79ff086bf494cb8bc6e95e85011b3e0d
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_08.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f36c30095a9264ef50fd37e1e4f0d867639066467ec586a58f0e354df844aea
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_09.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:757dc73f4cbdf5f07890e52d38374a7ece565851366bdecac2d711c334f72d72
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_epoch_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b25a81a74e636170cfeeb53ef737883bb982972a74ff9b5ea68e5e70f9d093e
3
+ size 3476704961
gpt_300m_hf_jsonl_sft/model_last.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01255beb1f6483a9839476e7d1a51b625175eaec10b6c51032290a4c7bd95780
3
+ size 3476702665
gpt_300m_hf_jsonl_sft/tokenizer_32k/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
gpt_300m_hf_jsonl_sft/tokenizer_32k/tokenizer_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<bos>",
4
+ "eos_token": "<eos>",
5
+ "model_max_length": 1000000000000000019884624838656,
6
+ "pad_token": "<pad>",
7
+ "tokenizer_class": "TokenizersBackend",
8
+ "unk_token": "<unk>"
9
+ }
gpt_300m_hf_jsonl_sft_fast/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:625971b99d5d2a3e6c08f410e2e132b1d5d1cf3d6fe0117d6ab6656ccab53011
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_fast/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:573539ce7189a8f1fd074a9a9dd939ee167c40b6d5d208139401bb80062c08c6
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_fast/model_epoch_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d1c651971c515d491d2caf9aff16d5ae75e87b9e432258181b27aebef010804
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_fast/model_last.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ce0327f813c0e8a74ccdc3ff537ceaf9dfdd36b5dae1deffe5c2bec5208ef7a
3
+ size 3476702665
gpt_300m_hf_jsonl_sft_fast/tokenizer_32k/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
gpt_300m_hf_jsonl_sft_fast/tokenizer_32k/tokenizer_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<bos>",
4
+ "eos_token": "<eos>",
5
+ "model_max_length": 1000000000000000019884624838656,
6
+ "pad_token": "<pad>",
7
+ "tokenizer_class": "TokenizersBackend",
8
+ "unk_token": "<unk>"
9
+ }
gpt_300m_hf_jsonl_sft_v2/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:550bb73ddac988e76984f215a5fac49d180b0e3784cbc28e4539df6704f13037
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_v2/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb22b7efbcea38f7f9a32e0e520e115e05e9f9b772a56a2d71fc667896ba64b0
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_v2/model_epoch_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04b2260f4594168ce647de8a3c3dcbf2c0699381e64ce77142ae24c4abb0218d
3
+ size 3476704961
gpt_300m_hf_jsonl_sft_v2/model_last.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6e3e77064d079236dacf38730c3760ec13f4fdf011dcadb2514df88e1f26abe
3
+ size 3476702665
gpt_300m_hf_jsonl_sft_v2/tokenizer_32k/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
gpt_300m_hf_jsonl_sft_v2/tokenizer_32k/tokenizer_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<bos>",
4
+ "eos_token": "<eos>",
5
+ "model_max_length": 1000000000000000019884624838656,
6
+ "pad_token": "<pad>",
7
+ "tokenizer_class": "TokenizersBackend",
8
+ "unk_token": "<unk>"
9
+ }
nlp_1b_h100_2h/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a942aab6420da7d5e3a13e93d90652755d5ebabd23a3ac67c651f7f0b34f8b28
3
+ size 11462557015
nlp_1b_h100_2h/model_best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80bc8ed8a60981469951735bebd228c05b1b55a2056712e38c492284039e96c2
3
+ size 11462571709
nlp_1b_h100_2h/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cd4da895e27f787809bb12a74066bf383d5bdc97884e8f8353462aa1338613d
3
+ size 11462574453
nlp_1b_h100_2h/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d2bde7c7280a81787e34f2fd274fdc7a44f0623c749689bb64313271ed20831
3
+ size 11462574453
nlp_1b_h100_2h/train_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7b81bc226e5ef6c922ddad5945aa7ff381520ab1e3cb5f9582a55c6e804999b
3
+ size 11462572395
nlp_1b_h100_ft_nlp_mix_10ep_8h/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b5de6c2be3e46e9a4a8326c2271ac7d9d65ee376d4cf267db938ebc17927c8d
3
+ size 3820833291
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbd37739e9bba74cecb3d88d33ee873aa6edc78ce10a4e771a1b7d765d49d218
3
+ size 3820845051
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bf665ea3542b18e3d62ae2739dc26a15907dddeddc2d19406be5514b68cb6b1
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1889f17cba79d0b0573fcea382d6670a4921af76abd5aa19dda7dd15e9a6d0
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fbe6baaf34529b98d41ff99bf97753161a2417f13d45b0df1eada25f413de24
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e292be516eb039d19436760207c05d79d82ca7bd34b8b4c453a9aec36c1d4c9
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eccbe592ac3130f180df0975330893cb4cdbff4da9bfb2ff7c9a78451abb1572
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_06.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f2282a0e28787ddd53a0c7787d78c961c1a624e9f9316b00de45d8bef51f366
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_07.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d575982e10a1ad97aa2a60488cdb9c7b3b23778c6e2496390b43daafc00e8abf
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_08.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96c84e78a244ff0d51e757108afb0646649b931de2c3a3209dbc3d20ec66be50
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_09.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea4684b94b7803044c887c7f73782066d2428460f6d07e429aee51c7bdc546b0
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/model_epoch_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dea56757e1272a70098bd3320374644ee346dbfa1ffbb6c25176a5d552395f5b
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_10ep_8h/train_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e95ee24eb1310d8316f00ad968f066f8f6834126c53cc82a7973897976ff0d6
3
+ size 11462574827
nlp_1b_h100_ft_nlp_mix_modern/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8339e96bb23e37442d92c5dd5a4503fd9f2f1ae8699c773f9f07d5043abdefc
3
+ size 3820833291
nlp_1b_h100_ft_nlp_mix_modern/model_best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6367d3943ab92a28fa09fdd3c808277ec78a6b800f037521ecbcb791d1a044d6
3
+ size 3820845051
nlp_1b_h100_ft_nlp_mix_modern/model_epoch_01.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d1d94bdfefa708dc8d9332019cdbdb8479925b72f2b5e2ea48089b6270f8764
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_modern/model_epoch_02.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29227df24886105aed453ed5f6e08b659d2b4f4f7a8c6e7833143f6b49e286e8
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_modern/model_epoch_03.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b1763bf610808b3a1f36ea8b0119324c8b4b36987c677f6028f95bf8e4f6a2b
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_modern/model_epoch_04.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0d812813971eb6e8bcf09c141fcd317e71bce4b2311d96b8bd36e5d5a516e47
3
+ size 3820845755
nlp_1b_h100_ft_nlp_mix_modern/model_epoch_05.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:406b0e63c3cf2601f1aba8a9f210abf1f9636f7641702976b1c38cbad482fd5d
3
+ size 3820845755