ayousanz committed on Apr 11, 2024

Commit

c21a234

verified ·

1 Parent(s): 58dc91b

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

checkpoint-42000/config.json +25 -0
checkpoint-42000/generation_config.json +6 -0
checkpoint-42000/model.safetensors +3 -0
checkpoint-42000/optimizer.pt +3 -0
checkpoint-42000/rng_state_0.pth +3 -0
checkpoint-42000/rng_state_1.pth +3 -0
checkpoint-42000/scheduler.pt +3 -0
checkpoint-42000/special_tokens_map.json +30 -0
checkpoint-42000/spiece.model +3 -0
checkpoint-42000/tokenizer.json +0 -0
checkpoint-42000/tokenizer_config.json +47 -0
checkpoint-42000/trainer_state.json +0 -0
checkpoint-42000/training_args.bin +3 -0
checkpoint-43000/config.json +25 -0
checkpoint-43000/generation_config.json +6 -0
checkpoint-43000/model.safetensors +3 -0
checkpoint-43000/optimizer.pt +3 -0
checkpoint-43000/rng_state_0.pth +3 -0
checkpoint-43000/rng_state_1.pth +3 -0
checkpoint-43000/scheduler.pt +3 -0
checkpoint-43000/special_tokens_map.json +30 -0
checkpoint-43000/spiece.model +3 -0
checkpoint-43000/tokenizer.json +0 -0
checkpoint-43000/tokenizer_config.json +47 -0
checkpoint-43000/trainer_state.json +0 -0
checkpoint-43000/training_args.bin +3 -0
checkpoint-44000/config.json +25 -0
checkpoint-44000/generation_config.json +6 -0
checkpoint-44000/model.safetensors +3 -0
checkpoint-44000/optimizer.pt +3 -0
checkpoint-44000/rng_state_0.pth +3 -0
checkpoint-44000/rng_state_1.pth +3 -0
checkpoint-44000/scheduler.pt +3 -0
checkpoint-44000/special_tokens_map.json +30 -0
checkpoint-44000/spiece.model +3 -0
checkpoint-44000/tokenizer.json +0 -0
checkpoint-44000/tokenizer_config.json +47 -0
checkpoint-44000/trainer_state.json +0 -0
checkpoint-44000/training_args.bin +3 -0
checkpoint-45000/config.json +25 -0
checkpoint-45000/generation_config.json +6 -0
checkpoint-45000/model.safetensors +3 -0
checkpoint-45000/optimizer.pt +3 -0
checkpoint-45000/rng_state_0.pth +3 -0
checkpoint-45000/rng_state_1.pth +3 -0
checkpoint-45000/scheduler.pt +3 -0
checkpoint-45000/special_tokens_map.json +30 -0
checkpoint-45000/spiece.model +3 -0
checkpoint-45000/tokenizer.json +0 -0
checkpoint-45000/tokenizer_config.json +47 -0

checkpoint-42000/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "None",
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "hidden_act": "silu",
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 2400,
+  "max_position_embeddings": 4096,
+  "model_type": "mistral",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 10000.0,
+  "sliding_window": 1024,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-42000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "transformers_version": "4.35.2"
+}

checkpoint-42000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:46d6a74205226153c7ea2e0c97f3d12424969eb6cf24ee6c63ba1c78191ef5e6
+size 1421709600

checkpoint-42000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de54cb99d80d79f0b6a7b7486ceaac1809e7af5d29b6b31718114ee9657b8b0e
+size 712761658

checkpoint-42000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f26a6d5ed9c5a3802e5d26f3703c66f8a5dab02cdea54ca59b17bc5824ac1a4b
+size 14512

checkpoint-42000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f7d8eb55ec39784a21119a2b22ec723a2ec1758ca85298ae52af0fd00ecceee
+size 14512

checkpoint-42000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fc14fb7e32834d062fb3f6af42921ca80d4b710f136ac624c10d598afb3e21b
+size 1064

checkpoint-42000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-42000/spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:604cb0c2f073ba13f04739ced6f8310f4f00ab344feea6cb5c4012af3876c684
+size 1249735

checkpoint-42000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-42000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "legacy": true,
+  "model_max_length": 50000,
+  "pad_token": "[PAD]",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
+  "unk_token": "[UNK]"
+}

checkpoint-42000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-42000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e155e14ea10bc818c6d546606d5c422939b7900b506b462ed99a246bcc2dbf79
+size 4600

checkpoint-43000/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "None",
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "hidden_act": "silu",
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 2400,
+  "max_position_embeddings": 4096,
+  "model_type": "mistral",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 10000.0,
+  "sliding_window": 1024,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-43000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "transformers_version": "4.35.2"
+}

checkpoint-43000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5c889035b174aac9ad61f229de04ecc362bd23cc0c89138663f39e49ed89b86c
+size 1421709600

checkpoint-43000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68ee60f2eb8071a5ab58168a97683369593ee5441b171f2366554a0a3ff3a82d
+size 712761658

checkpoint-43000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7a46cfb281df1ee9eb2b6d5bf8f522cc261375d6cc061a7f831b99f82b44c62
+size 14512

checkpoint-43000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6804f9be22b28f887e06ec0c0bae307b4cd4c6a9fd680b4fc2351e9ba5b062b
+size 14512

checkpoint-43000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:041fe72aa9be4abbdea46b9568cf6294d7346559787effb76fa559fc30a1a19f
+size 1064

checkpoint-43000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-43000/spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:604cb0c2f073ba13f04739ced6f8310f4f00ab344feea6cb5c4012af3876c684
+size 1249735

checkpoint-43000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-43000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "legacy": true,
+  "model_max_length": 50000,
+  "pad_token": "[PAD]",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
+  "unk_token": "[UNK]"
+}

checkpoint-43000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-43000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e155e14ea10bc818c6d546606d5c422939b7900b506b462ed99a246bcc2dbf79
+size 4600

checkpoint-44000/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "None",
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "hidden_act": "silu",
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 2400,
+  "max_position_embeddings": 4096,
+  "model_type": "mistral",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 10000.0,
+  "sliding_window": 1024,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-44000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "transformers_version": "4.35.2"
+}

checkpoint-44000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:437f7a2f80c9d36a4ed847d03f1039ad15f0e994f3e0916ae60c97b27a8981a9
+size 1421709600

checkpoint-44000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a4a7b218db3591a66da548068764c03aa245c4cb64b2d7479cfbc2ba2ece692
+size 712761658

checkpoint-44000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c26f400a532a77a8b43a792de9f3cf07f51be4a5020289021d98978fe9b1ddac
+size 14512

checkpoint-44000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2ac0d24f1312218de1e388e3e1c4e0c19ebc17a4d905f26f378e6a39862428c
+size 14512

checkpoint-44000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68a1e2417b9baacab06a0a166979ef2b8eed646d71adf8e6f4d8f1c9d91cad93
+size 1064

checkpoint-44000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-44000/spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:604cb0c2f073ba13f04739ced6f8310f4f00ab344feea6cb5c4012af3876c684
+size 1249735

checkpoint-44000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-44000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "legacy": true,
+  "model_max_length": 50000,
+  "pad_token": "[PAD]",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
+  "unk_token": "[UNK]"
+}

checkpoint-44000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-44000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e155e14ea10bc818c6d546606d5c422939b7900b506b462ed99a246bcc2dbf79
+size 4600

checkpoint-45000/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "None",
+  "architectures": [
+    "MistralForCausalLM"
+  ],
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "hidden_act": "silu",
+  "hidden_size": 1024,
+  "initializer_range": 0.02,
+  "intermediate_size": 2400,
+  "max_position_embeddings": 4096,
+  "model_type": "mistral",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_theta": 10000.0,
+  "sliding_window": 1024,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-45000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "eos_token_id": 0,
+  "transformers_version": "4.35.2"
+}

checkpoint-45000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6c5bd234ddfa34f4e0d1d966e404cf367264c363ee9c8b0bffffc5970195595
+size 1421709600

checkpoint-45000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0ad6b1d3106a40cb764468287692224e8302fece8d64f3a4a79d62a975fd9b6
+size 712761658

checkpoint-45000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6769c3a5012a8c8eea976d61baa487126263f185fbe6f2ebbbbfad39b96e1e2
+size 14512

checkpoint-45000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c57710d7e52f14d65517700d49762c20c8de978ffe8c4550dbe8e2039b6c698c
+size 14512

checkpoint-45000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:61fd4bf6ad594e4cf0a9ccb0a644e5419662c4659d2ef42c89aabf5a2ba3ca3c
+size 1064

checkpoint-45000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-45000/spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:604cb0c2f073ba13f04739ced6f8310f4f00ab344feea6cb5c4012af3876c684
+size 1249735

checkpoint-45000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-45000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "legacy": true,
+  "model_max_length": 50000,
+  "pad_token": "[PAD]",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
+  "unk_token": "[UNK]"
+}