Upload folder using huggingface_hub
This view is limited to 50 files because it contains too many changes.
- resemble_to_drop_frequency_3591/checkpoint-40000/config.json +31 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/generation_config.json +6 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/merges.txt +0 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/model.safetensors +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/optimizer.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/rng_state.pth +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/scaler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/scheduler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/special_tokens_map.json +5 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/tokenizer.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/tokenizer_config.json +20 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/trainer_state.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/training_args.bin +3 -0
- resemble_to_drop_frequency_3591/checkpoint-40000/vocab.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/config.json +31 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/generation_config.json +6 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/merges.txt +0 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/model.safetensors +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/optimizer.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/rng_state.pth +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/scaler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/scheduler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/special_tokens_map.json +5 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/tokenizer.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/tokenizer_config.json +20 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/trainer_state.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/training_args.bin +3 -0
- resemble_to_drop_frequency_3591/checkpoint-50000/vocab.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/config.json +31 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/generation_config.json +6 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/merges.txt +0 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/model.safetensors +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/optimizer.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/rng_state.pth +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/scaler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/scheduler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/special_tokens_map.json +5 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/tokenizer.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/tokenizer_config.json +20 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/trainer_state.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/training_args.bin +3 -0
- resemble_to_drop_frequency_3591/checkpoint-60000/vocab.json +0 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/config.json +31 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/generation_config.json +6 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/merges.txt +0 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/model.safetensors +3 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/optimizer.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/rng_state.pth +3 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/scaler.pt +3 -0
- resemble_to_drop_frequency_3591/checkpoint-70000/scheduler.pt +3 -0
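The listing above (truncated at 50 entries) covers the per-checkpoint training artifacts for steps 40000 through 70000. Per the commit message, they were pushed with huggingface_hub's `upload_folder` API; a minimal sketch of that kind of call is below. The repo id is a placeholder, not taken from this commit.

```python
# Minimal sketch of the upload call behind a commit like this one.
# "your-username/resemble_to_drop_frequency_3591" is a placeholder repo id.
from huggingface_hub import HfApi

api = HfApi()  # picks up the token from `huggingface-cli login` by default
api.upload_folder(
    folder_path="resemble_to_drop_frequency_3591",    # local Trainer output directory
    path_in_repo="resemble_to_drop_frequency_3591",   # keep the same prefix as the paths above
    repo_id="your-username/resemble_to_drop_frequency_3591",  # placeholder
    repo_type="model",
    commit_message="Upload folder using huggingface_hub",
)
```

Large binaries (model.safetensors, optimizer.pt, and so on) are stored via Git LFS, which is why their diffs below are three-line pointer files rather than raw weights.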
resemble_to_drop_frequency_3591/checkpoint-40000/config.json
ADDED
@@ -0,0 +1,31 @@
+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}
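config.json describes a standard GPT-2 small architecture: 12 layers, 12 heads, 768-dim embeddings, a 1024-token context, a 50257-token vocabulary, saved in float32 with transformers 4.55.2. A hedged sketch of loading one of these checkpoints once the directory is available locally:

```python
# Sketch: load the checkpoint directory with transformers (assumes it was downloaded locally).
from transformers import GPT2LMHeadModel

model = GPT2LMHeadModel.from_pretrained("resemble_to_drop_frequency_3591/checkpoint-40000")
print(model.config.n_layer, model.config.n_head, model.config.n_embd)   # 12 12 768 per the config above
print(f"{sum(p.numel() for p in model.parameters()):,} parameters")     # ~124M for this configuration
```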
resemble_to_drop_frequency_3591/checkpoint-40000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.55.2"
+}
resemble_to_drop_frequency_3591/checkpoint-40000/merges.txt
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-40000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d77fffe19c0ac6915706b2c6df80af612b079a72057e5fea40cc622450665ad
+size 497774208
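model.safetensors is tracked with Git LFS, so the diff shows only the three-line pointer (spec version, SHA-256 of the object, and its size — roughly 498 MB, consistent with ~124M float32 parameters), not the weights themselves. To resolve the pointer to the real file, something like `hf_hub_download` can be used; the repo id below is a placeholder:

```python
# Sketch: download the actual weights behind the LFS pointer above.
from huggingface_hub import hf_hub_download

weights_path = hf_hub_download(
    repo_id="your-username/resemble_to_drop_frequency_3591",  # placeholder repo id
    filename="resemble_to_drop_frequency_3591/checkpoint-40000/model.safetensors",
)
print(weights_path)  # local cache path of the ~498 MB safetensors file
```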
resemble_to_drop_frequency_3591/checkpoint-40000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:643583a5a7c070d199d7a8e29d5b7370e38ccc556b4157ed216d7696654efc4d
+size 995644811
resemble_to_drop_frequency_3591/checkpoint-40000/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae39a9c54fe946639529d1ec86e921d976be8714da9f1762f8be2f57aa5e3ece
+size 14645
resemble_to_drop_frequency_3591/checkpoint-40000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:728e44349b28ca534e2b04df0e5dc3845fb30a911dc7d7a13ef962caa844372e
+size 1383
resemble_to_drop_frequency_3591/checkpoint-40000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2358aa5657b1e21f344557abc28c2385065d2ed2f82389cf3ff94ad7b8bd44f
+size 1465
resemble_to_drop_frequency_3591/checkpoint-40000/special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}
resemble_to_drop_frequency_3591/checkpoint-40000/tokenizer.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-40000/tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}
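The tokenizer files describe the stock GPT-2 byte-level BPE tokenizer: <|endoftext|> (id 50256) serves as bos/eos/unk, and model_max_length matches n_positions in config.json. A sketch of pairing tokenizer and model from the same checkpoint directory and sampling a short continuation (local path assumed):

```python
# Sketch: tokenizer + model from one checkpoint directory, then a short sampled continuation.
from transformers import AutoModelForCausalLM, AutoTokenizer

ckpt = "resemble_to_drop_frequency_3591/checkpoint-40000"
tokenizer = AutoTokenizer.from_pretrained(ckpt)        # GPT2Tokenizer per tokenizer_config.json
model = AutoModelForCausalLM.from_pretrained(ckpt)

inputs = tokenizer("example prompt", return_tensors="pt")
# generation_config.json only pins bos/eos (50256); sampling settings are the caller's choice
outputs = model.generate(
    **inputs,
    max_new_tokens=20,
    do_sample=True,
    top_p=0.9,
    pad_token_id=tokenizer.eos_token_id,  # GPT-2 has no pad token; reuse eos to avoid the warning
)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```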
resemble_to_drop_frequency_3591/checkpoint-40000/trainer_state.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-40000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bec96c10e17a6d709f2402982e5e9fcc043d9077a59703780c138d2104dbd481
+size 5969
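training_args.bin, trainer_state.json, optimizer.pt, scheduler.pt, scaler.pt, and rng_state.pth are the extra state the transformers Trainer writes so a run can be resumed exactly (e.g. `trainer.train(resume_from_checkpoint=...)`). The hyperparameters themselves are serialized in training_args.bin; a small sketch of inspecting them, assuming the file is available locally:

```python
# Sketch: training_args.bin is a pickled TrainingArguments object saved by the Trainer.
import torch

args = torch.load(
    "resemble_to_drop_frequency_3591/checkpoint-40000/training_args.bin",
    weights_only=False,  # needed on recent torch: this is a pickled object, not a tensor file
)
print(args.learning_rate, args.per_device_train_batch_size, args.max_steps)
```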
resemble_to_drop_frequency_3591/checkpoint-40000/vocab.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-50000/config.json
ADDED
@@ -0,0 +1,31 @@
+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}
resemble_to_drop_frequency_3591/checkpoint-50000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.55.2"
+}
resemble_to_drop_frequency_3591/checkpoint-50000/merges.txt
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-50000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6e7b4791865d3360541eab474f20fb67c793814c87fb433d077b938d24c1bd0
+size 497774208
resemble_to_drop_frequency_3591/checkpoint-50000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b2061d5f87abaedc9462a4bd4c6cc81c627d08979a1996baf8f7f803220d1da8
+size 995644811
resemble_to_drop_frequency_3591/checkpoint-50000/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:12f39e2465dbc023814fa665f7a732d148eb0e4b1ae7a6db53ef88a35421f165
+size 14645
resemble_to_drop_frequency_3591/checkpoint-50000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab6f83cb1957ae158df43ef61dafe2cadd5b16c24e6f0928531ae5d811029227
+size 1383
resemble_to_drop_frequency_3591/checkpoint-50000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:377c4525c7c71feb1a629cb8c76d31b37815acb15a41dfc2e1832b672584f32f
+size 1465
resemble_to_drop_frequency_3591/checkpoint-50000/special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}
resemble_to_drop_frequency_3591/checkpoint-50000/tokenizer.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-50000/tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}
resemble_to_drop_frequency_3591/checkpoint-50000/trainer_state.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-50000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bec96c10e17a6d709f2402982e5e9fcc043d9077a59703780c138d2104dbd481
+size 5969
resemble_to_drop_frequency_3591/checkpoint-50000/vocab.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-60000/config.json
ADDED
@@ -0,0 +1,31 @@
+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}
resemble_to_drop_frequency_3591/checkpoint-60000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.55.2"
+}
resemble_to_drop_frequency_3591/checkpoint-60000/merges.txt
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-60000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33df32af352d40440772eede67abafc28a402a1148ef8978eca82ac546494caa
+size 497774208
resemble_to_drop_frequency_3591/checkpoint-60000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b63779ca404c21bf487ebef04690d3f9052a79ff07d3f658e31f7fe9cecd526
+size 995644811
resemble_to_drop_frequency_3591/checkpoint-60000/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e37a80bb23d827365ee82911accebb2560873d4d6ee73dd7508bbda3a4150e79
+size 14645
resemble_to_drop_frequency_3591/checkpoint-60000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65ac0498f9b9a1cbc22618943d83c80c9a7141feb98a468c9a8ec940b55b0710
+size 1383
resemble_to_drop_frequency_3591/checkpoint-60000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c3c70200a195f5b6062f0194e47843ceb01c33595efcd51f2af84bf2de1f1765
+size 1465
resemble_to_drop_frequency_3591/checkpoint-60000/special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}
resemble_to_drop_frequency_3591/checkpoint-60000/tokenizer.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-60000/tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}
resemble_to_drop_frequency_3591/checkpoint-60000/trainer_state.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-60000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bec96c10e17a6d709f2402982e5e9fcc043d9077a59703780c138d2104dbd481
+size 5969
resemble_to_drop_frequency_3591/checkpoint-60000/vocab.json
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-70000/config.json
ADDED
@@ -0,0 +1,31 @@
+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_cache": true,
+  "vocab_size": 50257
+}
resemble_to_drop_frequency_3591/checkpoint-70000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.55.2"
+}
resemble_to_drop_frequency_3591/checkpoint-70000/merges.txt
ADDED
The diff for this file is too large to render.
resemble_to_drop_frequency_3591/checkpoint-70000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e1544a9e1a3a80a2f64d3a36cf47802ac2b842a83e44af81a500178c2f97422
+size 497774208
resemble_to_drop_frequency_3591/checkpoint-70000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:55203275b0ff0ef0f8e021771f3ef94d8200c2b60e9e260d966706fb3acbc4a0
+size 995644811
resemble_to_drop_frequency_3591/checkpoint-70000/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac247caa082213ce75fa070a37e9d4196639932aac7ebadd8312cda9d99502ee
+size 14645
resemble_to_drop_frequency_3591/checkpoint-70000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8ded865ec6ac91caef657c3b3ed159cd2fbf7ce24e435ad72251afa3b3a2ecc
+size 1383
resemble_to_drop_frequency_3591/checkpoint-70000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b5d9147f6c552b97d557708553469c436b903ee5755fef452f0f9cdd97c2e62e
+size 1465