hbin0701 committed on May 14, 2025

Commit

3e31391

verified ·

1 Parent(s): 65127e4

Upload folder using huggingface_hub

Browse files

Files changed (20) hide show

config.json +1 -0
decoder.pt +3 -0
decoder_model/config.json +40 -0
decoder_model/generation_config.json +6 -0
decoder_model/model.safetensors +3 -0
decoder_to_translator_proj.pt +3 -0
encoder.pt +3 -0
encoder_model/config.json +40 -0
encoder_model/generation_config.json +6 -0
encoder_model/model.safetensors +3 -0
encoder_to_decoder_proj.pt +3 -0
tokenizer/merges.txt +0 -0
tokenizer/special_tokens_map.json +6 -0
tokenizer/tokenizer.json +0 -0
tokenizer/tokenizer_config.json +21 -0
tokenizer/vocab.json +0 -0
translator.pt +3 -0
translator_model/config.json +40 -0
translator_model/generation_config.json +6 -0
translator_model/model.safetensors +3 -0

config.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"task": "csqa", "share_param": false, "use_cont": true, "use_dist": false, "use_mse": false, "dropout_rate": 0.2, "encoder_path": "/home/hyeonbin/Latent_Step/src/new/1.6_models/csqa/encoder2", "decoder_path": "hbin0701/csqa-cot", "translator_path": "/home/hyeonbin/Latent_Step/src/new/1.6_models/csqa/decoder2", "tokenizer_name": "gpt2"}

decoder.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35d851b383d27fd6ca2f2c22c01ffc7a0b3928a9b7eee638da039cbdca595019
+size 253631068

decoder_model/config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "_name_or_path": "hbin0701/csqa-cot",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "pad_token_id": 50256,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.48.0",
+  "use_cache": false,
+  "vocab_size": 50257
+}

decoder_model/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.48.0"
+}

decoder_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0bf4a45b382621e4316cbe6a2298c798e9bf60e4da74e76ac574934e7d102ed8
+size 248894656

decoder_to_translator_proj.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e12ea13ec8fb727f7edad197383c6fa648a3af1136310b168ab8692046e56193
+size 253606075

encoder.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5c05955e66dcefb0b4a7a257d3934e14c4032f6cda8bffa49d3986c9ee335eb
+size 248934474

encoder_model/config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "_name_or_path": "/home/hyeonbin/Latent_Step/src/new/1.6_models/csqa/encoder2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "pad_token_id": 50256,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.48.0",
+  "use_cache": false,
+  "vocab_size": 50257
+}

encoder_model/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.48.0"
+}

encoder_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:efd6cb1b23715360a4db8984386714da89b0a486545328531318dc978fb3e314
+size 248894656

encoder_to_decoder_proj.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b83adba24950cfdc8da4ea849e5cb6fe8d935eee94339a524e10918b04ac3a90
+size 253606060

tokenizer/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "pad_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}

tokenizer/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
+  "model_max_length": 1024,
+  "pad_token": "<|endoftext|>",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}

tokenizer/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

translator.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:11506f15322d8c7731b51830b6b33f32b7e5d9a5861c87d0a0a4235295a483dc
+size 248935506

translator_model/config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "_name_or_path": "/home/hyeonbin/Latent_Step/src/new/1.6_models/csqa/decoder2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "pad_token_id": 50256,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.48.0",
+  "use_cache": false,
+  "vocab_size": 50257
+}

translator_model/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.48.0"
+}

translator_model/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:efd6cb1b23715360a4db8984386714da89b0a486545328531318dc978fb3e314
+size 248894656