Upload folder using huggingface_hub

Browse files

Files changed (11) hide show

config.json +65 -46
legacy_files/added_tokens.json +29 -0
legacy_files/hf_quant_config.json +14 -0
legacy_files/special_tokens_map.json +48 -0
model-00001-of-00005.safetensors +2 -2
model-00002-of-00005.safetensors +2 -2
model-00003-of-00005.safetensors +2 -2
model-00004-of-00005.safetensors +2 -2
model-00005-of-00005.safetensors +2 -2
model.safetensors.index.json +0 -0
modeling_iquestloopcoder.py +1 -1

config.json CHANGED Viewed

@@ -1,50 +1,69 @@
 {
-    "architectures": [
-        "IQuestLoopCoderForCausalLM"
-    ],
-    "attention_bias": false,
-    "attention_dropout": 0.0,
-    "auto_map": {
-        "AutoConfig": "configuration_iquestloopcoder.IQuestLoopCoderConfig",
-        "AutoModel": "modeling_iquestloopcoder.IQuestLoopCoderModel",
-        "AutoModelForCausalLM": "modeling_iquestloopcoder.IQuestLoopCoderForCausalLM"
     },
-    "bos_token_id": 1,
-    "dtype": "bfloat16",
-    "eos_token_id": [
-        2,
-        75864,
-        75869
     ],
-    "head_dim": 128,
-    "hidden_act": "silu",
-    "hidden_size": 5120,
-    "initializer_range": 0.02,
-    "intermediate_size": 27648,
-    "loop_num": 2,
-    "loop_window_size": 64,
-    "max_position_embeddings": 131072,
-    "mlp_bias": false,
-    "model_type": "iquestloopcoder",
-    "num_attention_heads": 40,
-    "num_hidden_layers": 80,
-    "num_key_value_heads": 8,
-    "rms_norm_eps": 1e-05,
-    "rope_scaling": null,
-    "rope_theta": 500000,
-    "tie_word_embeddings": false,
-    "transformers_version": "4.57.3",
-    "use_cache": true,
-    "vocab_size": 76800,
-    "quantization_config": {
-        "ignore": [
-            "lm_head"
-        ],
-        "quant_algo": "NVFP4",
-        "producer": {
-            "name": "modelopt",
-            "version": "0.40.0"
-        },
-        "quant_method": "modelopt"
-    }
 }

 {
+  "architectures": [
+    "IQuestLoopCoderForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "auto_map": {
+    "AutoConfig": "configuration_iquestloopcoder.IQuestLoopCoderConfig",
+    "AutoModel": "modeling_iquestloopcoder.IQuestLoopCoderModel",
+    "AutoModelForCausalLM": "modeling_iquestloopcoder.IQuestLoopCoderForCausalLM"
+  },
+  "bos_token_id": 1,
+  "dtype": "bfloat16",
+  "eos_token_id": [
+    2,
+    75864,
+    75869
+  ],
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 5120,
+  "initializer_range": 0.02,
+  "intermediate_size": 27648,
+  "loop_num": 2,
+  "loop_window_size": 64,
+  "max_position_embeddings": 131072,
+  "mlp_bias": false,
+  "model_type": "iquestloopcoder",
+  "num_attention_heads": 40,
+  "num_hidden_layers": 80,
+  "num_key_value_heads": 8,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 500000,
+  "tie_word_embeddings": false,
+  "transformers_version": "4.56.0",
+  "use_cache": true,
+  "vocab_size": 76800,
+  "quantization_config": {
+    "config_groups": {
+      "group_0": {
+        "input_activations": {
+          "dynamic": false,
+          "num_bits": 4,
+          "type": "float",
+          "group_size": 16
+        },
+        "weights": {
+          "dynamic": false,
+          "num_bits": 4,
+          "type": "float",
+          "group_size": 16
+        },
+        "targets": [
+          "Linear"
+        ]
+      }
     },
+    "ignore": [
+      "lm_head"
     ],
+    "quant_algo": "NVFP4",
+    "producer": {
+      "name": "modelopt",
+      "version": "0.41.0"
+    },
+    "quant_method": "modelopt"
+  }
 }

legacy_files/added_tokens.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "</think>": 75873,
+  "</tool_call>": 75877,
+  "</tool_response>": 75879,
+  "</tools>": 75875,
+  "<CLS>": 75858,
+  "<EOD>": 75860,
+  "<MASK>": 75861,
+  "<PAD>": 75862,
+  "<SEP>": 75859,
+  "<think>": 75872,
+  "<tool_call>": 75876,
+  "<tool_response>": 75878,
+  "<tools>": 75874,
+  "<|CLS|>": 75880,
+  "<|EOD|>": 75882,
+  "<|MASK|>": 75883,
+  "<|PAD|>": 75884,
+  "<|SEP|>": 75881,
+  "<|endoftext|>": 75869,
+  "<|file_sep|>": 75871,
+  "<|fim_middle|>": 75866,
+  "<|fim_pad|>": 75868,
+  "<|fim_prefix|>": 75865,
+  "<|fim_suffix|>": 75867,
+  "<|im_end|>": 75864,
+  "<|im_start|>": 75863,
+  "<|repo_name|>": 75870
+}

legacy_files/hf_quant_config.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+    "producer": {
+        "name": "modelopt",
+        "version": "0.41.0"
+    },
+    "quantization": {
+        "quant_algo": "NVFP4",
+        "kv_cache_quant_algo": null,
+        "group_size": 16,
+        "exclude_modules": [
+            "lm_head"
+        ]
+    }
+}

legacy_files/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "additional_special_tokens": [
+    "<|CLS|>",
+    "<|SEP|>",
+    "<|EOD|>",
+    "<|MASK|>",
+    "<|PAD|>",
+    "<|fim_prefix|>",
+    "<|fim_middle|>",
+    "<|fim_suffix|>",
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|fim_pad|>",
+    "<|endoftext|>",
+    "<|repo_name|>",
+    "<|file_sep|>",
+    "<think>",
+    "</think>"
+  ],
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": true
+  }
+}

model-00001-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:76b5af107a20f8e0e0bdae5c45c579a13dc2f659aaacb0ca389ab3524f566935
-size 4937199704

 version https://git-lfs.github.com/spec/v1
+oid sha256:fdb421765450b1973baefbf307181772772e106240e2720dcccc182e764c4c18
+size 4936202752

model-00002-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9010c28d8b6e9f46384072a54e45eb87ee3d70dc7dddda5f091f46b52a88fa79
-size 4938439016

 version https://git-lfs.github.com/spec/v1
+oid sha256:53393123f0b2a92ad6a39c8799f9af1cb3cc68bddb8bcc5f9f11e479cf2def73
+size 4937255232

model-00003-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:318b778d7802aea8a05427a195a948a3292896d4c6c25ceeb9b1f03b21d9329f
-size 4938439016

 version https://git-lfs.github.com/spec/v1
+oid sha256:8488ee175bf2ebe7e0fa6529a62be49c38834f7127c680c3ce188d399bebb8ac
+size 4937255232

model-00004-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1edc5eba6f5dc7b5b0cd993b3a4b1e8df5524a44ff7b82919d8a0fe1982c03d4
-size 4938439016

 version https://git-lfs.github.com/spec/v1
+oid sha256:49276ddde39b3f45328cfd845fc8547fbfcc76cd615fd917ea4d08e5e6148ca0
+size 4937255232

model-00005-of-00005.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:783ed16140e9f0e19c10819b71bb032391da2d72e10c750cdfae6d7d9f6ed523
-size 3769818152

 version https://git-lfs.github.com/spec/v1
+oid sha256:1f2cb2b12e1631542403147c084c7792d0622cfbec968df1319e540baa80ce9c
+size 3769105000

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

modeling_iquestloopcoder.py CHANGED Viewed

@@ -884,7 +884,7 @@ class IQuestLoopCoderModel(IQuestLoopCoderPreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()
-    @check_model_inputs()
     @auto_docstring
     def forward(
         self,

         # Initialize weights and apply final processing
         self.post_init()
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,