MerantixMomentum/acip_llama1_7b

Text Generation

feature-extraction

Model card · Files and versions

martingenzel committed on Apr 28, 2025

Commit

755d958

·

verified ·

1 Parent(s): f50e653

Add model

Files changed (2) hide show

README.md +10 -4
config.json +7 -7

README.md CHANGED Viewed

@@ -1,9 +1,15 @@
 ---
 license: other
-datasets: ['allenai/c4']
-language: ['en']
-metrics: ['perplexity', 'accuracy']
-tags: ['acip', 'pytorch']
 base_model:
 - jeffwan/llama-7b-hf
 pipeline_tag: text-generation

 ---
 license: other
+datasets:
+- allenai/c4
+language:
+- en
+metrics:
+- perplexity
+- accuracy
+tags:
+- acip
+- pytorch
 base_model:
 - jeffwan/llama-7b-hf
 pipeline_tag: text-generation

config.json CHANGED Viewed

@@ -9,9 +9,9 @@
         "bias": "none",
         "eva_config": null,
         "exclude_modules": [
-          "parametrization",
           "base",
-          "ortho"
         ],
         "fan_in_fan_out": false,
         "inference_mode": false,
@@ -31,14 +31,14 @@
         "rank_pattern": {},
         "revision": null,
         "target_modules": [
-          "up_proj",
-          "q_proj",
-          "k_proj",
-          "v_proj",
-          "ortho",
           "base",
           "gate_proj",
           "o_proj",
           "down_proj"
         ],
         "task_type": "CAUSAL_LM",

         "bias": "none",
         "eva_config": null,
         "exclude_modules": [
           "base",
+          "ortho",
+          "parametrization"
         ],
         "fan_in_fan_out": false,
         "inference_mode": false,
         "rank_pattern": {},
         "revision": null,
         "target_modules": [
           "base",
           "gate_proj",
+          "up_proj",
+          "ortho",
           "o_proj",
+          "v_proj",
+          "q_proj",
+          "k_proj",
           "down_proj"
         ],
         "task_type": "CAUSAL_LM",