nathan0 committed on Oct 30, 2023

Commit

bfd39e8

1 Parent(s): 4b6e875

first commit

Browse files

llama-2-delta-tune-model-div-sal

Files changed (22)

README.md +7 -1
adapter_config.json +21 -0
adapter_model.bin +3 -0
all_results.json +9 -0
best_model_structure.txt +1 -0
checkpoint-1130/README.md +9 -0
checkpoint-1130/adapter_config.json +21 -0
checkpoint-1130/adapter_model.bin +3 -0
checkpoint-1130/optimizer.pt +3 -0
checkpoint-1130/rng_state.pth +3 -0
checkpoint-1130/scheduler.pt +3 -0
checkpoint-1130/special_tokens_map.json +12 -0
checkpoint-1130/tokenizer.json +0 -0
checkpoint-1130/tokenizer.model +3 -0
checkpoint-1130/tokenizer_config.json +33 -0
checkpoint-1130/trainer_state.json +82 -0
checkpoint-1130/training_args.bin +3 -0
eval_results.json +9 -0
llama2-7b-delta-arc_challenge +27 -0
llama2-7b-delta-hellaswag +27 -0
llama2-7b-delta-mmlu +419 -0
llama2-7b-delta-truthqa +27 -0

README.md CHANGED Viewed

@@ -1,3 +1,9 @@
 ---
-license: apache-2.0
 ---

 ---
+library_name: peft
 ---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/home/vmagent/app/dataset/Llama-2-7b-hf",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 7,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 7,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8528895ce3b148285e487611cb9e3fcff148a1b33af0ae7b371c038b8e47af7f
+size 11303289

all_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 1.0,
+    "eval_loss": 0.9328290820121765,
+    "eval_runtime": 4637.6182,
+    "eval_samples": 15601,
+    "eval_samples_per_second": 3.364,
+    "eval_steps_per_second": 0.421,
+    "eval_tokens": 1974952
+}

best_model_structure.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"num_hidden_layers": [1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 1, 1], "r": [11, 3, 12, 1, 8, 11, 7, 12, 12, 6, 12, 1, 6, 11, 8, 3, 2, 12, 12, 5, 2, 3, 9, 2, 4, 12, 10, 1, 12, 2, 9, 7], "alpha": [6, 6, 6, 2, 3, 6, 5, 5, 1, 4, 2, 3, 6, 6, 3, 5, 1, 2, 6, 2, 2, 2, 3, 1, 4, 2, 6, 2, 2, 4, 6, 1]}

checkpoint-1130/README.md ADDED Viewed

	@@ -0,0 +1,9 @@

+---
+library_name: peft
+---
+## Training procedure
+### Framework versions
+- PEFT 0.4.0

checkpoint-1130/adapter_config.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "auto_mapping": null,
+  "base_model_name_or_path": "/home/vmagent/app/dataset/Llama-2-7b-hf",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 7,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 7,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-1130/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8528895ce3b148285e487611cb9e3fcff148a1b33af0ae7b371c038b8e47af7f
+size 11303289

checkpoint-1130/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:618f443ea86970abd066a87c6e263550cd27aaf80beae923ba65198a7286877d
+size 22615621

checkpoint-1130/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2baed73f84e733959faa04603c46e4711d40efc68cce45fe24a86cd4ef848a9
+size 13553

checkpoint-1130/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bdb9c410cb1fee55c64962fef791dbcf270d380ace861d4a88a849eae5737e19
+size 627

checkpoint-1130/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "pad_token": "</s>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-1130/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1130/tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723

checkpoint-1130/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,33 @@

+{
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "clean_up_tokenization_spaces": false,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "legacy": false,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": null,
+  "padding_side": "right",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-1130/trainer_state.json ADDED Viewed

	@@ -0,0 +1,82 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "global_step": 1130,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.09,
+      "learning_rate": 9.115044247787611e-05,
+      "loss": 1.0612,
+      "step": 100
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 8.230088495575221e-05,
+      "loss": 0.93,
+      "step": 200
+    },
+    {
+      "epoch": 0.27,
+      "learning_rate": 7.345132743362832e-05,
+      "loss": 0.9098,
+      "step": 300
+    },
+    {
+      "epoch": 0.35,
+      "learning_rate": 6.460176991150442e-05,
+      "loss": 0.9033,
+      "step": 400
+    },
+    {
+      "epoch": 0.44,
+      "learning_rate": 5.575221238938053e-05,
+      "loss": 0.8943,
+      "step": 500
+    },
+    {
+      "epoch": 0.53,
+      "learning_rate": 4.690265486725664e-05,
+      "loss": 0.8932,
+      "step": 600
+    },
+    {
+      "epoch": 0.62,
+      "learning_rate": 3.8053097345132744e-05,
+      "loss": 0.9019,
+      "step": 700
+    },
+    {
+      "epoch": 0.71,
+      "learning_rate": 2.9203539823008852e-05,
+      "loss": 0.8881,
+      "step": 800
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 2.0353982300884957e-05,
+      "loss": 0.8929,
+      "step": 900
+    },
+    {
+      "epoch": 0.88,
+      "learning_rate": 1.1504424778761062e-05,
+      "loss": 0.8916,
+      "step": 1000
+    },
+    {
+      "epoch": 0.97,
+      "learning_rate": 2.6548672566371683e-06,
+      "loss": 0.8882,
+      "step": 1100
+    }
+  ],
+  "max_steps": 1130,
+  "num_train_epochs": 1,
+  "total_flos": 1.8342786143512166e+17,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1130/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6eedaba58b8a9174ee307f742d1df91a3623ab4c51b3f334d1569a644cc1cffa
+size 4091

eval_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 1.0,
+    "eval_loss": 0.9328290820121765,
+    "eval_runtime": 4637.6182,
+    "eval_samples": 15601,
+    "eval_samples_per_second": 3.364,
+    "eval_steps_per_second": 0.421,
+    "eval_tokens": 1974952
+}

llama2-7b-delta-arc_challenge ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "results": {
+    "arc_challenge": {
+      "acc": 0.4974402730375427,
+      "acc_stderr": 0.014611199329843788,
+      "acc_norm": 0.5366894197952219,
+      "acc_norm_stderr": 0.01457200052775699
+    }
+  },
+  "versions": {
+    "arc_challenge": 0
+  },
+  "config": {
+    "model": "hf-causal-experimental",
+    "model_args": "pretrained=/home/vmagent/app/data/Llama-2-7b-hf,peft=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal,use_accelerate=True,delta=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal/best_model_structure.txt",
+    "num_fewshot": 25,
+    "batch_size": "auto",
+    "batch_sizes": [
+      16
+    ],
+    "device": null,
+    "no_cache": false,
+    "limit": null,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

llama2-7b-delta-hellaswag ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "results": {
+    "hellaswag": {
+      "acc": 0.5876319458275244,
+      "acc_stderr": 0.004912547040132876,
+      "acc_norm": 0.7783310097590121,
+      "acc_norm_stderr": 0.004145206350032315
+    }
+  },
+  "versions": {
+    "hellaswag": 0
+  },
+  "config": {
+    "model": "hf-causal-experimental",
+    "model_args": "pretrained=/home/vmagent/app/data/Llama-2-7b-hf,peft=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal,use_accelerate=True,delta=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal/best_model_structure.txt",
+    "num_fewshot": 10,
+    "batch_size": "auto",
+    "batch_sizes": [
+      16
+    ],
+    "device": null,
+    "no_cache": false,
+    "limit": null,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

llama2-7b-delta-mmlu ADDED Viewed

	@@ -0,0 +1,419 @@

+{
+  "results": {
+    "hendrycksTest-abstract_algebra": {
+      "acc": 0.34,
+      "acc_stderr": 0.04760952285695236,
+      "acc_norm": 0.34,
+      "acc_norm_stderr": 0.04760952285695236
+    },
+    "hendrycksTest-anatomy": {
+      "acc": 0.45925925925925926,
+      "acc_stderr": 0.04304979692464242,
+      "acc_norm": 0.45925925925925926,
+      "acc_norm_stderr": 0.04304979692464242
+    },
+    "hendrycksTest-astronomy": {
+      "acc": 0.40131578947368424,
+      "acc_stderr": 0.039889037033362836,
+      "acc_norm": 0.40131578947368424,
+      "acc_norm_stderr": 0.039889037033362836
+    },
+    "hendrycksTest-business_ethics": {
+      "acc": 0.49,
+      "acc_stderr": 0.05024183937956912,
+      "acc_norm": 0.49,
+      "acc_norm_stderr": 0.05024183937956912
+    },
+    "hendrycksTest-clinical_knowledge": {
+      "acc": 0.44150943396226416,
+      "acc_stderr": 0.030561590426731844,
+      "acc_norm": 0.44150943396226416,
+      "acc_norm_stderr": 0.030561590426731844
+    },
+    "hendrycksTest-college_biology": {
+      "acc": 0.4513888888888889,
+      "acc_stderr": 0.04161402398403279,
+      "acc_norm": 0.4513888888888889,
+      "acc_norm_stderr": 0.04161402398403279
+    },
+    "hendrycksTest-college_chemistry": {
+      "acc": 0.35,
+      "acc_stderr": 0.0479372485441102,
+      "acc_norm": 0.35,
+      "acc_norm_stderr": 0.0479372485441102
+    },
+    "hendrycksTest-college_computer_science": {
+      "acc": 0.36,
+      "acc_stderr": 0.04824181513244218,
+      "acc_norm": 0.36,
+      "acc_norm_stderr": 0.04824181513244218
+    },
+    "hendrycksTest-college_mathematics": {
+      "acc": 0.35,
+      "acc_stderr": 0.047937248544110196,
+      "acc_norm": 0.35,
+      "acc_norm_stderr": 0.047937248544110196
+    },
+    "hendrycksTest-college_medicine": {
+      "acc": 0.42196531791907516,
+      "acc_stderr": 0.0376574669386515,
+      "acc_norm": 0.42196531791907516,
+      "acc_norm_stderr": 0.0376574669386515
+    },
+    "hendrycksTest-college_physics": {
+      "acc": 0.23529411764705882,
+      "acc_stderr": 0.04220773659171453,
+      "acc_norm": 0.23529411764705882,
+      "acc_norm_stderr": 0.04220773659171453
+    },
+    "hendrycksTest-computer_security": {
+      "acc": 0.59,
+      "acc_stderr": 0.049431107042371025,
+      "acc_norm": 0.59,
+      "acc_norm_stderr": 0.049431107042371025
+    },
+    "hendrycksTest-conceptual_physics": {
+      "acc": 0.4340425531914894,
+      "acc_stderr": 0.03240038086792747,
+      "acc_norm": 0.4340425531914894,
+      "acc_norm_stderr": 0.03240038086792747
+    },
+    "hendrycksTest-econometrics": {
+      "acc": 0.32456140350877194,
+      "acc_stderr": 0.04404556157374768,
+      "acc_norm": 0.32456140350877194,
+      "acc_norm_stderr": 0.04404556157374768
+    },
+    "hendrycksTest-electrical_engineering": {
+      "acc": 0.3931034482758621,
+      "acc_stderr": 0.0407032901370707,
+      "acc_norm": 0.3931034482758621,
+      "acc_norm_stderr": 0.0407032901370707
+    },
+    "hendrycksTest-elementary_mathematics": {
+      "acc": 0.28835978835978837,
+      "acc_stderr": 0.0233306540545359,
+      "acc_norm": 0.28835978835978837,
+      "acc_norm_stderr": 0.0233306540545359
+    },
+    "hendrycksTest-formal_logic": {
+      "acc": 0.30158730158730157,
+      "acc_stderr": 0.04104947269903394,
+      "acc_norm": 0.30158730158730157,
+      "acc_norm_stderr": 0.04104947269903394
+    },
+    "hendrycksTest-global_facts": {
+      "acc": 0.3,
+      "acc_stderr": 0.046056618647183814,
+      "acc_norm": 0.3,
+      "acc_norm_stderr": 0.046056618647183814
+    },
+    "hendrycksTest-high_school_biology": {
+      "acc": 0.47419354838709676,
+      "acc_stderr": 0.02840609505765332,
+      "acc_norm": 0.47419354838709676,
+      "acc_norm_stderr": 0.02840609505765332
+    },
+    "hendrycksTest-high_school_chemistry": {
+      "acc": 0.3448275862068966,
+      "acc_stderr": 0.03344283744280458,
+      "acc_norm": 0.3448275862068966,
+      "acc_norm_stderr": 0.03344283744280458
+    },
+    "hendrycksTest-high_school_computer_science": {
+      "acc": 0.39,
+      "acc_stderr": 0.04902071300001975,
+      "acc_norm": 0.39,
+      "acc_norm_stderr": 0.04902071300001975
+    },
+    "hendrycksTest-high_school_european_history": {
+      "acc": 0.6060606060606061,
+      "acc_stderr": 0.03815494308688931,
+      "acc_norm": 0.6060606060606061,
+      "acc_norm_stderr": 0.03815494308688931
+    },
+    "hendrycksTest-high_school_geography": {
+      "acc": 0.5505050505050505,
+      "acc_stderr": 0.035441324919479704,
+      "acc_norm": 0.5505050505050505,
+      "acc_norm_stderr": 0.035441324919479704
+    },
+    "hendrycksTest-high_school_government_and_politics": {
+      "acc": 0.689119170984456,
+      "acc_stderr": 0.03340361906276585,
+      "acc_norm": 0.689119170984456,
+      "acc_norm_stderr": 0.03340361906276585
+    },
+    "hendrycksTest-high_school_macroeconomics": {
+      "acc": 0.4282051282051282,
+      "acc_stderr": 0.025088301454694834,
+      "acc_norm": 0.4282051282051282,
+      "acc_norm_stderr": 0.025088301454694834
+    },
+    "hendrycksTest-high_school_mathematics": {
+      "acc": 0.2851851851851852,
+      "acc_stderr": 0.027528599210340496,
+      "acc_norm": 0.2851851851851852,
+      "acc_norm_stderr": 0.027528599210340496
+    },
+    "hendrycksTest-high_school_microeconomics": {
+      "acc": 0.38235294117647056,
+      "acc_stderr": 0.03156663099215416,
+      "acc_norm": 0.38235294117647056,
+      "acc_norm_stderr": 0.03156663099215416
+    },
+    "hendrycksTest-high_school_physics": {
+      "acc": 0.3509933774834437,
+      "acc_stderr": 0.03896981964257375,
+      "acc_norm": 0.3509933774834437,
+      "acc_norm_stderr": 0.03896981964257375
+    },
+    "hendrycksTest-high_school_psychology": {
+      "acc": 0.6146788990825688,
+      "acc_stderr": 0.02086585085279412,
+      "acc_norm": 0.6146788990825688,
+      "acc_norm_stderr": 0.02086585085279412
+    },
+    "hendrycksTest-high_school_statistics": {
+      "acc": 0.25462962962962965,
+      "acc_stderr": 0.02971127586000535,
+      "acc_norm": 0.25462962962962965,
+      "acc_norm_stderr": 0.02971127586000535
+    },
+    "hendrycksTest-high_school_us_history": {
+      "acc": 0.5490196078431373,
+      "acc_stderr": 0.03492406104163613,
+      "acc_norm": 0.5490196078431373,
+      "acc_norm_stderr": 0.03492406104163613
+    },
+    "hendrycksTest-high_school_world_history": {
+      "acc": 0.6244725738396625,
+      "acc_stderr": 0.03152256243091156,
+      "acc_norm": 0.6244725738396625,
+      "acc_norm_stderr": 0.03152256243091156
+    },
+    "hendrycksTest-human_aging": {
+      "acc": 0.5381165919282511,
+      "acc_stderr": 0.033460150119732274,
+      "acc_norm": 0.5381165919282511,
+      "acc_norm_stderr": 0.033460150119732274
+    },
+    "hendrycksTest-human_sexuality": {
+      "acc": 0.5343511450381679,
+      "acc_stderr": 0.043749285605997376,
+      "acc_norm": 0.5343511450381679,
+      "acc_norm_stderr": 0.043749285605997376
+    },
+    "hendrycksTest-international_law": {
+      "acc": 0.6033057851239669,
+      "acc_stderr": 0.044658697805310094,
+      "acc_norm": 0.6033057851239669,
+      "acc_norm_stderr": 0.044658697805310094
+    },
+    "hendrycksTest-jurisprudence": {
+      "acc": 0.49074074074074076,
+      "acc_stderr": 0.04832853553437055,
+      "acc_norm": 0.49074074074074076,
+      "acc_norm_stderr": 0.04832853553437055
+    },
+    "hendrycksTest-logical_fallacies": {
+      "acc": 0.48466257668711654,
+      "acc_stderr": 0.039265223787088424,
+      "acc_norm": 0.48466257668711654,
+      "acc_norm_stderr": 0.039265223787088424
+    },
+    "hendrycksTest-machine_learning": {
+      "acc": 0.375,
+      "acc_stderr": 0.04595091388086298,
+      "acc_norm": 0.375,
+      "acc_norm_stderr": 0.04595091388086298
+    },
+    "hendrycksTest-management": {
+      "acc": 0.5145631067961165,
+      "acc_stderr": 0.049486373240266356,
+      "acc_norm": 0.5145631067961165,
+      "acc_norm_stderr": 0.049486373240266356
+    },
+    "hendrycksTest-marketing": {
+      "acc": 0.6837606837606838,
+      "acc_stderr": 0.03046365674734027,
+      "acc_norm": 0.6837606837606838,
+      "acc_norm_stderr": 0.03046365674734027
+    },
+    "hendrycksTest-medical_genetics": {
+      "acc": 0.53,
+      "acc_stderr": 0.05016135580465919,
+      "acc_norm": 0.53,
+      "acc_norm_stderr": 0.05016135580465919
+    },
+    "hendrycksTest-miscellaneous": {
+      "acc": 0.6232439335887612,
+      "acc_stderr": 0.01732829290730305,
+      "acc_norm": 0.6232439335887612,
+      "acc_norm_stderr": 0.01732829290730305
+    },
+    "hendrycksTest-moral_disputes": {
+      "acc": 0.49421965317919075,
+      "acc_stderr": 0.026917296179149116,
+      "acc_norm": 0.49421965317919075,
+      "acc_norm_stderr": 0.026917296179149116
+    },
+    "hendrycksTest-moral_scenarios": {
+      "acc": 0.2446927374301676,
+      "acc_stderr": 0.014378169884098435,
+      "acc_norm": 0.2446927374301676,
+      "acc_norm_stderr": 0.014378169884098435
+    },
+    "hendrycksTest-nutrition": {
+      "acc": 0.4673202614379085,
+      "acc_stderr": 0.02856869975222588,
+      "acc_norm": 0.4673202614379085,
+      "acc_norm_stderr": 0.02856869975222588
+    },
+    "hendrycksTest-philosophy": {
+      "acc": 0.5884244372990354,
+      "acc_stderr": 0.027950481494401262,
+      "acc_norm": 0.5884244372990354,
+      "acc_norm_stderr": 0.027950481494401262
+    },
+    "hendrycksTest-prehistory": {
+      "acc": 0.5,
+      "acc_stderr": 0.02782074420373286,
+      "acc_norm": 0.5,
+      "acc_norm_stderr": 0.02782074420373286
+    },
+    "hendrycksTest-professional_accounting": {
+      "acc": 0.3475177304964539,
+      "acc_stderr": 0.028406627809590954,
+      "acc_norm": 0.3475177304964539,
+      "acc_norm_stderr": 0.028406627809590954
+    },
+    "hendrycksTest-professional_law": {
+      "acc": 0.3683181225554107,
+      "acc_stderr": 0.012319403369564639,
+      "acc_norm": 0.3683181225554107,
+      "acc_norm_stderr": 0.012319403369564639
+    },
+    "hendrycksTest-professional_medicine": {
+      "acc": 0.5330882352941176,
+      "acc_stderr": 0.03030625772246832,
+      "acc_norm": 0.5330882352941176,
+      "acc_norm_stderr": 0.03030625772246832
+    },
+    "hendrycksTest-professional_psychology": {
+      "acc": 0.42320261437908496,
+      "acc_stderr": 0.019987809769482064,
+      "acc_norm": 0.42320261437908496,
+      "acc_norm_stderr": 0.019987809769482064
+    },
+    "hendrycksTest-public_relations": {
+      "acc": 0.5363636363636364,
+      "acc_stderr": 0.04776449162396197,
+      "acc_norm": 0.5363636363636364,
+      "acc_norm_stderr": 0.04776449162396197
+    },
+    "hendrycksTest-security_studies": {
+      "acc": 0.42448979591836733,
+      "acc_stderr": 0.031642094879429414,
+      "acc_norm": 0.42448979591836733,
+      "acc_norm_stderr": 0.031642094879429414
+    },
+    "hendrycksTest-sociology": {
+      "acc": 0.5621890547263682,
+      "acc_stderr": 0.035080801121998406,
+      "acc_norm": 0.5621890547263682,
+      "acc_norm_stderr": 0.035080801121998406
+    },
+    "hendrycksTest-us_foreign_policy": {
+      "acc": 0.69,
+      "acc_stderr": 0.04648231987117316,
+      "acc_norm": 0.69,
+      "acc_norm_stderr": 0.04648231987117316
+    },
+    "hendrycksTest-virology": {
+      "acc": 0.3855421686746988,
+      "acc_stderr": 0.037891344246115496,
+      "acc_norm": 0.3855421686746988,
+      "acc_norm_stderr": 0.037891344246115496
+    },
+    "hendrycksTest-world_religions": {
+      "acc": 0.6666666666666666,
+      "acc_stderr": 0.036155076303109365,
+      "acc_norm": 0.6666666666666666,
+      "acc_norm_stderr": 0.036155076303109365
+    }
+  },
+  "versions": {
+    "hendrycksTest-abstract_algebra": 1,
+    "hendrycksTest-anatomy": 1,
+    "hendrycksTest-astronomy": 1,
+    "hendrycksTest-business_ethics": 1,
+    "hendrycksTest-clinical_knowledge": 1,
+    "hendrycksTest-college_biology": 1,
+    "hendrycksTest-college_chemistry": 1,
+    "hendrycksTest-college_computer_science": 1,
+    "hendrycksTest-college_mathematics": 1,
+    "hendrycksTest-college_medicine": 1,
+    "hendrycksTest-college_physics": 1,
+    "hendrycksTest-computer_security": 1,
+    "hendrycksTest-conceptual_physics": 1,
+    "hendrycksTest-econometrics": 1,
+    "hendrycksTest-electrical_engineering": 1,
+    "hendrycksTest-elementary_mathematics": 1,
+    "hendrycksTest-formal_logic": 1,
+    "hendrycksTest-global_facts": 1,
+    "hendrycksTest-high_school_biology": 1,
+    "hendrycksTest-high_school_chemistry": 1,
+    "hendrycksTest-high_school_computer_science": 1,
+    "hendrycksTest-high_school_european_history": 1,
+    "hendrycksTest-high_school_geography": 1,
+    "hendrycksTest-high_school_government_and_politics": 1,
+    "hendrycksTest-high_school_macroeconomics": 1,
+    "hendrycksTest-high_school_mathematics": 1,
+    "hendrycksTest-high_school_microeconomics": 1,
+    "hendrycksTest-high_school_physics": 1,
+    "hendrycksTest-high_school_psychology": 1,
+    "hendrycksTest-high_school_statistics": 1,
+    "hendrycksTest-high_school_us_history": 1,
+    "hendrycksTest-high_school_world_history": 1,
+    "hendrycksTest-human_aging": 1,
+    "hendrycksTest-human_sexuality": 1,
+    "hendrycksTest-international_law": 1,
+    "hendrycksTest-jurisprudence": 1,
+    "hendrycksTest-logical_fallacies": 1,
+    "hendrycksTest-machine_learning": 1,
+    "hendrycksTest-management": 1,
+    "hendrycksTest-marketing": 1,
+    "hendrycksTest-medical_genetics": 1,
+    "hendrycksTest-miscellaneous": 1,
+    "hendrycksTest-moral_disputes": 1,
+    "hendrycksTest-moral_scenarios": 1,
+    "hendrycksTest-nutrition": 1,
+    "hendrycksTest-philosophy": 1,
+    "hendrycksTest-prehistory": 1,
+    "hendrycksTest-professional_accounting": 1,
+    "hendrycksTest-professional_law": 1,
+    "hendrycksTest-professional_medicine": 1,
+    "hendrycksTest-professional_psychology": 1,
+    "hendrycksTest-public_relations": 1,
+    "hendrycksTest-security_studies": 1,
+    "hendrycksTest-sociology": 1,
+    "hendrycksTest-us_foreign_policy": 1,
+    "hendrycksTest-virology": 1,
+    "hendrycksTest-world_religions": 1
+  },
+  "config": {
+    "model": "hf-causal-experimental",
+    "model_args": "pretrained=/home/vmagent/app/data/Llama-2-7b-hf,peft=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal,use_accelerate=True,delta=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal/best_model_structure.txt",
+    "num_fewshot": 5,
+    "batch_size": "auto",
+    "batch_sizes": [
+      8
+    ],
+    "device": null,
+    "no_cache": false,
+    "limit": null,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}

llama2-7b-delta-truthqa ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "results": {
+    "truthfulqa_mc": {
+      "mc1": 0.3084455324357405,
+      "mc1_stderr": 0.01616803938315687,
+      "mc2": 0.45625480379943195,
+      "mc2_stderr": 0.014763037659441128
+    }
+  },
+  "versions": {
+    "truthfulqa_mc": 1
+  },
+  "config": {
+    "model": "hf-causal-experimental",
+    "model_args": "pretrained=/home/vmagent/app/data/Llama-2-7b-hf,peft=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal,use_accelerate=True,delta=/home/vmagent/app/data/llama-2-delta-tune-model-div-sal/best_model_structure.txt",
+    "num_fewshot": 0,
+    "batch_size": "auto",
+    "batch_sizes": [
+      32
+    ],
+    "device": null,
+    "no_cache": false,
+    "limit": null,
+    "bootstrap_iters": 100000,
+    "description_dict": {}
+  }
+}