Adding `safetensors` variant of this model

by SFconvertbot - opened Jul 31, 2023

←

Files changed (3) hide show

README.md CHANGED Viewed

@@ -5,19 +5,46 @@ language:
 tags:
   - generation
 license: apache-2.0
----
-Pretrained GPT2 with expanded n_ctx up to 2048(also with expanded embedding dimension to 1536) in Korean.
-# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
-Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_psyche__kogpt)
-| Metric                | Value                     |
-|-----------------------|---------------------------|
-| Avg.                  | 24.27   |
-| ARC (25-shot)         | 21.16          |
-| HellaSwag (10-shot)   | 28.11    |
-| MMLU (5-shot)         | 26.56         |
-| TruthfulQA (0-shot)   | 42.06   |
-| Winogrande (5-shot)   | 49.09   |
-| GSM8K (5-shot)        | 0.0        |
-| DROP (3-shot)         | 2.89         |

 tags:
   - generation
 license: apache-2.0
+model-index:
+  - name: task_1
+    results:
+      - task:
+          type: natural-language-generation
+        dataset:
+          type: hellaswag
+          name: hellaswag(10 shots)
+        metrics:
+          - type: acc_norm
+            value: 27.7
+  - name: task_2
+    results:
+      - task:
+          type: natural-language-generation
+        dataset:
+          type: ARC
+          name: ARC(25 shots)
+        metrics:
+          - type: acc_norm
+            value: 23.8
+  - name: task_3
+    results:
+      - task:
+          type: natural-language-generation
+        dataset:
+          type: MMLU
+          name: MMLU(5 shots)
+        metrics:
+          - type: acc
+            value: 24.9
+  - name: task_4
+    results:
+      - task:
+          type: natural-language-generation
+        dataset:
+          type: TruthfulQA
+          name: TruthfulQA(0 shots)
+        metrics:
+          - type: mc2
+            value: 46.5
+---

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "psyche/kogpt",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

 {
+  "_name_or_path": "runs/checkpoint-100000",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"

model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a97b23bfa8be7ce6e1cf0eaeee05774361fd096c6d057fc7d1bf653b098150dd
-size 1569143832