Adding `safetensors` variant of this model

#5
by SFconvertbot - opened
Files changed (5)
  1. README.md +42 -15
  2. config.json +2 -2
  3. generation_config.json +1 -1
  4. pytorch_model.bin +2 -2
  5. rust_model.ot +3 -0
README.md CHANGED
@@ -5,19 +5,46 @@ language:
5
  tags:
6
  - generation
7
  license: apache-2.0
8
- ---
9
-
10
- Pretrained GPT2 with expanded n_ctx up to 2048(also with expanded embedding dimension to 1536) in Korean.
11
- # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
12
- Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_psyche__kogpt)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
 
14
- | Metric | Value |
15
- |-----------------------|---------------------------|
16
- | Avg. | 24.27 |
17
- | ARC (25-shot) | 21.16 |
18
- | HellaSwag (10-shot) | 28.11 |
19
- | MMLU (5-shot) | 26.56 |
20
- | TruthfulQA (0-shot) | 42.06 |
21
- | Winogrande (5-shot) | 49.09 |
22
- | GSM8K (5-shot) | 0.0 |
23
- | DROP (3-shot) | 2.89 |
 
 
5
  tags:
6
  - generation
7
  license: apache-2.0
8
+ model-index:
9
+ - name: task_1
10
+ results:
11
+ - task:
12
+ type: natural-language-generation
13
+ dataset:
14
+ type: hellaswag
15
+ name: hellaswag(10 shots)
16
+ metrics:
17
+ - type: acc_norm
18
+ value: 27.7
19
+ - name: task_2
20
+ results:
21
+ - task:
22
+ type: natural-language-generation
23
+ dataset:
24
+ type: ARC
25
+ name: ARC(25 shots)
26
+ metrics:
27
+ - type: acc_norm
28
+ value: 23.8
29
+ - name: task_3
30
+ results:
31
+ - task:
32
+ type: natural-language-generation
33
+ dataset:
34
+ type: MMLU
35
+ name: MMLU(5 shots)
36
+ metrics:
37
+ - type: acc
38
+ value: 24.9
39
 
40
+ - name: task_4
41
+ results:
42
+ - task:
43
+ type: natural-language-generation
44
+ dataset:
45
+ type: TruthfulQA
46
+ name: TruthfulQA(0 shots)
47
+ metrics:
48
+ - type: mc2
49
+ value: 46.5
50
+ ---
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "psyche/kogpt",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -33,7 +33,7 @@
33
  }
34
  },
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.31.0",
37
  "use_cache": true,
38
  "vocab_size": 32002
39
  }
 
1
  {
2
+ "_name_or_path": "runs/checkpoint-47500",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
33
  }
34
  },
35
  "torch_dtype": "float32",
36
+ "transformers_version": "4.30.2",
37
  "use_cache": true,
38
  "vocab_size": 32002
39
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
- "transformers_version": "4.31.0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.30.2"
6
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bb7be5d1b9b55633082dd466d75a8f6028b02bfa2255a430cdb6b63a3ac1e6d
3
- size 1569174365
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6174fe3c21d632e922a498fd5d347893add6efd757af0c3f7c316d9e78040346
3
+ size 891699345
rust_model.ot ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80d7e388967e4b2a2cb00047bc0cc7751fbe6249dd09a18f5e16bee8e62db61
3
+ size 1817336536