Adding `safetensors` variant of this model

#4
by psyche - opened
Files changed (5)
  1. README.md +0 -23
  2. config.json +2 -2
  3. generation_config.json +1 -1
  4. pytorch_model.bin +2 -2
  5. rust_model.ot +3 -0
README.md DELETED
@@ -1,23 +0,0 @@
1
- ---
2
- language:
3
- - en
4
- - ko
5
- tags:
6
- - generation
7
- license: apache-2.0
8
- ---
9
-
10
- Pretrained Korean GPT-2 with the context length (n_ctx) expanded to 2048 and the embedding dimension expanded to 1536.
11
- # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
12
- Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_psyche__kogpt)
13
-
14
- | Metric | Value |
15
- |-----------------------|---------------------------|
16
- | Avg. | 24.27 |
17
- | ARC (25-shot) | 21.16 |
18
- | HellaSwag (10-shot) | 28.11 |
19
- | MMLU (5-shot) | 26.56 |
20
- | TruthfulQA (0-shot) | 42.06 |
21
- | Winogrande (5-shot) | 49.09 |
22
- | GSM8K (5-shot) | 0.0 |
23
- | DROP (3-shot) | 2.89 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "psyche/kogpt",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -33,7 +33,7 @@
33
  }
34
  },
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.31.0",
37
  "use_cache": true,
38
  "vocab_size": 32002
39
  }
 
1
  {
2
+ "_name_or_path": "runs/checkpoint-66000",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
33
  }
34
  },
35
  "torch_dtype": "float32",
36
+ "transformers_version": "4.30.2",
37
  "use_cache": true,
38
  "vocab_size": 32002
39
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
- "transformers_version": "4.31.0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.30.2"
6
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bb7be5d1b9b55633082dd466d75a8f6028b02bfa2255a430cdb6b63a3ac1e6d
3
- size 1569174365
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6174fe3c21d632e922a498fd5d347893add6efd757af0c3f7c316d9e78040346
3
+ size 891699345
rust_model.ot ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80d7e388967e4b2a2cb00047bc0cc7751fbe6249dd09a18f5e16bee8e62db61
3
+ size 1817336536