Sharathhebbar24
/

math_gpt2_sft

Text Generation

Eval Results (legacy)

text-generation-inference

Model card · Files and versions

Sharathhebbar24 committed on Apr 5, 2024

Commit

d54f3a8

·

verified ·

1 Parent(s): ad5ba78

Upload model

Files changed (4) hide show

README.md +2 -0
config.json +3 -3
generation_config.json +1 -1
model.safetensors +2 -2

README.md CHANGED Viewed

@@ -6,6 +6,8 @@ tags:
 - maths
 - gpt2
 - mathgpt2
 datasets:
 - meta-math/MetaMathQA
 - ArtifactAI/arxiv-math-instruct-50k

 - maths
 - gpt2
 - mathgpt2
+- trl
+- sft
 datasets:
 - meta-math/MetaMathQA
 - ArtifactAI/arxiv-math-instruct-50k

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "Sharathhebbar24/math_gpt2_sft",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
@@ -32,8 +32,8 @@
       "max_length": 50
     }
   },
-  "torch_dtype": "float16",
-  "transformers_version": "4.35.2",
   "use_cache": true,
   "vocab_size": 50257
 }

 {
+  "_name_or_path": "Sharathhebbar24/math_gpt2",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
       "max_length": 50
     }
   },
+  "torch_dtype": "float32",
+  "transformers_version": "4.39.3",
   "use_cache": true,
   "vocab_size": 50257
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.35.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.39.3"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5fd424652f5ad4f8d0256006df54b8fbcef86faca0ad50b6a5936fbdcf060099
-size 248894512

 version https://git-lfs.github.com/spec/v1
+oid sha256:76e4cb5e488f9e194cf936ccea0fa8fdbb2fc45f19a6bf7d05526f744c96146a
+size 497774208