Instructions to use bryanmildort/gpt_neo_notes with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use bryanmildort/gpt_neo_notes with Transformers:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="bryanmildort/gpt_neo_notes")

# Load model directly
from transformers import AutoTokenizer, AutoModelForCausalLM

tokenizer = AutoTokenizer.from_pretrained("bryanmildort/gpt_neo_notes")
model = AutoModelForCausalLM.from_pretrained("bryanmildort/gpt_neo_notes")
- Notebooks
- Google Colab
- Kaggle
- Local Apps Settings
- vLLM
How to use bryanmildort/gpt_neo_notes with vLLM:
Install from pip and serve model
# Install vLLM from pip:
pip install vllm
# Start the vLLM server:
vllm serve "bryanmildort/gpt_neo_notes"
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "bryanmildort/gpt_neo_notes",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
Use Docker
docker model run hf.co/bryanmildort/gpt_neo_notes
- SGLang
How to use bryanmildort/gpt_neo_notes with SGLang:
Install from pip and serve model
# Install SGLang from pip:
pip install sglang
# Start the SGLang server:
python3 -m sglang.launch_server \
  --model-path "bryanmildort/gpt_neo_notes" \
  --host 0.0.0.0 \
  --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "bryanmildort/gpt_neo_notes",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
Use Docker images
docker run --gpus all \
  --shm-size 32g \
  -p 30000:30000 \
  -v ~/.cache/huggingface:/root/.cache/huggingface \
  --env "HF_TOKEN=<secret>" \
  --ipc=host \
  lmsysorg/sglang:latest \
  python3 -m sglang.launch_server \
    --model-path "bryanmildort/gpt_neo_notes" \
    --host 0.0.0.0 \
    --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "bryanmildort/gpt_neo_notes",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
- Docker Model Runner
How to use bryanmildort/gpt_neo_notes with Docker Model Runner:
docker model run hf.co/bryanmildort/gpt_neo_notes
Commit ·
a07eb96
1
Parent(s): d311cdf
Upload 9 files
Browse files
- config.json +2 -2
- generation_config.json +1 -1
- pytorch_model-00001-of-00002.bin +2 -2
- pytorch_model-00002-of-00002.bin +2 -2
- pytorch_model.bin.index.json +7 -7
- training_args.bin +2 -2
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"activation_function": "gelu_new",
|
| 4 |
"architectures": [
|
| 5 |
"GPTNeoForCausalLM"
|
|
@@ -75,7 +75,7 @@
|
|
| 75 |
},
|
| 76 |
"tokenizer_class": "GPT2Tokenizer",
|
| 77 |
"torch_dtype": "float32",
|
| 78 |
-
"transformers_version": "4.
|
| 79 |
"use_cache": true,
|
| 80 |
"vocab_size": 50258,
|
| 81 |
"window_size": 256
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "./notes-nlp/gpt_neo_notes_pre",
|
| 3 |
"activation_function": "gelu_new",
|
| 4 |
"architectures": [
|
| 5 |
"GPTNeoForCausalLM"
|
|
|
|
| 75 |
},
|
| 76 |
"tokenizer_class": "GPT2Tokenizer",
|
| 77 |
"torch_dtype": "float32",
|
| 78 |
+
"transformers_version": "4.27.2",
|
| 79 |
"use_cache": true,
|
| 80 |
"vocab_size": 50258,
|
| 81 |
"window_size": 256
|
generation_config.json
CHANGED
|
@@ -2,5 +2,5 @@
|
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 50256,
|
| 4 |
"eos_token_id": 50256,
|
| 5 |
-
"transformers_version": "4.
|
| 6 |
}
|
|
|
|
| 2 |
"_from_model_config": true,
|
| 3 |
"bos_token_id": 50256,
|
| 4 |
"eos_token_id": 50256,
|
| 5 |
+
"transformers_version": "4.27.2"
|
| 6 |
}
|
pytorch_model-00001-of-00002.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8998bd59cf93fe14a866d72a521e63f67ed1b6727bc70496bb4e76fde1ceb84
|
| 3 |
+
size 10106068835
|
pytorch_model-00002-of-00002.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82cd5c78a022746235382eef2800dd18a0eb542f230d7abb6d17bead95c937a2
|
| 3 |
+
size 633553991
|
pytorch_model.bin.index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_size":
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"transformer.h.0.attn.attention.bias": "pytorch_model-00001-of-00002.bin",
|
|
@@ -346,8 +346,8 @@
|
|
| 346 |
"transformer.h.29.ln_2.weight": "pytorch_model-00001-of-00002.bin",
|
| 347 |
"transformer.h.29.mlp.c_fc.bias": "pytorch_model-00001-of-00002.bin",
|
| 348 |
"transformer.h.29.mlp.c_fc.weight": "pytorch_model-00001-of-00002.bin",
|
| 349 |
-
"transformer.h.29.mlp.c_proj.bias": "pytorch_model-
|
| 350 |
-
"transformer.h.29.mlp.c_proj.weight": "pytorch_model-
|
| 351 |
"transformer.h.3.attn.attention.bias": "pytorch_model-00001-of-00002.bin",
|
| 352 |
"transformer.h.3.attn.attention.k_proj.weight": "pytorch_model-00001-of-00002.bin",
|
| 353 |
"transformer.h.3.attn.attention.masked_bias": "pytorch_model-00001-of-00002.bin",
|
|
@@ -363,15 +363,15 @@
|
|
| 363 |
"transformer.h.3.mlp.c_fc.weight": "pytorch_model-00001-of-00002.bin",
|
| 364 |
"transformer.h.3.mlp.c_proj.bias": "pytorch_model-00001-of-00002.bin",
|
| 365 |
"transformer.h.3.mlp.c_proj.weight": "pytorch_model-00001-of-00002.bin",
|
| 366 |
-
"transformer.h.30.attn.attention.bias": "pytorch_model-
|
| 367 |
"transformer.h.30.attn.attention.k_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 368 |
-
"transformer.h.30.attn.attention.masked_bias": "pytorch_model-
|
| 369 |
"transformer.h.30.attn.attention.out_proj.bias": "pytorch_model-00002-of-00002.bin",
|
| 370 |
"transformer.h.30.attn.attention.out_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 371 |
"transformer.h.30.attn.attention.q_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 372 |
"transformer.h.30.attn.attention.v_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 373 |
-
"transformer.h.30.ln_1.bias": "pytorch_model-
|
| 374 |
-
"transformer.h.30.ln_1.weight": "pytorch_model-
|
| 375 |
"transformer.h.30.ln_2.bias": "pytorch_model-00002-of-00002.bin",
|
| 376 |
"transformer.h.30.ln_2.weight": "pytorch_model-00002-of-00002.bin",
|
| 377 |
"transformer.h.30.mlp.c_fc.bias": "pytorch_model-00002-of-00002.bin",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_size": 10622017664.0
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"transformer.h.0.attn.attention.bias": "pytorch_model-00001-of-00002.bin",
|
|
|
|
| 346 |
"transformer.h.29.ln_2.weight": "pytorch_model-00001-of-00002.bin",
|
| 347 |
"transformer.h.29.mlp.c_fc.bias": "pytorch_model-00001-of-00002.bin",
|
| 348 |
"transformer.h.29.mlp.c_fc.weight": "pytorch_model-00001-of-00002.bin",
|
| 349 |
+
"transformer.h.29.mlp.c_proj.bias": "pytorch_model-00001-of-00002.bin",
|
| 350 |
+
"transformer.h.29.mlp.c_proj.weight": "pytorch_model-00001-of-00002.bin",
|
| 351 |
"transformer.h.3.attn.attention.bias": "pytorch_model-00001-of-00002.bin",
|
| 352 |
"transformer.h.3.attn.attention.k_proj.weight": "pytorch_model-00001-of-00002.bin",
|
| 353 |
"transformer.h.3.attn.attention.masked_bias": "pytorch_model-00001-of-00002.bin",
|
|
|
|
| 363 |
"transformer.h.3.mlp.c_fc.weight": "pytorch_model-00001-of-00002.bin",
|
| 364 |
"transformer.h.3.mlp.c_proj.bias": "pytorch_model-00001-of-00002.bin",
|
| 365 |
"transformer.h.3.mlp.c_proj.weight": "pytorch_model-00001-of-00002.bin",
|
| 366 |
+
"transformer.h.30.attn.attention.bias": "pytorch_model-00001-of-00002.bin",
|
| 367 |
"transformer.h.30.attn.attention.k_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 368 |
+
"transformer.h.30.attn.attention.masked_bias": "pytorch_model-00001-of-00002.bin",
|
| 369 |
"transformer.h.30.attn.attention.out_proj.bias": "pytorch_model-00002-of-00002.bin",
|
| 370 |
"transformer.h.30.attn.attention.out_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 371 |
"transformer.h.30.attn.attention.q_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 372 |
"transformer.h.30.attn.attention.v_proj.weight": "pytorch_model-00002-of-00002.bin",
|
| 373 |
+
"transformer.h.30.ln_1.bias": "pytorch_model-00001-of-00002.bin",
|
| 374 |
+
"transformer.h.30.ln_1.weight": "pytorch_model-00001-of-00002.bin",
|
| 375 |
"transformer.h.30.ln_2.bias": "pytorch_model-00002-of-00002.bin",
|
| 376 |
"transformer.h.30.ln_2.weight": "pytorch_model-00002-of-00002.bin",
|
| 377 |
"transformer.h.30.mlp.c_fc.bias": "pytorch_model-00002-of-00002.bin",
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1366c71c60e969557fe221b2103dac00c9b4c2153c6081f264bda847cd37c95
|
| 3 |
+
size 3515
|