marius-baseten committed on
Commit
ce12321
·
verified ·
1 Parent(s): a0a5af4

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.json +3 -3
  2. gpt_float16_tp1_rank0.engine +2 -2
config.json CHANGED
@@ -6,12 +6,12 @@
6
  "hidden_size": 768,
7
  "int8": false,
8
  "lora_target_modules": null,
9
- "max_batch_size": 16,
10
  "max_beam_width": 1,
11
  "max_draft_len": 0,
12
- "max_input_len": 512,
13
  "max_num_tokens": null,
14
- "max_output_len": 200,
15
  "max_position_embeddings": 1024,
16
  "max_prompt_embedding_table_size": 0,
17
  "name": "gpt",
 
6
  "hidden_size": 768,
7
  "int8": false,
8
  "lora_target_modules": null,
9
+ "max_batch_size": 32,
10
  "max_beam_width": 1,
11
  "max_draft_len": 0,
12
+ "max_input_len": 1024,
13
  "max_num_tokens": null,
14
+ "max_output_len": 2048,
15
  "max_position_embeddings": 1024,
16
  "max_prompt_embedding_table_size": 0,
17
  "name": "gpt",
gpt_float16_tp1_rank0.engine CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f92cab6ffe048accc1475d3187147c664daa820d31c09fa42e8c0fc54f1a5dc3
3
- size 328056100
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50ffa47bfbe312d8d243e97995a83e0494c312d03d0ba18dd2577b7b9a684e24
3
+ size 328061308