Add base model card (text-completion; no reasoning/tool-calling) + LICENSE.md

#2
by joerowell - opened
Files changed (2)
  1. README.md +2 -7
  2. config.json +2 -2
README.md CHANGED
@@ -7,7 +7,6 @@ extra_gated_description: >-
7
  tags:
8
  - laguna-m.1
9
  - vllm
10
- - sglang
11
  - bf16
12
  - moe
13
  license: apache-2.0
@@ -87,10 +86,6 @@ completion = client.completions.create(
87
  print(completion.choices[0].text)
88
  ```
89
 
90
- ### SGLang
91
-
92
- Laguna M.1-base is supported in SGLang via [sgl-project/sglang#28400](https://github.com/sgl-project/sglang/pull/28400). As a completion model, serve it without the reasoning/tool-call parsers. A full serving recipe will be added here.
93
-
94
  ### Transformers
95
 
96
  Laguna is supported in Transformers `v5.7.0` and later ([huggingface/transformers#45673](https://github.com/huggingface/transformers/pull/45673)).
@@ -116,8 +111,8 @@ print(tokenizer.decode(outputs[0], skip_special_tokens=True))
116
 
117
  This model is licensed under the [Apache 2.0 License](https://huggingface.co/poolside/Laguna-M.1-base/blob/main/LICENSE.md).
118
 
119
- ## Intended and Responsible Use
120
 
121
- Laguna M.1 is designed for software engineering and agentic coding use cases, and you are responsible for confirming that it is appropriate for your intended application. Laguna M.1 is subject to the [Apache 2.0 License](https://huggingface.co/poolside/Laguna-M.1/blob/main/LICENSE.md), and should be used consistently with Poolside's [Acceptable Use Policy](https://poolside.ai/legal/acceptable-use-policy). We advise against circumventing Laguna M.1 safety guardrails without implementing substantially equivalent mitigations appropriate for your use case.
122
 
123
  Please report security vulnerabilities or safety concerns to [security@poolside.ai](mailto:security@poolside.ai).
 
7
  tags:
8
  - laguna-m.1
9
  - vllm
 
10
  - bf16
11
  - moe
12
  license: apache-2.0
 
86
  print(completion.choices[0].text)
87
  ```
88
 
 
 
 
 
89
  ### Transformers
90
 
91
  Laguna is supported in Transformers `v5.7.0` and later ([huggingface/transformers#45673](https://github.com/huggingface/transformers/pull/45673)).
 
111
 
112
  This model is licensed under the [Apache 2.0 License](https://huggingface.co/poolside/Laguna-M.1-base/blob/main/LICENSE.md).
113
 
114
+ ## Intended and Responsible Use
115
 
116
+ Laguna M.1-base is a base (pre-instruct) model intended for research and as a starting point for further training; you are responsible for confirming that it is appropriate for your intended application. It is subject to the [Apache 2.0 License](https://huggingface.co/poolside/Laguna-M.1-base/blob/main/LICENSE.md), and should be used in accordance with Poolside's [Acceptable Use Policy](https://poolside.ai/legal/acceptable-use-policy). As a base model without post-training, it has not undergone safety tuning; apply appropriate mitigations for your use case.
117
 
118
  Please report security vulnerabilities or safety concerns to [security@poolside.ai](mailto:security@poolside.ai).
config.json CHANGED
@@ -14,7 +14,7 @@
14
  "num_attention_heads": 64,
15
  "num_key_value_heads": 8,
16
  "head_dim": 128,
17
- "max_position_embeddings": 262144,
18
  "attention_bias": false,
19
  "attention_dropout": 0.0,
20
  "rms_norm_eps": 1e-06,
@@ -45,7 +45,7 @@
45
  "full_attention": {
46
  "rope_theta": 500000.0,
47
  "rope_type": "yarn",
48
- "factor": 64.0,
49
  "original_max_position_embeddings": 4096,
50
  "beta_slow": 1.0,
51
  "beta_fast": 64.0,
 
14
  "num_attention_heads": 64,
15
  "num_key_value_heads": 8,
16
  "head_dim": 128,
17
+ "max_position_embeddings": 131072,
18
  "attention_bias": false,
19
  "attention_dropout": 0.0,
20
  "rms_norm_eps": 1e-06,
 
45
  "full_attention": {
46
  "rope_theta": 500000.0,
47
  "rope_type": "yarn",
48
+ "factor": 32.0,
49
  "original_max_position_embeddings": 4096,
50
  "beta_slow": 1.0,
51
  "beta_fast": 64.0,