Update README.md
Browse files
README.md
CHANGED
|
@@ -94,7 +94,7 @@ from transformers import AutoConfig, AutoModelForCausalLM
|
|
| 94 |
repo_name = "nvidia/Nemotron-Flash-3B-Instruct"
|
| 95 |
|
| 96 |
config = AutoConfig.from_pretrained(repo_name, trust_remote_code=True)
|
| 97 |
-
setattr(config, "
|
| 98 |
model = AutoModelForCausalLM.from_pretrained(repo_name, config=config, torch_dtype=torch.bfloat16, trust_remote_code=True)
|
| 99 |
```
|
| 100 |
|
|
|
|
| 94 |
repo_name = "nvidia/Nemotron-Flash-3B-Instruct"
|
| 95 |
|
| 96 |
config = AutoConfig.from_pretrained(repo_name, trust_remote_code=True)
|
| 97 |
+
setattr(config, "attn_implementation_new", "flash_attention_2")
|
| 98 |
model = AutoModelForCausalLM.from_pretrained(repo_name, config=config, torch_dtype=torch.bfloat16, trust_remote_code=True)
|
| 99 |
```
|
| 100 |
|