Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
|
@@ -41,6 +41,7 @@ Unlike autoregressive models, DiffReaper-5 generates the entire response in para
|
|
| 41 |
```python
|
| 42 |
import torch
|
| 43 |
import torch.nn.functional as F
|
|
|
|
| 44 |
|
| 45 |
def generate(model, tokenizer, prompt, steps=10):
|
| 46 |
model.eval()
|
|
@@ -62,6 +63,10 @@ def generate(model, tokenizer, prompt, steps=10):
|
|
| 62 |
norm_r = F.normalize(r_noise, dim=-1)
|
| 63 |
logits = torch.matmul(norm_r, norm_weights.T)
|
| 64 |
return tokenizer.decode(torch.argmax(logits, dim=-1)[0])
|
|
|
|
|
|
|
|
|
|
|
|
|
| 65 |
```
|
| 66 |
|
| 67 |
## 🎯 Fine-tuning
|
|
|
|
| 41 |
```python
|
| 42 |
import torch
|
| 43 |
import torch.nn.functional as F
|
| 44 |
+
# Assuming DiffReaperModel is defined as per train_autogrow.py
|
| 45 |
|
| 46 |
def generate(model, tokenizer, prompt, steps=10):
|
| 47 |
model.eval()
|
|
|
|
| 63 |
norm_r = F.normalize(r_noise, dim=-1)
|
| 64 |
logits = torch.matmul(norm_r, norm_weights.T)
|
| 65 |
return tokenizer.decode(torch.argmax(logits, dim=-1)[0])
|
| 66 |
+
|
| 67 |
+
# --- Loading Example ---
|
| 68 |
+
# model = DiffReaperModel(vocab_size=50257, n_embd=1024, n_head=16, n_layer=12).to("cuda")
|
| 69 |
+
# model.load_state_dict(torch.load("cropmark_latest.pt"))
|
| 70 |
```
|
| 71 |
|
| 72 |
## 🎯 Fine-tuning
|