darwinkernelpanic committed on
Commit
0a0a218
·
verified ·
1 Parent(s): e7e1fc5

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +5 -0
README.md CHANGED
@@ -41,6 +41,7 @@ Unlike autoregressive models, DiffReaper-5 generates the entire response in para
41
  ```python
42
  import torch
43
  import torch.nn.functional as F
 
44
 
45
  def generate(model, tokenizer, prompt, steps=10):
46
  model.eval()
@@ -62,6 +63,10 @@ def generate(model, tokenizer, prompt, steps=10):
62
  norm_r = F.normalize(r_noise, dim=-1)
63
  logits = torch.matmul(norm_r, norm_weights.T)
64
  return tokenizer.decode(torch.argmax(logits, dim=-1)[0])
 
 
 
 
65
  ```
66
 
67
  ## 🎯 Fine-tuning
 
41
  ```python
42
  import torch
43
  import torch.nn.functional as F
44
+ # Assuming DiffReaperModel is defined as per train_autogrow.py
45
 
46
  def generate(model, tokenizer, prompt, steps=10):
47
  model.eval()
 
63
  norm_r = F.normalize(r_noise, dim=-1)
64
  logits = torch.matmul(norm_r, norm_weights.T)
65
  return tokenizer.decode(torch.argmax(logits, dim=-1)[0])
66
+
67
+ # --- Loading Example ---
68
+ # model = DiffReaperModel(vocab_size=50257, n_embd=1024, n_head=16, n_layer=12).to("cuda")
69
+ # model.load_state_dict(torch.load("cropmark_latest.pt"))
70
  ```
71
 
72
  ## 🎯 Fine-tuning