Update lora_w2w.py
Browse files
- lora_w2w.py +2 -1
lora_w2w.py
CHANGED
|
@@ -83,7 +83,7 @@ class LoRAModule(nn.Module):
|
|
| 83 |
alpha = alpha.detach().numpy()
|
| 84 |
alpha = lora_dim if alpha is None or alpha == 0 else alpha
|
| 85 |
self.scale = alpha / self.lora_dim
|
| 86 |
-
|
| 87 |
|
| 88 |
|
| 89 |
self.multiplier = multiplier
|
|
@@ -96,6 +96,7 @@ class LoRAModule(nn.Module):
|
|
| 96 |
|
| 97 |
def forward(self, x):
    """Return the wrapped layer's output plus the scaled LoRA branch.

    The LoRA branch is ``(x @ down.T) @ up * multiplier * scale``, where
    ``down`` and ``up`` are rebuilt on every call from ``self.proj`` as
    ``(proj @ v.T) * std + mean``.

    Args:
        x: Input handed to ``self.org_forward`` and to the LoRA branch.
            NOTE(review): presumably a torch tensor whose last dimension
            matches the down factor -- confirm against the caller.

    Returns:
        ``self.org_forward(x)`` plus the LoRA branch output.
    """
    # Run the wrapped layer once and reuse the result for both the dtype
    # trace and the sum; the earlier code invoked it twice per call.
    base = self.org_forward(x)
    print(base.dtype)

    down = (self.proj @ self.v1.T) * self.std1 + self.mean1
    up = (self.proj @ self.v2.T) * self.std2 + self.mean2
    # `@` and `*` share precedence and associate left to right, so this is
    # ((x @ down.T) @ up) * multiplier * scale, exactly as before.
    return base + x @ down.T @ up * self.multiplier * self.scale
|
|
|
|
| 83 |
alpha = alpha.detach().numpy()
|
| 84 |
alpha = lora_dim if alpha is None or alpha == 0 else alpha
|
| 85 |
self.scale = alpha / self.lora_dim
|
| 86 |
+
self.scale = self.scale.bfloat16()
|
| 87 |
|
| 88 |
|
| 89 |
self.multiplier = multiplier
|
|
|
|
| 96 |
|
| 97 |
def forward(self, x):
    """Return the wrapped layer's output plus the scaled LoRA branch.

    The LoRA branch is ``(x @ down.T) @ up * multiplier * scale``, where
    ``down`` and ``up`` are rebuilt on every call from ``self.proj`` as
    ``(proj @ v.T) * std + mean``. The dtype of the wrapped layer's output
    and of the down-projected activations is printed on every call.

    Args:
        x: Input handed to ``self.org_forward`` and to the LoRA branch.
            NOTE(review): presumably a torch tensor whose last dimension
            matches the down factor -- confirm against the caller.

    Returns:
        ``self.org_forward(x)`` plus the LoRA branch output.
    """
    # Run the wrapped layer once and reuse the result for both the dtype
    # trace and the sum; the earlier code invoked it twice per call.
    base = self.org_forward(x)
    print(base.dtype)

    # Likewise compute the down projection once instead of once for the
    # trace and again for the returned value.
    down = (self.proj @ self.v1.T) * self.std1 + self.mean1
    hidden = x @ down.T
    print(hidden.dtype)

    up = (self.proj @ self.v2.T) * self.std2 + self.mean2
    # `@` and `*` share precedence and associate left to right, so this is
    # (hidden @ up) * multiplier * scale, exactly as before.
    return base + hidden @ up * self.multiplier * self.scale
|