yagizdevre committed on
Commit
1f5f496
·
1 Parent(s): 43bd63d
__pycache__/configuration_ministu.cpython-312.pyc CHANGED
Binary files a/__pycache__/configuration_ministu.cpython-312.pyc and b/__pycache__/configuration_ministu.cpython-312.pyc differ
 
layers.py CHANGED
@@ -57,6 +57,7 @@ class STULayer(nn.Module):
57
 
58
  # Normalize and apply STU
59
  x_normed = self.stu_norm(x).to(dtype=self.stu.M_inputs.dtype) # Match dtype for STU
 
60
  x_stu = self.stu(x_normed).to(dtype=x.dtype) # Ensure output matches `x`'s dtype
61
  x = x + x_stu
62
 
 
57
 
58
  # Normalize and apply STU
59
  x_normed = self.stu_norm(x).to(dtype=self.stu.M_inputs.dtype) # Match dtype for STU
60
+ print(f"x dtype: {x.dtype}")
61
  x_stu = self.stu(x_normed).to(dtype=x.dtype) # Ensure output matches `x`'s dtype
62
  x = x + x_stu
63