Maxtimer97 committed on
Commit
3d4c21e
·
1 Parent(s): bdf9fdc

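Corrected device assignment error: allocate the leading zero of cmp_seqlens on y_seqlens.device instead of the hard-coded "cuda" device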

Browse files
Files changed (1) hide show
  1. modeling_chatglm.py +1 -1
modeling_chatglm.py CHANGED
@@ -505,7 +505,7 @@ class NativeSparseAttention(CoreAttention):
505
  y_seqlens[seqlens < self.kernel_size] = 0
506
  cmp_seqlens = torch.cat(
507
  [
508
- torch.zeros(1, dtype=torch.int32, device="cuda"),
509
  torch.cumsum(y_seqlens, dim=0),
510
  ],
511
  dim=0,
 
505
  y_seqlens[seqlens < self.kernel_size] = 0
506
  cmp_seqlens = torch.cat(
507
  [
508
+ torch.zeros(1, dtype=torch.int32, device=y_seqlens.device),
509
  torch.cumsum(y_seqlens, dim=0),
510
  ],
511
  dim=0,