zai-org
/

chatglm2-6b

Model card Files Files and versions

duzx16 commited on Jul 5, 2023

Commit

0ecfe0b

·

1 Parent(s): 31d45da

Fix prefix projection

Files changed (1) hide show

modeling_chatglm.py +4 -3

modeling_chatglm.py CHANGED Viewed

@@ -68,11 +68,12 @@ class PrefixEncoder(torch.nn.Module):
         self.prefix_projection = config.prefix_projection
         if self.prefix_projection:
             # Use a two-layer MLP to encode the prefix
-            self.embedding = torch.nn.Embedding(config.pre_seq_len, config.hidden_size)
             self.trans = torch.nn.Sequential(
-                torch.nn.Linear(config.hidden_size, config.hidden_size),
                 torch.nn.Tanh(),
-                torch.nn.Linear(config.hidden_size, config.num_layers * config.hidden_size * 2)
             )
         else:
             self.embedding = torch.nn.Embedding(config.pre_seq_len,

         self.prefix_projection = config.prefix_projection
         if self.prefix_projection:
             # Use a two-layer MLP to encode the prefix
+            kv_size = config.num_layers * config.kv_channels * config.multi_query_group_num * 2
+            self.embedding = torch.nn.Embedding(config.pre_seq_len, kv_size)
             self.trans = torch.nn.Sequential(
+                torch.nn.Linear(kv_size, config.hidden_size),
                 torch.nn.Tanh(),
+                torch.nn.Linear(config.hidden_size, kv_size)
             )
         else:
             self.embedding = torch.nn.Embedding(config.pre_seq_len,