guanwenyu1995 committed on
Commit
27f0f34
·
verified ·
1 Parent(s): cadc794

Update modeling_minicpm.py: hardcode bias=False in MLP LinearQuantizer

Browse files
Files changed (1) hide show
  1. modeling_minicpm.py +3 -3
modeling_minicpm.py CHANGED
@@ -863,9 +863,9 @@ class MiniCPMMLP(nn.Module):
863
  self.config = config
864
  self.hidden_size = config.hidden_size
865
  self.intermediate_size = config.intermediate_size
866
- self.gate_proj = LinearQuantizer(self.hidden_size, self.intermediate_size, bias=config.mlp_bias, quant_type="ternary", bit=4, group_size=-1)
867
- self.up_proj = LinearQuantizer(self.hidden_size, self.intermediate_size, bias=config.mlp_bias, quant_type="ternary", bit=4, group_size=-1)
868
- self.down_proj = LinearQuantizer(self.intermediate_size, self.hidden_size, bias=config.mlp_bias, quant_type="ternary", bit=4, group_size=-1)
869
  # self.gate_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=False)
870
  # self.up_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=False)
871
  # self.down_proj = nn.Linear(self.intermediate_size, self.hidden_size, bias=False)
 
863
  self.config = config
864
  self.hidden_size = config.hidden_size
865
  self.intermediate_size = config.intermediate_size
866
+ self.gate_proj = LinearQuantizer(self.hidden_size, self.intermediate_size, bias=False, quant_type="ternary", bit=4, group_size=-1)
867
+ self.up_proj = LinearQuantizer(self.hidden_size, self.intermediate_size, bias=False, quant_type="ternary", bit=4, group_size=-1)
868
+ self.down_proj = LinearQuantizer(self.intermediate_size, self.hidden_size, bias=False, quant_type="ternary", bit=4, group_size=-1)
869
  # self.gate_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=False)
870
  # self.up_proj = nn.Linear(self.hidden_size, self.intermediate_size, bias=False)
871
  # self.down_proj = nn.Linear(self.intermediate_size, self.hidden_size, bias=False)