Skip to content

Commit 98b8ec2

Browse files
Merge pull request #37 from ModelTC/ttt
remove redundant code
2 parents a657809 + 6fb8773 commit 98b8ec2

File tree

1 file changed

+1
-10
lines changed

1 file changed

+1
-10
lines changed

llmc/compression/quantization/quarot.py

Lines changed: 1 addition & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -92,15 +92,6 @@ def block_transform(self, block):
92 92
logger.info(f'block:{block}')
93 93
logger.info(f'End transform the {self.block_idx+1}-th block')
94 94

95-
def bake_mean_into_linear(self, linear):
96-
linear_dtype = linear.weight.dtype
97-
W_ = linear.weight.data.double()
98-
linear.weight.data = W_ - W_.mean(dim=-2, keepdim=True)
99-
linear.weight.data = linear.weight.data.to(linear_dtype)
100-
if linear.bias is not None:
101-
b_ = linear.bias.data.double()
102-
linear.bias.data = b_ - b_.mean()
103-
linear.bias.data = linear.bias.data.to(linear_dtype)
104 95

105 96
@torch.no_grad()
106 97
def subset_transform(self, block, subset):
@@ -117,7 +108,7 @@ def subset_transform(self, block, subset):
117 108
self.rotate_pre_layers(layers, self.Q)
118 109
else:
119 110
if self.config['model']['type'] in ['Opt', 'StableLm']:
120-
self.bake_mean_into_linear(layers[0])
111+
self.bake_mean_into_fc(layers[0])
121 112

122 113
if 'is_mlp' in subset and subset['is_mlp']:
123 114
self.rotate_post_layers(

0 commit comments

Comments (0)