feat(qmodule): avoid random weights initialization
dacorvo committed Aug 24, 2024
1 parent 04c8010 commit a1c310b
Showing 1 changed file with 7 additions and 1 deletion.
optimum/quanto/nn/qmodule.py
@@ -201,9 +201,15 @@ def from_module(
         activations: Optional[qtype] = None,
         optimizer: Optional[Optimizer] = None,
     ):
-        qmodule = cls.qcreate(module, weights, activations, optimizer)
+        # Create the quantized module on the meta device to prevent weights initialization
+        qmodule = cls.qcreate(module, weights, activations, optimizer, device="meta")
         if qmodule is None:
             return None
+        # Move the quantized module to the target device, but with empty weights
+        qmodule = qmodule.to_empty(device=module.weight.device)
+        # Set scales that were initialized to empty values
+        qmodule.input_scale = torch.ones_like(qmodule.input_scale)
+        qmodule.output_scale = torch.ones_like(qmodule.output_scale)
         with torch.no_grad():
             qmodule.weight.copy_(module.weight)
             if module.bias is not None:
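The change avoids paying for a random weight initialization that would immediately be overwritten: the quantized module is first created on PyTorch's meta device (no storage is allocated, so no initializer runs), then materialized with uninitialized storage via to_empty() and filled from the source module under no_grad(). Because to_empty() leaves tensors with arbitrary values, the input/output scales are explicitly reset to ones afterwards. Below is a minimal standalone sketch of the same pattern using only the public torch API; the nn.Linear modules are illustrative stand-ins, not optimum-quanto code.

    import torch
    import torch.nn as nn

    source = nn.Linear(4, 4)  # existing float module whose weights we want to keep

    # Constructing under the meta device allocates no storage, so the usual
    # random weight initialization is skipped entirely.
    with torch.device("meta"):
        target = nn.Linear(4, 4)

    # Materialize the meta module on the source module's device with empty
    # (uninitialized) tensors, then copy the real parameters in.
    target = target.to_empty(device=source.weight.device)
    with torch.no_grad():
        target.weight.copy_(source.weight)
        target.bias.copy_(source.bias)

    assert torch.equal(target.weight, source.weight)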
