Rely on type promotion for LoRA merge (#1248)
carmocca authored Apr 9, 2024
1 parent 2b37b6b commit dc1945c
Showing 1 changed file with 2 additions and 8 deletions.
10 changes: 2 additions & 8 deletions litgpt/lora.py
@@ -156,16 +156,10 @@ def merge(self) -> None:
             # assign updated weights and quantize by moving to CUDA device
             self.linear.weight = bnb.nn.Params4bit(weight_data, requires_grad=False, **weight.__dict__)
             self.linear.weight.cuda(weight.device)
-        # if the pretrained weights and LoRA weights are of compatible dtypes - simply sum them
-        elif torch.finfo(pretrained_dtype).max >= torch.finfo(lora_data.dtype).max:
+        else:
             # self.linear might be on CPU and lora_data on CUDA
             # the inplace add will preserve the dtype of linear.weight
             self.linear.weight.data += lora_data.to(device=self.linear.weight.data.device)
-        else:
-            raise NotImplementedError(
-                f"Cannot merge the pretrained weights of type {pretrained_dtype}"
-                f" and LoRA weights of type {lora_data.dtype}"
-            )
 
         self.merged = True
 
     def forward(self, x: torch.Tensor) -> torch.Tensor:

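The removed elif/else branches guarded against merging floating-point weights of "incompatible" dtypes; the simplification relies instead on PyTorch's type-promotion rules for in-place operations: the result of an in-place add is cast back to the dtype (and kept on the device) of the tensor being modified, so a float32 LoRA update merges into a lower-precision pretrained weight without an explicit dtype check. A minimal standalone sketch of that behavior (the tensor names below are illustrative stand-ins, not code from litgpt):

import torch

# Pretrained weight in a low-precision dtype (stands in for self.linear.weight.data).
weight = torch.zeros(4, 4, dtype=torch.bfloat16)

# Merged LoRA update in float32 (stands in for lora_data).
lora_data = torch.randn(4, 4, dtype=torch.float32)

# The in-place add casts the float32 update down to weight's dtype
# rather than promoting weight to float32.
weight += lora_data.to(device=weight.device)

print(weight.dtype)  # torch.bfloat16
print(torch.can_cast(torch.float32, torch.bfloat16))  # True: the in-place downcast is allowed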