Passing device type in torch GradScaler (#345)

quic-swatia · shubhagr-quic · commit 1a1f6cdfe2ce · 2025-04-21T10:56:26.000+05:30
Pass the device type to torch's GradScaler() for both CUDA and CPU, so
that the scaler picks up the correct device when training runs on CPU.

Signed-off-by: Swati Allabadi <quic_sallabad@quicinc.com>
Co-authored-by: Swati Allabadi <quic_sallabad@quicinc.com>
diff --git a/QEfficient/finetune/utils/train_utils.py b/QEfficient/finetune/utils/train_utils.py
@@ -83,6 +83,7 @@ def train(
     best_val_loss = float("inf")
     total_train_steps = 0
     max_steps_reached = False  # Flag to indicate max training steps reached
+    device_type = device.split(":")[0]
 
     tensorboard_updates = None
     if train_config.enable_ddp:
@@ -95,7 +96,7 @@ def train(
         if device.startswith("qaic"):
             scaler = QAicGradScaler()
         else:
-            scaler = GradScaler()
+            scaler = GradScaler(device_type)
 
     loss_0_counter = torch.tensor([0]).to(device)