fix: set fp32 when using cpu bc bf16 is slow (#44)
Commit: 6787a0f57730d94a2dda30bf54ab96382ce09536
configuration_xlm_roberta.py
CHANGED
@@ -126,3 +126,5 @@ class XLMRobertaFlashConfig(PretrainedConfig):
             self.torch_dtype = getattr(torch, torch_dtype)
         else:
             self.torch_dtype = torch_dtype
+        if not self.use_flash_attn or not torch.cuda.is_available():
+            self.torch_dtype = torch.float32
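
For context, a minimal sketch of the intended effect. The class and attribute names come from the diff; the constructor keyword arguments below are assumed for illustration, not confirmed by this commit:

import torch
from configuration_xlm_roberta import XLMRobertaFlashConfig

# bf16 matmuls are slow on CPU, so the config now falls back to fp32
# whenever flash attention is disabled or no CUDA device is available.
config = XLMRobertaFlashConfig(use_flash_attn=False, torch_dtype="bfloat16")
assert config.torch_dtype == torch.float32  # overridden by the new check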