pre-commit

wcrzlh · wcrzlh · commit ee27ea934d86 · 2025-11-04T20:37:32.000+08:00
diff --git a/mindone/transformers/masking_utils.py b/mindone/transformers/masking_utils.py
@@ -304,15 +304,15 @@ def sdpa_mask_recent_torch(
 
     # Similar to `kv_arange = mint.arange(start=kv_offset, end=kv_offset + kv_length, device=cache_position.device)`
     # but without data-dependent slicing (i.e. torch.compile friendly)
-    kv_arange = mint.arange(kv_length, device=cache_position.device)
+    kv_arange = mint.arange(kv_length)
     kv_arange += kv_offset
 
     # Potentially add the padding 2D mask
     if padding_mask is not None:
         mask_function = and_masks(mask_function, padding_mask_function(padding_mask))
 
-    batch_arange = mint.arange(batch_size, device=cache_position.device)
-    head_arange = mint.arange(1, device=cache_position.device)
+    batch_arange = mint.arange(batch_size)
+    head_arange = mint.arange(1)
     # This creates the 4D mask easily. Note that we need this context manager as vmap cannot handle slicing a tensor from
     # scalar tensor (it internally calls `.item()`, which vmap does not allow), but this context works around it.
     # We don't need to add an offset to the mask_function either, as we vmap directly the correct indices for k and kv indices
diff --git a/mindone/transformers/modeling_utils.py b/mindone/transformers/modeling_utils.py
@@ -2458,7 +2458,7 @@ def from_pretrained(
 
         if transformers_explicit_filename is not None:
             if not transformers_explicit_filename.endswith(
-                    ".safetensors"
+                ".safetensors"
             ) and not transformers_explicit_filename.endswith(".safetensors.index.json"):
                 raise ValueError(
                     "The transformers file in the config seems to be incorrect: it is neither a safetensors file "
@@ -2483,8 +2483,9 @@ def from_pretrained(
             if is_local:
                 if transformers_explicit_filename is not None:
                     # If the filename is explicitly defined, load this by default.
-                    archive_file = os.path.join(pretrained_model_name_or_path, subfolder,
-                                                transformers_explicit_filename)
+                    archive_file = os.path.join(
+                        pretrained_model_name_or_path, subfolder, transformers_explicit_filename
+                    )
                     is_sharded = transformers_explicit_filename.endswith(".safetensors.index.json")
                 elif from_tf and os.path.isfile(
                     os.path.join(pretrained_model_name_or_path, subfolder, TF_WEIGHTS_NAME + ".index")