10 changes: 10 additions & 0 deletions src/litdata/utilities/dataset_utilities.py
@@ -312,6 +312,16 @@ def load_index_file(input_dir: str) -> dict[str, Any]:
        return data
    except FileNotFoundError:
        raise FileNotFoundError(f"Index file not found at {index_filepath}.")
    except json.decoder.JSONDecodeError:
        with open(index_filepath) as f:
            raw_data = f.read()
        raw_data += "}"  # close the JSON content; it has been truncated by a character
        data = json.loads(raw_data)  # load JSON from the repaired string
        if "chunks" not in data and "shards" in data:
            # load mds shard-based index file and adapt to chunks format
            return adapt_mds_shards_to_chunks(data)

        return data
Comment on lines +315 to +324
Collaborator
Nice catch @robTheBuildr 🙌

This feels like a reasonable hotfix if the issue really is just a missing closing brace. That said, I'm not sure we can be certain the file is only ever truncated by a single character. My assumption is that this happens when the index dump step is interrupted or corrupted mid-write; please correct me if I'm off here.
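To illustrate the concern with a couple of hypothetical payloads (not taken from a real index file), appending a brace only helps when exactly the final "}" was lost:

import json

lost_one_char = '{"chunks": [], "config": {}'          # lost exactly the final "}"
lost_several  = '{"chunks": [], "config": {"chunk_by'  # lost more than one character

json.loads(lost_one_char + "}")  # parses fine after the single-brace repair
try:
    json.loads(lost_several + "}")  # still invalid JSON, the repair cannot help here
except json.decoder.JSONDecodeError:
    print("repair failed, file is more than one character short")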

Since the index files themselves aren't compressed (only the chunks are), I assume this could affect runs both with and without compression enabled.

Given that index writing is done in a sequential step and in a single process, I’m a bit unsure about the exact root cause.

merge_cache._merge_no_wait(node_rank if num_nodes > 1 else None, getattr(self, "existing_index", None))
self._upload_index(output_dir, cache_dir, num_nodes, node_rank)

if node_rank is None:
    with open(os.path.join(self._cache_dir, _INDEX_FILENAME), "w") as f:
        data = {"chunks": chunks_info, "config": config, "updated_at": str(time())}
        json.dump(data, f, sort_keys=True)
else:
    with open(os.path.join(self._cache_dir, f"{node_rank}-{_INDEX_FILENAME}"), "w") as f:
        json.dump({"chunks": chunks_info, "config": config}, f, sort_keys=True)

Do you think we should consider making the index writing atomic (e.g. write to a temp file and then rename) to avoid partial writes altogether?
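For context, something along these lines is what I have in mind by atomic (a minimal sketch only, assuming the same self._cache_dir / _INDEX_FILENAME layout; the helper name is made up):

import json
import os
import tempfile


def _write_index_atomically(cache_dir: str, filename: str, data: dict) -> None:
    # Write the index to a temp file in the same directory, then atomically
    # swap it into place, so readers never observe a partially written index.json.
    fd, tmp_path = tempfile.mkstemp(dir=cache_dir, suffix=".json.tmp")
    try:
        with os.fdopen(fd, "w") as f:
            json.dump(data, f, sort_keys=True)
            f.flush()
            os.fsync(f.fileno())
        os.replace(tmp_path, os.path.join(cache_dir, filename))
    except BaseException:
        os.remove(tmp_path)
        raise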

Happy to hear your thoughts here.

cc: @tchaton

Collaborator
I would tend to agree with @bhimrazy. It would be great to understand how this can happen; I have never seen it before. I wonder if this could be related to the new folder type.

Collaborator Author

Yes, I agree too. If we look at the code preceding this error:

    # Check if `index.json` file exists in cache path
    if not os.path.exists(cache_index_filepath) and isinstance(input_dir.url, str):
        assert input_dir.url is not None
        if index_path is not None:
            copy_index_to_cache_index_filepath(index_path, cache_index_filepath)
        else:
            # Merge data_connection_id from resolved directory into storage_options for R2 connections
            merged_storage_options = storage_options.copy() if storage_options is not None else {}
            if hasattr(input_dir, "data_connection_id") and input_dir.data_connection_id:
                merged_storage_options["data_connection_id"] = input_dir.data_connection_id

            downloader = get_downloader(input_dir.url, input_dir.path, [], merged_storage_options, session_options)
            downloader.download_file(os.path.join(input_dir.url, _INDEX_FILENAME), cache_index_filepath)

This file is either copied from elsewhere in the filesystem or downloaded from a URL.
I have tried re-downloading it on error, and that has not resolved the issue.

That being said, it is indicative of a partial write, so I will also try the fix suggested by @bhimrazy as an alternative.
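Concretely, I'm thinking of keeping the repair but only trusting it when the result actually parses, so anything worse than a single missing brace still surfaces as an error (a sketch only; the helper name is made up):

import json


def _load_possibly_truncated_index(index_filepath: str) -> dict:
    # Assumption: the only corruption we attempt to repair is a missing final "}".
    # Any other corruption still raises a JSONDecodeError for the caller.
    with open(index_filepath) as f:
        raw_data = f.read()
    try:
        return json.loads(raw_data)
    except json.decoder.JSONDecodeError:
        return json.loads(raw_data + "}")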



def adapt_mds_shards_to_chunks(data: dict[str, Any]) -> dict[str, Any]: