Lightning-AI · mpeex · Dec 8, 2025 · Dec 8, 2025 · Jan 8, 2026 · deependujha
@@ -464,10 +464,12 @@ def __getitem__(self, index: ChunkedIndex | int | slice) -> Any:
             if isinstance(self.transform, list):
                 for transform_fn in self.transform:
                     item = transform_fn(item)
+                    if item is None:
+                        break
             else:
                 item = self.transform(item)
 
-        return item
+        return item if item else self.__next__()
 
     def __next__(self) -> Any:
         # check if we have reached the end of the dataset (i.e., all the chunks have been processed)

@@ -591,11 +591,13 @@ def download_file(self, remote_filepath: str, local_filepath: str) -> None:
             FileLock(local_filepath + ".lock", timeout=0),
             tempfile.TemporaryDirectory() as tmpdir,
         ):
-            _, _, _, repo_org, repo_name, path = remote_filepath.split("/", 5)
-            repo_id = f"{repo_org}/{repo_name}"
+            _, _, _, repo_org, repo_name_revision, path = remote_filepath.split("/", 5)
+            splits = repo_name_revision.split("@", 2)
+            repo_id = f"{repo_org}/{splits[0]}"
             downloaded_path = hf_hub_download(
                 repo_id,
                 path,
+                revision=splits[1] if len(splits) == 2 else None,
                 cache_dir=tmpdir,
                 repo_type="dataset",
                 **self._storage_options,