NVIDIA-NeMo · suiyoubi · Aug 20, 2025 · Jul 9, 2025 · Jul 9, 2025 · Jul 10, 2025
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
@@ -41,7 +41,7 @@ jobs:
         run: |
           pip install -U pip
           cd ray-curator
-          pip install --no-cache-dir ".[dev,text]"
+          pip install --no-cache-dir ".[dev,text,video]"
           pip install --no-cache-dir pytest-asyncio coverage
 
       - name: Run tests

diff --git a/ray-curator/pyproject.toml b/ray-curator/pyproject.toml
@@ -24,6 +24,7 @@ dependencies = [
     "loguru",
     "mecab-python3",
     "pyarrow",
+    "pynvml==11.5.3",
     "ray[default,data]",
     "torch",
     "transformers>=4.48.0",
@@ -58,6 +59,17 @@ dev = [
     "pytest-loguru",
     "ruff==0.11.4",
 ]
+video = [  # extra installed by the CI test workflow via `pip install ".[dev,text,video]"`
+    "av==13.1.0",
+    "opencv-python",
+    "torchvision",
+    "einops",
+]
+video_cuda = [  # separate from `video`; NOTE(review): presumably needs a CUDA 12 GPU environment - confirm
+    "PyNvVideoCodec==1.0.2",
+    "cvcuda_cu12",
+    "pycuda",
+]
 
 [tool.setuptools]
 packages = ["ray_curator"]

diff --git a/ray-curator/ray_curator/examples/video/video_read_example.py b/ray-curator/ray_curator/examples/video/video_read_example.py
@@ -0,0 +1,51 @@
+import argparse
+
+from ray_curator.backends.xenna import XennaExecutor
+from ray_curator.pipeline import Pipeline
+from ray_curator.stages.video.io.video_reader_download import VideoReaderDownloadStage
+
+
+def create_video_reading_pipeline(args: argparse.Namespace) -> Pipeline:
+    """Build the "video_reading" pipeline with one VideoReaderDownloadStage configured from ``args``."""
+    # Define pipeline
+    pipeline = Pipeline(name="video_reading", description="Read videos from a folder and extract metadata on video level.")
+
+    # Add stages
+    # Add the composite stage that combines reading and downloading;
+    # it reads args.video_folder, args.video_limit and args.verbose.
+    pipeline.add_stage(VideoReaderDownloadStage(
+        input_video_path=args.video_folder,
+        video_limit=args.video_limit,
+        verbose=args.verbose
+    ))
+    # TODO: Add Writer stage in the following PR
+
+    return pipeline
+
+
+def main(args: argparse.Namespace) -> None:
+    """Build the video-reading pipeline, print its description, and run it with a XennaExecutor."""
+    pipeline = create_video_reading_pipeline(args)
+
+    # Print pipeline description
+    print(pipeline.describe())
+    print("\n" + "=" * 50 + "\n")
+
+    # Create executor
+    executor = XennaExecutor()
+
+    # Execute pipeline
+    print("Starting pipeline execution...")
+    pipeline.run(executor)
+
+    # Report completion only; the value returned by pipeline.run() is not captured or printed here
+    print("\nPipeline completed!")
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    # CLI arguments; --video-limit defaults to -1 (NOTE(review): presumably means "no limit" - confirm in the stage)
+    parser.add_argument("--video-folder", type=str, required=True, help="Path to the video folder")
+    parser.add_argument("--video-limit", type=int, default=-1, help="Limit the number of videos to read")
+    parser.add_argument("--verbose", action="store_true", default=False, help="Verbose output")
+    args = parser.parse_args()
+    main(args)