From a243ab18cac5d39432c604f50f5ca8334da06d88 Mon Sep 17 00:00:00 2001
From: Scott Schneider <scott.a.s@gmail.com>
Date: Thu, 3 Apr 2025 06:33:03 -0700
Subject: [PATCH 1/2] Enable public decoder creation with file like object

---
 src/torchcodec/_core/ops.py               |  2 +-
 src/torchcodec/decoders/_audio_decoder.py |  8 +++--
 src/torchcodec/decoders/_decoder_utils.py | 19 +++++++++--
 src/torchcodec/decoders/_video_decoder.py |  8 +++--
 test/test_decoders.py                     | 41 +++++++++++++++++++++--
 5 files changed, 68 insertions(+), 10 deletions(-)

diff --git a/src/torchcodec/_core/ops.py b/src/torchcodec/_core/ops.py
index 0f0bdfe2..d9a17e68 100644
--- a/src/torchcodec/_core/ops.py
+++ b/src/torchcodec/_core/ops.py
@@ -141,7 +141,7 @@ def create_from_bytes(
 
 
 def create_from_file_like(
-    file_like: Union[io.RawIOBase, io.BytesIO], seek_mode: Optional[str] = None
+    file_like: Union[io.RawIOBase, io.BufferedReader], seek_mode: Optional[str] = None
 ) -> torch.Tensor:
     assert _pybind_ops is not None
     return _convert_to_tensor(_pybind_ops.create_from_file_like(file_like, seek_mode))
diff --git a/src/torchcodec/decoders/_audio_decoder.py b/src/torchcodec/decoders/_audio_decoder.py
index 002743ff..f9731429 100644
--- a/src/torchcodec/decoders/_audio_decoder.py
+++ b/src/torchcodec/decoders/_audio_decoder.py
@@ -4,6 +4,7 @@
 # This source code is licensed under the BSD-style license found in the
 # LICENSE file in the root directory of this source tree.
 
+import io
 from pathlib import Path
 from typing import Optional, Union
 
@@ -25,10 +26,13 @@ class AudioDecoder:
     Returned samples are float samples normalized in [-1, 1]
 
     Args:
-        source (str, ``Pathlib.path``, ``torch.Tensor``, or bytes): The source of the audio:
+        source (str, ``Pathlib.path``,
+                ``io.RawIOBase``, ``io.BufferedReader``,
+                bytes, or ``torch.Tensor``): The source of the audio:
 
             - If ``str``: a local path or a URL to a video or audio file.
             - If ``Pathlib.path``: a path to a local video or audio file.
+            - If ``io.RawIOBase`` or ``io.BufferedReader``: a file-like object that refers to a audio file.
             - If ``bytes`` object or ``torch.Tensor``: the raw encoded audio data.
         stream_index (int, optional): Specifies which stream in the file to decode samples from.
             Note that this index is absolute across all media types. If left unspecified, then
@@ -45,7 +49,7 @@ class AudioDecoder:
 
     def __init__(
         self,
-        source: Union[str, Path, bytes, Tensor],
+        source: Union[str, Path, io.RawIOBase, io.BufferedReader, bytes, Tensor],
         *,
         stream_index: Optional[int] = None,
         sample_rate: Optional[int] = None,
diff --git a/src/torchcodec/decoders/_decoder_utils.py b/src/torchcodec/decoders/_decoder_utils.py
index c5534711..53eba66c 100644
--- a/src/torchcodec/decoders/_decoder_utils.py
+++ b/src/torchcodec/decoders/_decoder_utils.py
@@ -4,6 +4,7 @@
 # This source code is licensed under the BSD-style license found in the
 # LICENSE file in the root directory of this source tree.
 
+import io
 from pathlib import Path
 
 from typing import Union
@@ -18,18 +19,32 @@
 
 
 def create_decoder(
-    *, source: Union[str, Path, bytes, Tensor], seek_mode: str
+    *,
+    source: Union[str, Path, io.RawIOBase, io.BufferedReader, bytes, Tensor],
+    seek_mode: str,
 ) -> Tensor:
     if isinstance(source, str):
         return core.create_from_file(source, seek_mode)
     elif isinstance(source, Path):
         return core.create_from_file(str(source), seek_mode)
+    elif isinstance(source, io.RawIOBase) or isinstance(source, io.BufferedReader):
+        return core.create_from_file_like(source, seek_mode)
     elif isinstance(source, bytes):
         return core.create_from_bytes(source, seek_mode)
     elif isinstance(source, Tensor):
         return core.create_from_tensor(source, seek_mode)
+    elif isinstance(source, io.TextIOBase):
+        raise TypeError(
+            "source is of type io.TextIOBase; did you forget to specify binary reading?"
+        )
+    elif hasattr(source, "read") and hasattr(source, "seek"):
+        # This check must be after checking for text-based reading. Also placing
+        # it last in general to be defensive: hasattr is a blunt instrument. We
+        # could use the inspect module to check for methods with the right
+        # signature.
+        return core.create_from_file_like(source, seek_mode)
 
     raise TypeError(
         f"Unknown source type: {type(source)}. "
-        "Supported types are str, Path, bytes and Tensor."
+        "Supported types are str, Path, io.RawIOBase, io.BufferedReader, bytes and Tensor."
     )
diff --git a/src/torchcodec/decoders/_video_decoder.py b/src/torchcodec/decoders/_video_decoder.py
index 8a894925..5bbbc41b 100644
--- a/src/torchcodec/decoders/_video_decoder.py
+++ b/src/torchcodec/decoders/_video_decoder.py
@@ -4,6 +4,7 @@
 # This source code is licensed under the BSD-style license found in the
 # LICENSE file in the root directory of this source tree.
 
+import io
 import numbers
 from pathlib import Path
 from typing import Literal, Optional, Tuple, Union
@@ -21,10 +22,13 @@ class VideoDecoder:
     """A single-stream video decoder.
 
     Args:
-        source (str, ``Pathlib.path``, ``torch.Tensor``, or bytes): The source of the video.
+        source (str, ``Pathlib.path``,
+                ``io.RawIOBase``, ``io.BufferedReader``,
+                bytes, or ``torch.Tensor``): The source of the video:
 
             - If ``str``: a local path or a URL to a video file.
             - If ``Pathlib.path``: a path to a local video file.
+            - If ``io.RawIOBase`` or ``io.BufferedReader``: a file-like object that refers to a video file.
             - If ``bytes`` object or ``torch.Tensor``: the raw encoded video data.
         stream_index (int, optional): Specifies which stream in the video to decode frames from.
             Note that this index is absolute across all media types. If left unspecified, then
@@ -66,7 +70,7 @@ class VideoDecoder:
 
     def __init__(
         self,
-        source: Union[str, Path, bytes, Tensor],
+        source: Union[str, Path, io.RawIOBase, io.BufferedReader, bytes, Tensor],
         *,
         stream_index: Optional[int] = None,
         dimension_order: Literal["NCHW", "NHWC"] = "NCHW",
diff --git a/test/test_decoders.py b/test/test_decoders.py
index e11981e9..c68e1ace 100644
--- a/test/test_decoders.py
+++ b/test/test_decoders.py
@@ -45,18 +45,48 @@ class TestDecoder:
             (AudioDecoder, NASA_AUDIO_MP3),
         ),
     )
-    @pytest.mark.parametrize("source_kind", ("str", "path", "tensor", "bytes"))
+    @pytest.mark.parametrize(
+        "source_kind",
+        (
+            "str",
+            "path",
+            "file_like_rawio",
+            "file_like_bufferedio",
+            "file_like_custom",
+            "bytes",
+            "tensor",
+        ),
+    )
     def test_create(self, Decoder, asset, source_kind):
         if source_kind == "str":
             source = str(asset.path)
         elif source_kind == "path":
             source = asset.path
-        elif source_kind == "tensor":
-            source = asset.to_tensor()
+        elif source_kind == "file_like_rawio":
+            source = open(asset.path, mode="rb", buffering=0)
+        elif source_kind == "file_like_bufferedio":
+            source = open(asset.path, mode="rb", buffering=4096)
+        elif source_kind == "file_like_custom":
+            # This class purposefully does not inherit from io.RawIOBase or
+            # io.BufferedReader. We are testing the case when users pass an
+            # object that has the right methods but is an arbitrary type.
+            class CustomReader:
+                def __init__(self, file):
+                    self._file = file
+
+                def read(self, size: int) -> bytes:
+                    return self._file.read(size)
+
+                def seek(self, offset: int, whence: int) -> bytes:
+                    return self._file.seek(offset, whence)
+
+            source = CustomReader(open(asset.path, mode="rb", buffering=0))
         elif source_kind == "bytes":
             path = str(asset.path)
             with open(path, "rb") as f:
                 source = f.read()
+        elif source_kind == "tensor":
+            source = asset.to_tensor()
         else:
             raise ValueError("Oops, double check the parametrization of this test!")
 
@@ -76,6 +106,11 @@ def test_create_fails(self, Decoder):
         with pytest.raises(ValueError, match="No valid stream found"):
             Decoder(NASA_VIDEO.path, stream_index=2)
 
+        # The user mistakenly forgets to request binary mode when creating a
+        # file-like object with open().
+        with pytest.raises(TypeError, match="binary reading?"):
+            Decoder(open(NASA_VIDEO.path, "r"))
+
 
 class TestVideoDecoder:
     @pytest.mark.parametrize("seek_mode", ("exact", "approximate"))

From 8fbeaface7e48c1289f0b54da17c6411d4c10de4 Mon Sep 17 00:00:00 2001
From: Scott Schneider <scott.a.s@gmail.com>
Date: Thu, 3 Apr 2025 08:52:44 -0700
Subject: [PATCH 2/2] Say file-like instead of io types

---
 src/torchcodec/decoders/_audio_decoder.py | 8 ++++----
 src/torchcodec/decoders/_decoder_utils.py | 6 ++++--
 src/torchcodec/decoders/_video_decoder.py | 8 ++++----
 3 files changed, 12 insertions(+), 10 deletions(-)

diff --git a/src/torchcodec/decoders/_audio_decoder.py b/src/torchcodec/decoders/_audio_decoder.py
index f9731429..4b73e94c 100644
--- a/src/torchcodec/decoders/_audio_decoder.py
+++ b/src/torchcodec/decoders/_audio_decoder.py
@@ -26,14 +26,14 @@ class AudioDecoder:
     Returned samples are float samples normalized in [-1, 1]
 
     Args:
-        source (str, ``Pathlib.path``,
-                ``io.RawIOBase``, ``io.BufferedReader``,
-                bytes, or ``torch.Tensor``): The source of the audio:
+        source (str, ``Pathlib.path``, bytes, ``torch.Tensor`` or file-like object): The source of the audio:
 
             - If ``str``: a local path or a URL to a video or audio file.
             - If ``Pathlib.path``: a path to a local video or audio file.
-            - If ``io.RawIOBase`` or ``io.BufferedReader``: a file-like object that refers to a audio file.
             - If ``bytes`` object or ``torch.Tensor``: the raw encoded audio data.
+            - If file-like object: we read audio data from the object on demand. The object must
+              expose the methods ``read(self, size: int) -> bytes`` and
+              ``seek(self, offset: int, whence: int) -> int``. Read more in TODO_FILE_LIKE_TUTORIAL.
         stream_index (int, optional): Specifies which stream in the file to decode samples from.
             Note that this index is absolute across all media types. If left unspecified, then
             the :term:`best stream` is used.
diff --git a/src/torchcodec/decoders/_decoder_utils.py b/src/torchcodec/decoders/_decoder_utils.py
index 53eba66c..287cfb4e 100644
--- a/src/torchcodec/decoders/_decoder_utils.py
+++ b/src/torchcodec/decoders/_decoder_utils.py
@@ -35,7 +35,7 @@ def create_decoder(
         return core.create_from_tensor(source, seek_mode)
     elif isinstance(source, io.TextIOBase):
         raise TypeError(
-            "source is of type io.TextIOBase; did you forget to specify binary reading?"
+            "source is for reading text, likely from open(..., 'r'). Try with 'rb' for binary reading?"
         )
     elif hasattr(source, "read") and hasattr(source, "seek"):
         # This check must be after checking for text-based reading. Also placing
@@ -46,5 +46,7 @@ def create_decoder(
 
     raise TypeError(
         f"Unknown source type: {type(source)}. "
-        "Supported types are str, Path, io.RawIOBase, io.BufferedReader, bytes and Tensor."
+        "Supported types are str, Path, bytes, Tensor and file-like objects with "
+        "read(self, size: int) -> bytes and "
+        "seek(self, offset: int, whence: int) -> bytes methods."
     )
diff --git a/src/torchcodec/decoders/_video_decoder.py b/src/torchcodec/decoders/_video_decoder.py
index 5bbbc41b..884bf275 100644
--- a/src/torchcodec/decoders/_video_decoder.py
+++ b/src/torchcodec/decoders/_video_decoder.py
@@ -22,14 +22,14 @@ class VideoDecoder:
     """A single-stream video decoder.
 
     Args:
-        source (str, ``Pathlib.path``,
-                ``io.RawIOBase``, ``io.BufferedReader``,
-                bytes, or ``torch.Tensor``): The source of the video:
+        source (str, ``Pathlib.path``, bytes, ``torch.Tensor`` or file-like object): The source of the video:
 
             - If ``str``: a local path or a URL to a video file.
             - If ``Pathlib.path``: a path to a local video file.
-            - If ``io.RawIOBase`` or ``io.BufferedReader``: a file-like object that refers to a video file.
             - If ``bytes`` object or ``torch.Tensor``: the raw encoded video data.
+            - If file-like object: we read video data from the object on demand. The object must
+              expose the methods ``read(self, size: int) -> bytes`` and
+              ``seek(self, offset: int, whence: int) -> int``. Read more in TODO_FILE_LIKE_TUTORIAL.
         stream_index (int, optional): Specifies which stream in the video to decode frames from.
             Note that this index is absolute across all media types. If left unspecified, then
             the :term:`best stream` is used.