init

danionella · Oct 5, 2024 · 6e8e91d · 6e8e91d
1 parent 79d30e2
commit 6e8e91d
Show file tree

Hide file tree

Showing 4 changed files with 142 additions and 21 deletions.
diff --git a/pyproject.toml b/pyproject.toml
@@ -25,7 +25,7 @@ classifiers = [
 ]
 requires-python = ">=3.9"
 dependencies = [
-    "numpy",
+    "numpy","av"
 ]
 
 [project.optional-dependencies]

diff --git a/src/napari_pyav/__init__.py b/src/napari_pyav/__init__.py
@@ -1,4 +1,4 @@
-__version__ = "0.0.1"
+__version__ = "0.0.2"
 
 from ._reader import napari_get_reader
 

diff --git a/src/napari_pyav/_reader.py b/src/napari_pyav/_reader.py
@@ -6,7 +6,7 @@
 https://napari.org/stable/plugins/guides.html?#readers
 """
 import numpy as np
-
+import av
 
 def napari_get_reader(path):
     """A basic implementation of a Reader contribution.
@@ -22,15 +22,12 @@ def napari_get_reader(path):
         If the path is a recognized format, return a function that accepts the
         same path or list of paths, and returns a list of layer data tuples.
     """
-    if isinstance(path, list):
-        # reader plugins may be handed single path, or a list of paths.
-        # if it is a list, it is assumed to be an image stack...
-        # so we are only going to look at the first file.
-        path = path[0]
+    # if isinstance(path, list):
+    #     raise ValueError("This reader only supports single file paths")
 
-    # if we know we cannot read the file, we immediately return None.
-    if not path.endswith(".npy"):
-        return None
+    # # if we know we cannot read the file, we immediately return None.
+    # if not path.endswith(".mp4"):
+    #     return None
 
     # otherwise we return the *function* that can read ``path``.
     return reader_function
@@ -58,15 +55,139 @@ def reader_function(path):
         layer. Both "meta", and "layer_type" are optional. napari will
         default to layer_type=="image" if not provided
     """
-    # handle both a string and a list of strings
     paths = [path] if isinstance(path, str) else path
-    # load all files into array
-    arrays = [np.load(_path) for _path in paths]
-    # stack arrays into single array
-    data = np.squeeze(np.stack(arrays))
+    out = [(FastVideoReader(path), {}, 'image') for path in paths]
+    return out
+
+
+class FastVideoReader:
+    ''' A class to read video files quickly, using the PyAV package. It allows for fast seeking and reading of frames.
+
+    Args:
+        filename (str): path to the video file
+        threading (bool): if True (default), the decoder thread type is set to 'AUTO'; if False, it is set to 'SLICE'.
+        read_format (str): format to read the video in. Default is 'gray'. Other options include 'rgb24', 'bgr24', 'yuv420p', etc.
+        pts_lookup (np.ndarray): lookup seek table for pts values. Default is None. It is currently only stored on the instance; the class does not yet generate or consult it.
+        thread_count (int): number of threads to use for decoding. Default is 0 (auto).
+    '''
+    def __init__(self, filename, threading=True, read_format='gray', pts_lookup=None, thread_count=0):
+        ''' Open the video and set up the frame-index -> pts conversion.
+
+        The meaning of the arguments is described in the class docstring.
+        '''
+        self.container = av.open(filename)
+        # Only the first video stream of the container is used.
+        self.stream = self.container.streams.video[0]
+        self.stream.codec_context.thread_count = thread_count
+        self.stream.codec_context.thread_type = 'AUTO' if threading else 'SLICE' # FRAME/AUTO/SLICE
+        self.framegenerator = self.container.decode(video=0)
+        self.read_format = read_format
+        # Stored only; nothing else in this class reads it.
+        self._pts_lookup = pts_lookup
+        # pts ticks between consecutive frames, derived from the guessed frame rate
+        # (presumably assumes a constant frame rate -- TODO confirm).
+        self._pts_per_frame = 1 / (self.stream.guessed_rate * self.stream.time_base)
+        # pts of the first decoded frame; this consumes one frame from the generator,
+        # which is why rewind() is called at the end.
+        self._init_pts = int(next(self.framegenerator).pts)
+        # Expected pts of frame n, offset by the pts of the first frame.
+        self._frame_to_pts = lambda n: round(n * self._pts_per_frame) + self._init_pts
+        # Restart decoding from the beginning; rewind() also initialises self.last_pts.
+        self.rewind()
+
+    def read(self):
+        ''' Decode the next frame and return it as an array in ``self.read_format``.
+
+        The pts of the decoded frame is remembered in ``self.last_pts``. Whatever
+        ``next()`` raises on the frame generator (StopIteration once it is
+        exhausted) propagates to the caller.
+        '''
+        decoded = next(self.framegenerator)
+        self.last_pts = decoded.pts
+        return decoded.to_ndarray(format=self.read_format)
+
+    def rewind(self):
+        ''' Seek the container back to position 0 and restart decoding.
+
+        A fresh frame generator is created and ``self.last_pts`` is reset to None,
+        so the next ``read()`` returns the first frame again.
+        '''
+        source = self.container
+        source.seek(0)
+        self.framegenerator = source.decode(video=0)
+        self.last_pts = None
+
+    def read_frame(self, frame_idx):
+        ''' Read the specified frame index.
+
+        Args:
+            frame_idx (int): index of the frame to read
+
+        Returns:
+            The frame converted with ``to_ndarray(format=self.read_format)``.
+        '''
+        # Frame 0: restart decoding from the beginning of the container.
+        if frame_idx == 0:
+            self.rewind()
+            return self.read()
+        # Sequential access: the last frame returned was frame_idx-1, so the next
+        # decoded frame is the requested one and no seek is needed.
+        if self.last_pts is not None and self.last_pts == self._frame_to_pts(frame_idx-1):
+            return self.read()
+        # Random access: seek, then decode forward until the frame whose pts equals
+        # the expected pts of frame_idx shows up.
+        target_pts = self._frame_to_pts(frame_idx)
+        # NOTE(review): the seek offset is relative to the first frame's pts; with
+        # backward=True the decoder presumably lands at or before the target -- confirm.
+        self.container.seek(target_pts-self._init_pts, backward=True, stream=self.container.streams.video[0])
+        self.framegenerator = self.container.decode(video=0)
+        frame_obj = next(self.framegenerator)
+        while frame_obj.pts != target_pts:
+            # NOTE(review): requires an exact pts match; this check disappears under
+            # `python -O`, in which case the loop runs until the generator is exhausted.
+            assert frame_obj.pts <= target_pts, f'pts glitch: {frame_obj.pts} > {target_pts}'
+            frame_obj = next(self.framegenerator)
+        frame = frame_obj.to_ndarray(format=self.read_format)
+        self.last_pts = frame_obj.pts
+        return frame
+
+    def close(self):
+        ''' Close the underlying container opened in ``__init__``. '''
+        container = self.container
+        container.close()
+
+    def __del__(self):
+        ''' Best-effort cleanup when the reader is garbage collected. '''
+        # __init__ may have failed before ``self.container`` was assigned (for example
+        # when av.open raised); in that case there is nothing to close.
+        if getattr(self, 'container', None) is not None:
+            self.close()
+
+    def __getitem__(self, index):
+        ''' Array-style access to frames.
+
+        Args:
+            index: an integer (Python or NumPy) selects one frame; a tuple whose
+                first element is an integer selects that frame (the remaining
+                elements are ignored); a slice selects several frames.
+
+        Returns:
+            A single frame for integer/tuple indices, or ``np.array`` of the
+            selected frames for a slice.
+
+        Raises:
+            NotImplementedError: for any other kind of index.
+        '''
+        if isinstance(index, (int, np.integer)):  # single frame
+            return self.read_frame(index)
+        if isinstance(index, tuple) and index and isinstance(index[0], (int, np.integer)):
+            return self.read_frame(index[0])
+        if isinstance(index, slice):
+            total = self.nframes
+            if total > 0:
+                # Resolve open-ended and negative bounds against the frame count.
+                frame_ids = range(*index.indices(total))
+            else:
+                # Frame count not reported by the stream: use the bounds as given.
+                frame_ids = np.r_[index]
+            return np.array([self.read_frame(i) for i in frame_ids])
+        raise NotImplementedError(f"slicing of {type(index)} : {index} not implemented yet")
+
+    def __enter__(self):
+        ''' Enter a ``with`` block; the reader itself is the context value. '''
+        return self
+
+    def __exit__(self, exc_type, exc_value, traceback):
+        ''' Close the reader on leaving a ``with`` block.
+
+        Returns False, so an exception raised inside the block is not suppressed.
+        '''
+        self.close()
+        suppress_exception = False
+        return suppress_exception
+
+    def __iter__(self):
+        ''' Start iterating from the first frame; the reader is its own iterator. '''
+        self.rewind()
+        return self
+
+    def __next__(self):
+        ''' Return the next frame; at the end of the stream rewind and stop.
+
+        Only end-of-stream signals (StopIteration from the frame generator, or an
+        EOFError) end the iteration. Other errors, including KeyboardInterrupt,
+        propagate instead of being silently turned into StopIteration.
+        '''
+        try:
+            return self.read()
+        except (StopIteration, EOFError):
+            # Leave the reader positioned at the start so it can be iterated again.
+            self.rewind()
+            raise StopIteration from None
+
+    @property
+    def frame_shape(self):
+        ''' (height, width) reported by the codec context of the first video stream. '''
+        codec = self.container.streams.video[0].codec_context
+        return codec.height, codec.width
+
+    @property
+    def nframes(self):
+        ''' Frame count reported by the first video stream of the container. '''
+        first_video = self.container.streams.video[0]
+        return first_video.frames
+
+    @property
+    def dtype(self):
+        ''' Element type advertised for the frames; always ``np.uint8``, independent of ``read_format``. '''
+        return np.uint8
+
+    @property
+    def shape(self):
+        ''' Array-like shape of the whole video: ``(nframes, height, width)``. '''
+        count = self.nframes
+        return (count,) + tuple(self.frame_shape)
 
-    # optional kwargs for the corresponding viewer.add_* method
-    add_kwargs = {}
+    @property
+    def ndim(self):
+        ''' Number of dimensions, i.e. the length of ``self.shape``. '''
+        dims = self.shape
+        return len(dims)
 
-    layer_type = "image"  # optional, default is "image"
-    return [(data, add_kwargs, layer_type)]
+    @property
+    def size(self):
+        ''' Total number of elements, i.e. the product of the entries of ``self.shape``. '''
+        # np.product was deprecated in NumPy 1.25 and removed in NumPy 2.0; np.prod is the supported name.
+        return np.prod(self.shape)
+
+    @staticmethod
+    def static_shape(filename):
+        ''' Get the shape of a video without creating a reader instance.
+
+        Args:
+            filename (str): path to the video file
+
+        Returns:
+            np.ndarray holding (number of frames, height, width) of the first video stream.
+        '''
+        with av.open(filename) as container:
+            video = container.streams.video[0]
+            codec = video.codec_context
+            dims = [video.frames, codec.height, codec.width]
+            shape = np.array(dims)
+        return shape
diff --git a/src/napari_pyav/napari.yaml b/src/napari_pyav/napari.yaml
@@ -12,4 +12,4 @@ contributions:
   readers:
     - command: napari-pyav.get_reader
       accepts_directories: false
-      filename_patterns: ['*.npy']
+      filename_patterns: ['*.mp4']