|
25 | 25 | from auto_editor.vanparse import ArgumentParser
|
26 | 26 |
|
27 | 27 | if TYPE_CHECKING:
|
| 28 | + from collections.abc import Iterator |
28 | 29 | from fractions import Fraction
|
29 | 30 |
|
30 | 31 | from numpy.typing import NDArray
|
@@ -79,6 +80,68 @@ def print_arr(arr: NDArray) -> None:
|
79 | 80 | print("")
|
80 | 81 |
|
81 | 82 |
|
| 83 | +def print_arr_gen(arr: Iterator[int | float | bool]) -> None: |
| 84 | + print("") |
| 85 | + print("@start") |
| 86 | + for a in arr: |
| 87 | + if isinstance(a, float): |
| 88 | + print(f"{a:.20f}") |
| 89 | + if isinstance(a, bool): |
| 90 | + print("1" if a else "0") |
| 91 | + if isinstance(a, int): |
| 92 | + print(a) |
| 93 | + print("") |
| 94 | + |
| 95 | + |
def iter_motion(src, tb, stream: int, blur: int, width: int) -> Iterator[float]:
    """Yield a per-timebase-unit motion level for a video stream.

    Each yielded value is the fraction of pixels that changed between two
    consecutive decoded frames, computed on a downscaled, grayscale,
    Gaussian-blurred copy of the frame.

    :param src: source container wrapper; ``src.path`` is the media path and
        ``src.videos`` holds per-stream metadata with ``width``/``height``.
    :param tb: output timebase (values are repeated to fill each tick).
    :param stream: index of the video stream to analyze.
    :param blur: sigma for the ``gblur`` filter.
    :param width: target width for the ``scale`` filter (height keeps aspect).
    """
    import av

    container = av.open(f"{src.path}", "r")

    # Ensure the container is released even if decoding raises or the
    # consumer abandons this generator early (GeneratorExit also passes
    # through the finally block).
    try:
        video = container.streams.video[stream]
        video.thread_type = "AUTO"

        prev_frame = None
        current_frame = None
        # NOTE(review): pixel count comes from videos[0] even though `stream`
        # selects the decoded stream — confirm streams always share dimensions.
        total_pixels = src.videos[0].width * src.videos[0].height
        index = 0
        prev_index = 0

        # scale -> grayscale -> blur pipeline; blurring suppresses noise so
        # count_nonzero reflects real motion rather than sensor grain.
        graph = av.filter.Graph()
        graph.link_nodes(
            graph.add_buffer(template=video),
            graph.add("scale", f"{width}:-1"),
            graph.add("format", "gray"),
            graph.add("gblur", f"sigma={blur}"),
            graph.add("buffersink"),
        ).configure()

        for unframe in container.decode(video):
            if unframe.pts is None:
                continue

            graph.push(unframe)
            frame = graph.pull()
            assert frame.time is not None
            index = round(frame.time * tb)

            current_frame = frame.to_ndarray()
            if prev_frame is None:
                value = 0.0
            else:
                # Use `int16` to avoid underflow with `uint8` datatype
                diff = np.abs(prev_frame.astype(np.int16) - current_frame.astype(np.int16))
                value = np.count_nonzero(diff) / total_pixels

            # Repeat the value so output stays aligned with the timebase even
            # when decoded frames skip ticks.
            for _ in range(index - prev_index):
                yield value

            prev_frame = current_frame
            prev_index = index
    finally:
        container.close()
| 144 | + |
82 | 145 | def main(sys_args: list[str] = sys.argv[1:]) -> None:
|
83 | 146 | parser = levels_options(ArgumentParser("levels"))
|
84 | 147 | args = parser.parse_args(LevelArgs, sys_args)
|
@@ -136,7 +199,7 @@ def main(sys_args: list[str] = sys.argv[1:]) -> None:
|
136 | 199 | if method == "audio":
|
137 | 200 | print_arr(levels.audio(**obj))
|
138 | 201 | elif method == "motion":
|
139 |
| - print_arr(levels.motion(**obj)) |
| 202 | + print_arr_gen(iter_motion(src, tb, **obj)) |
140 | 203 | elif method == "subtitle":
|
141 | 204 | print_arr(levels.subtitle(**obj))
|
142 | 205 | elif method == "none":
|
|
0 commit comments