From 2e1d7485a8fe57c2d1a6f2b7acd532083c0f99c8 Mon Sep 17 00:00:00 2001 From: Emil Ernerfeldt Date: Tue, 8 Oct 2024 21:40:35 +0200 Subject: [PATCH 01/33] Initial ffmpeg H.264 support in frames example --- Cargo.lock | 10 + Cargo.toml | 1 + crates/store/re_video/Cargo.toml | 10 +- crates/store/re_video/build.rs | 1 + crates/store/re_video/examples/frames.rs | 32 ++- crates/store/re_video/src/decode/ffmpeg.rs | 216 +++++++++++++++++++++ crates/store/re_video/src/decode/mod.rs | 5 +- crates/store/re_video/src/demux/mod.rs | 4 + 8 files changed, 273 insertions(+), 6 deletions(-) create mode 100644 crates/store/re_video/src/decode/ffmpeg.rs diff --git a/Cargo.lock b/Cargo.lock index 26e9132e2bed..650342573024 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -2463,6 +2463,15 @@ dependencies = [ "simd-adler32", ] +[[package]] +name = "ffmpeg-sidecar" +version = "1.1.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4bd1e249e0ceeb0f5c9f84a3c6941c3bde3ebc2815f4b94531a7e806af61c4c0" +dependencies = [ + "anyhow", +] + [[package]] name = "filetime" version = "0.2.23" @@ -6516,6 +6525,7 @@ dependencies = [ "criterion", "crossbeam", "econtext", + "ffmpeg-sidecar", "indicatif", "itertools 0.13.0", "js-sys", diff --git a/Cargo.toml b/Cargo.toml index d5df6f87a744..a4edee627548 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -177,6 +177,7 @@ econtext = "0.2" # Prints error contexts on crashes ehttp = "0.5.0" enumset = "1.0.12" env_logger = { version = "0.10", default-features = false } +ffmpeg-sidecar = "1.1.2" fixed = { version = "<1.28", default-features = false } # 1.28+ is MSRV 1.79+ flatbuffers = "23.0" futures-channel = "0.3" diff --git a/crates/store/re_video/Cargo.toml b/crates/store/re_video/Cargo.toml index f9dd00bf199f..458d68b4403c 100644 --- a/crates/store/re_video/Cargo.toml +++ b/crates/store/re_video/Cargo.toml @@ -23,7 +23,7 @@ features = ["all"] [features] -default = ["av1"] +default = ["av1", "ffmpeg"] ## Enable serialization for data structures that support it. serde = ["dep:serde"] @@ -31,6 +31,9 @@ serde = ["dep:serde"] ## Native AV1 decoding. av1 = ["dep:dav1d"] +## Decode H.264 using ffmpeg over CLI. +ffmpeg = ["dep:ffmpeg-sidecar"] + ## Enable faster native video decoding with assembly. ## You need to install [nasm](https://nasm.us/) to compile with this feature. 
nasm = [
@@ -49,9 +52,11 @@ econtext.workspace = true
itertools.workspace = true
parking_lot.workspace = true
re_mp4.workspace = true
-serde = { workspace = true, optional = true }
thiserror.workspace = true

+ffmpeg-sidecar = { workspace = true, optional = true }
+serde = { workspace = true, optional = true }
+
# We enable re_rav1d on native, UNLESS we're on Linux Arm64
# See https://github.com/rerun-io/rerun/issues/7755
[target.'cfg(all(not(target_arch = "wasm32"), not(all(target_os = "linux", target_arch = "aarch64"))))'.dependencies]
@@ -83,6 +88,7 @@ web-sys = { workspace = true, features = [
] }

[dev-dependencies]
+# For the `frames` example:
indicatif.workspace = true

criterion.workspace = true
diff --git a/crates/store/re_video/build.rs b/crates/store/re_video/build.rs
index 261ccb770ba3..e9fdfb6aa24f 100644
--- a/crates/store/re_video/build.rs
+++ b/crates/store/re_video/build.rs
@@ -10,5 +10,6 @@ fn main() {
        native: { not(target_arch = "wasm32") },
        linux_arm64: { all(target_os = "linux", target_arch = "aarch64") },
        with_dav1d: { all(feature = "av1", native, not(linux_arm64)) }, // https://github.com/rerun-io/rerun/issues/7755
+        with_ffmpeg: { all(feature= "ffmpeg", native) }
    }
}
diff --git a/crates/store/re_video/examples/frames.rs b/crates/store/re_video/examples/frames.rs
index cd931f31baa0..4837a09cf554 100644
--- a/crates/store/re_video/examples/frames.rs
+++ b/crates/store/re_video/examples/frames.rs
@@ -14,6 +14,8 @@ use indicatif::ProgressBar;
use parking_lot::Mutex;

fn main() {
+    re_log::setup_logging();
+
    // frames
    let args: Vec<_> = std::env::args().collect();
    let Some(video_path) = args.get(1) else {
@@ -83,8 +85,15 @@ fn main() {
            .create(true)
            .truncate(true)
            .open(output_dir.join(format!("{i:0width$}.ppm")))
-            .expect("failed to open file");
-        write_binary_ppm(&mut file, frame.width, frame.height, &frame.data);
+            .expect("failed to open file");
+        match frame.format {
+            re_video::PixelFormat::Rgb8Unorm => {
+                write_ppm_rgb24(&mut file, frame.width, frame.height, &frame.data);
+            }
+            re_video::PixelFormat::Rgba8Unorm => {
+                write_ppm_rgba32(&mut file, frame.width, frame.height, &frame.data);
+            }
+        }
    }
}

@@ -93,7 +102,24 @@ fn num_digits(n: usize) -> usize {
    (n as f64).log10().floor() as usize + 1
}

-fn write_binary_ppm(file: &mut File, width: u32, height: u32, rgba: &[u8]) {
+fn write_ppm_rgb24(file: &mut File, width: u32, height: u32, rgb: &[u8]) {
+    assert_eq!(width as usize * height as usize * 3, rgb.len());
+
+    let header = format!("P6\n{width} {height}\n255\n");
+
+    let mut data = Vec::with_capacity(header.len() + width as usize * height as usize * 3);
+    data.extend_from_slice(header.as_bytes());
+
+    for rgb in rgb.chunks(3) {
+        data.extend_from_slice(&[rgb[0], rgb[1], rgb[2]]);
+    }
+
+    file.write_all(&data).expect("failed to write frame data");
+}
+
+fn write_ppm_rgba32(file: &mut File, width: u32, height: u32, rgba: &[u8]) {
+    assert_eq!(width as usize * height as usize * 4, rgba.len());
+
    let header = format!("P6\n{width} {height}\n255\n");

    let mut data = Vec::with_capacity(header.len() + width as usize * height as usize * 3);
diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
new file mode 100644
index 000000000000..c6d244f7e0ac
--- /dev/null
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -0,0 +1,216 @@
+//! Send video data to `ffmpeg` over CLI to decode it.
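(A note on the overall data flow before the rest of this new file: the decoder spawns `ffmpeg` as a child process, feeds it an Annex B H.264 stream on stdin, and reads decoded rgb24 frames back from stdout. Below is a minimal standalone sketch of that round-trip with `ffmpeg-sidecar`, not taken from this patch: error handling is elided, `video.h264` is a hypothetical input file, and `anyhow` is assumed only for brevity.)

```rust
use std::io::Write as _;

use ffmpeg_sidecar::{command::FfmpegCommand, event::FfmpegEvent};

fn main() -> anyhow::Result<()> {
    let mut ffmpeg = FfmpegCommand::new()
        .format("h264") // input format; must come before `.input`
        .input("-") // read the bitstream from stdin
        .rawvideo() // write raw rgb24 frames to stdout
        .spawn()?;

    let mut stdin = ffmpeg.take_stdin().expect("no stdin");
    stdin.write_all(&std::fs::read("video.h264")?)?; // hypothetical Annex B file
    drop(stdin); // closing stdin tells ffmpeg the stream has ended

    for event in ffmpeg.iter()? {
        if let FfmpegEvent::OutputFrame(frame) = event {
            println!("frame {}: {}x{}", frame.frame_num, frame.width, frame.height);
        }
    }
    Ok(())
}
```

Writing all input before reading only works for short clips; on a long stream the stdout pipe fills up and both processes deadlock, which is why the decoder below drains frames on a dedicated thread.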
+ +use crossbeam::channel::Receiver; +use ffmpeg_sidecar::{ + child::FfmpegChild, + command::FfmpegCommand, + event::{FfmpegEvent, LogLevel}, +}; + +use crate::{Time, Timescale}; + +use super::{async_decoder_wrapper::SyncDecoder, Frame, Result}; + +/// Decode H.264 video via ffmpeg over CLI + +pub struct FfmpegCliH264Decoder { + /// How we send more data to the ffmpeg process + ffmpeg_stdin: std::process::ChildStdin, + + /// How we receive new frames back from ffmpeg + frame_rx: Receiver>, + + avcc: re_mp4::Avc1Box, + timescale: Timescale, +} + +impl FfmpegCliH264Decoder { + pub fn new(avcc: re_mp4::Avc1Box, timescale: Timescale) -> Result { + re_tracing::profile_function!(); + + let mut ffmpeg = { + re_tracing::profile_scope!("spawn-ffmpeg"); + + FfmpegCommand::new() + .hide_banner() + // Keep in mind that all arguments that are about the input, need to go before! + .format("h264") // High risk here: What's is available? + .input("-") // stdin is our input! + .rawvideo() // Output rgb24 on stdout. (TODO(emilk) for later: any format we can read directly on re_renderer would be better!) + .spawn() + .expect("Failed to spawn ffmpeg") + }; + + let mut ffmpeg_stdin = ffmpeg.take_stdin().unwrap(); + let ffmpeg_iterator = ffmpeg.iter().unwrap(); + + let (frame_tx, frame_rx) = crossbeam::channel::unbounded(); + + let thread_handle = std::thread::Builder::new() + .name("ffmpeg-reader".to_owned()) + .spawn(move || { + for event in ffmpeg_iterator { + match event { + FfmpegEvent::Log(LogLevel::Warning, msg) => re_log::warn_once!("{msg}"), + FfmpegEvent::Log(LogLevel::Error, msg) => re_log::error_once!("{msg}"), // TODO: report errors + FfmpegEvent::Progress(p) => { + re_log::debug!("Progress: {}", p.time) + } + FfmpegEvent::OutputFrame(frame) => { + re_log::trace!( + "Received frame: d[0] {} time {:?} fmt {:?} size {}x{}", + frame.data[0], + frame.timestamp, + frame.pix_fmt, + frame.width, + frame.height + ); + + debug_assert_eq!(frame.pix_fmt, "rgb24"); + debug_assert_eq!( + frame.width as usize * frame.height as usize * 3, + frame.data.len() + ); + + frame_tx.send(Ok(super::Frame { + width: frame.width, + height: frame.height, + data: frame.data, + format: crate::PixelFormat::Rgb8Unorm, + presentation_timestamp: Time::from_secs( + frame.timestamp as f64, + timescale, + ), + duration: Time::from_secs(0.1, timescale), // TODO + })); // TODO: handle disconnect + } + // TODO: handle all events + event => re_log::debug!("Event: {event:?}"), + } + } + re_log::debug!("Shutting down ffmpeg"); + }); + + Ok(Self { + ffmpeg_stdin, + frame_rx, + avcc, + timescale, + }) + } +} + +impl SyncDecoder for FfmpegCliH264Decoder { + fn submit_chunk( + &mut self, + should_stop: &std::sync::atomic::AtomicBool, + chunk: super::Chunk, + on_output: &super::OutputCallback, + ) { + re_tracing::profile_function!(); + + let mut state = NaluStreamState::default(); + write_avc_chunk_to_nalu_stream(&self.avcc, &mut self.ffmpeg_stdin, &chunk, &mut state) + .unwrap(); + // consider writing samples while at the same time reading frames, for even lower latency + // and maybe reuse the same ffmpeg process. + + // TODO: handle errors + while let Ok(frame_result) = self.frame_rx.try_recv() { + on_output(frame_result); + } + } + + fn reset(&mut self) { + // TODO: restart ffmpeg process + } +} + +/// Before every NAL unit, here is a nal start code. +/// Can also be 2 bytes of 0x00 and 1 byte of 0x01. +/// +/// This is used in byte stream formats such as h264 files. +/// Packet transform systems (RTP) may omit these. 
+pub const NAL_START_CODE: &[u8] = &[0x00, 0x00, 0x00, 0x01]; + +#[derive(Default)] +struct NaluStreamState { + previous_frame_was_idr: bool, +} + +fn write_avc_chunk_to_nalu_stream( + avcc: &re_mp4::Avc1Box, + nalu_stream: &mut dyn std::io::Write, + chunk: &super::Chunk, + state: &mut NaluStreamState, +) -> Result<(), Box> { + re_tracing::profile_function!(); + let avcc = &avcc.avcc; + + // Append SPS (Sequence Parameter Set) & PPS (Picture Parameter Set) NAL unit whenever encountering + // an IDR frame unless the previous frame was an IDR frame. + // TODO(andreas): Should we detect this rather from the NALU stream rather than the samples? + if chunk.is_sync && !state.previous_frame_was_idr { + for sps in (&avcc.sequence_parameter_sets).iter() { + nalu_stream.write_all(&NAL_START_CODE)?; + nalu_stream.write_all(&sps.bytes)?; + } + for pps in (&avcc.picture_parameter_sets).iter() { + nalu_stream.write_all(&NAL_START_CODE)?; + nalu_stream.write_all(&pps.bytes)?; + } + state.previous_frame_was_idr = true; + } else { + state.previous_frame_was_idr = false; + } + + // A single cjhunk may consist of multiple NAL units, each of which need our special treatment. + // (most of the time it's 1:1, but there might be extra NAL units for info, especially at the start). + let mut buffer_offset: usize = 0; + let sample_end = chunk.data.len(); + while buffer_offset < sample_end { + re_tracing::profile_scope!("nalu"); + + // Each NAL unit in mp4 is prefixed with a length prefix. + // In Annex B this doesn't exist. + let length_prefix_size = avcc.length_size_minus_one as usize + 1; + + // TODO: improve the error handling here. + let nal_unit_size = match length_prefix_size { + 4 => u32::from_be_bytes( + chunk.data[buffer_offset..(buffer_offset + 4)] + .try_into() + .unwrap(), + ) as usize, + 2 => u16::from_be_bytes( + chunk.data[buffer_offset..(buffer_offset + 2)] + .try_into() + .unwrap(), + ) as usize, + 1 => chunk.data[buffer_offset] as usize, + _ => panic!("invalid length prefix size"), + }; + //re_log::debug!("nal unit size: {}", nal_unit_size); + + if chunk.data.len() < nal_unit_size { + panic!( + "sample size {} is smaller than nal unit size {nal_unit_size}", + chunk.data.len() + ); + } + + nalu_stream.write_all(&NAL_START_CODE)?; + let data_start = buffer_offset + length_prefix_size; // Skip the size. + let data_end = buffer_offset + nal_unit_size + length_prefix_size; + let data = &chunk.data[data_start..data_end]; + + // Note that we don't have to insert "emulation prevention bytes" since mp4 NALU still use them. + // (unlike the NAL start code, the presentation bytes are part of the NAL spec!) + + nalu_stream.write_all(data)?; + + buffer_offset = data_end; + } + + Ok(()) +} diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs index b870488029fd..d081881c6f22 100644 --- a/crates/store/re_video/src/decode/mod.rs +++ b/crates/store/re_video/src/decode/mod.rs @@ -77,11 +77,14 @@ //! supporting HDR content at which point more properties will be important! //! 
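(For context on what `write_avc_chunk_to_nalu_stream` above does: MP4/AVCC stores each NAL unit behind a big-endian length prefix, while ffmpeg's `h264` input expects Annex B start codes instead. Here is a minimal sketch of that transform for the common 4-byte-prefix case; it is an illustration only, not the patch's implementation, which also handles 1- and 2-byte prefixes and prepends SPS/PPS before IDR frames.)

```rust
/// Convert a buffer of 4-byte-length-prefixed NAL units into an Annex B stream.
fn avcc_to_annex_b(avcc: &[u8]) -> Vec<u8> {
    const START_CODE: [u8; 4] = [0x00, 0x00, 0x00, 0x01];
    let mut out = Vec::with_capacity(avcc.len() + 16);
    let mut offset = 0;
    while offset + 4 <= avcc.len() {
        let len = u32::from_be_bytes(avcc[offset..offset + 4].try_into().unwrap()) as usize;
        offset += 4;
        let Some(nal_unit) = avcc.get(offset..offset + len) else {
            break; // truncated input
        };
        out.extend_from_slice(&START_CODE); // the start code replaces the length prefix
        out.extend_from_slice(nal_unit); // NAL unit payload is copied unchanged
        offset += len;
    }
    out
}
```

For example, the input `[0, 0, 0, 2, 0x09, 0xF0]` (one 2-byte NAL unit) becomes `[0, 0, 0, 1, 0x09, 0xF0]`.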
-#[cfg(with_dav1d)] +#[cfg(any(with_dav1d, with_ffmpeg))] mod async_decoder_wrapper; #[cfg(with_dav1d)] mod av1; +#[cfg(with_ffmpeg)] +pub mod ffmpeg; + #[cfg(target_arch = "wasm32")] mod webcodecs; diff --git a/crates/store/re_video/src/demux/mod.rs b/crates/store/re_video/src/demux/mod.rs index d93083a21cb1..4a642113e39b 100644 --- a/crates/store/re_video/src/demux/mod.rs +++ b/crates/store/re_video/src/demux/mod.rs @@ -337,6 +337,10 @@ impl Config { pub fn is_av1(&self) -> bool { matches!(self.stsd.contents, re_mp4::StsdBoxContent::Av01 { .. }) } + + pub fn is_h264(&self) -> bool { + matches!(self.stsd.contents, re_mp4::StsdBoxContent::Avc1 { .. }) + } } /// Errors that can occur when loading a video. From a06107ef1c75bb8e7f4c01deec2d045418383f43 Mon Sep 17 00:00:00 2001 From: Emil Ernerfeldt Date: Tue, 8 Oct 2024 22:01:20 +0200 Subject: [PATCH 02/33] Actual H.264 video playback inside of Rerun viewer --- crates/store/re_video/src/decode/mod.rs | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs index d081881c6f22..e7e9ff173afd 100644 --- a/crates/store/re_video/src/decode/mod.rs +++ b/crates/store/re_video/src/decode/mod.rs @@ -181,6 +181,19 @@ pub fn new_decoder( } } + #[cfg(with_ffmpeg)] + re_mp4::StsdBoxContent::Avc1(avc1_box) => { + re_log::trace!("Decoding H.264…"); + return Ok(Box::new(async_decoder_wrapper::AsyncDecoderWrapper::new( + debug_name.to_owned(), + Box::new(ffmpeg::FfmpegCliH264Decoder::new( + avc1_box.clone(), + video.timescale, + )?), + on_output, + ))); + } + _ => Err(Error::UnsupportedCodec(video.human_readable_codec_string())), } } From 770f24c4dcedc7b734166394d0fa393037b44318 Mon Sep 17 00:00:00 2001 From: Emil Ernerfeldt Date: Wed, 9 Oct 2024 06:00:16 +0200 Subject: [PATCH 03/33] Fix timestamps and seeking --- crates/store/re_video/src/decode/ffmpeg.rs | 111 +++++++++++++++------ crates/store/re_video/src/decode/mod.rs | 8 ++ 2 files changed, 88 insertions(+), 31 deletions(-) diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs index c6d244f7e0ac..cf5de2cf3424 100644 --- a/crates/store/re_video/src/decode/ffmpeg.rs +++ b/crates/store/re_video/src/decode/ffmpeg.rs @@ -1,6 +1,6 @@ //! Send video data to `ffmpeg` over CLI to decode it. -use crossbeam::channel::Receiver; +use crossbeam::channel::{Receiver, Sender}; use ffmpeg_sidecar::{ child::FfmpegChild, command::FfmpegCommand, @@ -9,14 +9,29 @@ use ffmpeg_sidecar::{ use crate::{Time, Timescale}; -use super::{async_decoder_wrapper::SyncDecoder, Frame, Result}; +use super::{async_decoder_wrapper::SyncDecoder, Error, Frame, Result}; + +/// ffmpeg does not tell us the timestamp/duration of a given frame, so we need to remember it. +struct FrameInfo { + /// Monotonic index, from start + frame_num: u32, + + timestamp: Time, + duration: Time, +} /// Decode H.264 video via ffmpeg over CLI pub struct FfmpegCliH264Decoder { + /// Monotonically increasing + frame_num: u32, + /// How we send more data to the ffmpeg process ffmpeg_stdin: std::process::ChildStdin, + /// For sending frame timestamps to the decoder thread + frame_info_tx: Sender, + /// How we receive new frames back from ffmpeg frame_rx: Receiver>, @@ -38,61 +53,82 @@ impl FfmpegCliH264Decoder { .input("-") // stdin is our input! .rawvideo() // Output rgb24 on stdout. (TODO(emilk) for later: any format we can read directly on re_renderer would be better!) 
.spawn() - .expect("Failed to spawn ffmpeg") + .map_err(Error::FailedToStartFfmpeg)? }; - let mut ffmpeg_stdin = ffmpeg.take_stdin().unwrap(); + let ffmpeg_stdin = ffmpeg.take_stdin().unwrap(); let ffmpeg_iterator = ffmpeg.iter().unwrap(); + let (frame_info_tx, frame_info_rx) = crossbeam::channel::unbounded(); let (frame_tx, frame_rx) = crossbeam::channel::unbounded(); - let thread_handle = std::thread::Builder::new() + std::thread::Builder::new() .name("ffmpeg-reader".to_owned()) .spawn(move || { for event in ffmpeg_iterator { match event { - FfmpegEvent::Log(LogLevel::Warning, msg) => re_log::warn_once!("{msg}"), + FfmpegEvent::Log(LogLevel::Warning, msg) => { + if !msg.contains( + "No accelerated colorspace conversion found from yuv420p to rgb24", + ) { + re_log::warn_once!("{msg}"); + } + } FfmpegEvent::Log(LogLevel::Error, msg) => re_log::error_once!("{msg}"), // TODO: report errors FfmpegEvent::Progress(p) => { - re_log::debug!("Progress: {}", p.time) + re_log::debug!("Progress: {}", p.time); } FfmpegEvent::OutputFrame(frame) => { - re_log::trace!( - "Received frame: d[0] {} time {:?} fmt {:?} size {}x{}", - frame.data[0], - frame.timestamp, - frame.pix_fmt, - frame.width, - frame.height - ); + // The `frame.timestamp` is monotonically increasing, + // so it is not the actual timestamp in the stream. + + let frame_info: FrameInfo = frame_info_rx.recv().unwrap(); + + let ffmpeg_sidecar::event::OutputVideoFrame { + frame_num, + pix_fmt, + width, + height, + data, + .. + } = frame; + + debug_assert_eq!(frame_info.frame_num, frame_num, "We are out-of-sync"); // TODO: fix somehow - debug_assert_eq!(frame.pix_fmt, "rgb24"); - debug_assert_eq!( - frame.width as usize * frame.height as usize * 3, - frame.data.len() + re_log::trace!( + "Received frame {frame_num}: fmt {pix_fmt:?} size {width}x{height}" ); - frame_tx.send(Ok(super::Frame { - width: frame.width, - height: frame.height, - data: frame.data, - format: crate::PixelFormat::Rgb8Unorm, - presentation_timestamp: Time::from_secs( - frame.timestamp as f64, - timescale, - ), - duration: Time::from_secs(0.1, timescale), // TODO - })); // TODO: handle disconnect + debug_assert_eq!(pix_fmt, "rgb24"); + debug_assert_eq!(width as usize * height as usize * 3, data.len()); + + if frame_tx + .send(Ok(super::Frame { + width, + height, + data, + format: crate::PixelFormat::Rgb8Unorm, + presentation_timestamp: frame_info.timestamp, + duration: frame_info.duration, + })) + .is_err() + { + re_log::debug!("Receiver disconnected"); + break; + } } // TODO: handle all events event => re_log::debug!("Event: {event:?}"), } } re_log::debug!("Shutting down ffmpeg"); - }); + }) + .expect("Failed to spawn ffmpeg thread"); Ok(Self { + frame_num: 0, ffmpeg_stdin, + frame_info_tx, frame_rx, avcc, timescale, @@ -109,6 +145,16 @@ impl SyncDecoder for FfmpegCliH264Decoder { ) { re_tracing::profile_function!(); + // NOTE: this assumes each sample/chunk will result in exactly one frame. + self.frame_info_tx.send(FrameInfo { + frame_num: self.frame_num, + timestamp: chunk.timestamp, + duration: chunk.duration, + }); + + // NOTE: a 60 FPS video can go for two years before wrapping a u32. 
+        self.frame_num = self.frame_num.wrapping_add(1);
+
        let mut state = NaluStreamState::default();
        write_avc_chunk_to_nalu_stream(&self.avcc, &mut self.ffmpeg_stdin, &chunk, &mut state)
            .unwrap();
        // consider writing samples while at the same time reading frames, for even lower latency
        // and maybe reuse the same ffmpeg process.

        // TODO: handle errors
        while let Ok(frame_result) = self.frame_rx.try_recv() {
+            if should_stop.load(std::sync::atomic::Ordering::Relaxed) {
+                return;
+            }
            on_output(frame_result);
        }
    }
diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs
index e7e9ff173afd..5a53357f96a3 100644
--- a/crates/store/re_video/src/decode/mod.rs
+++ b/crates/store/re_video/src/decode/mod.rs
@@ -114,6 +114,14 @@ pub enum Error {
    #[cfg(target_arch = "wasm32")]
    #[error(transparent)]
    WebDecoderError(#[from] webcodecs::Error),
+
+    #[cfg(with_ffmpeg)]
+    #[error("Failed to start ffmpeg: {0}")]
+    FailedToStartFfmpeg(std::io::Error),
+
+    #[cfg(with_ffmpeg)]
+    #[error("Failed to spawn ffmpeg thread: {0}")]
+    FailedToSpawnThread(std::io::Error),
}

pub type Result = std::result::Result;

From ab3d52aa75f71d98e01f5337add5e5f849915680 Mon Sep 17 00:00:00 2001
From: Emil Ernerfeldt 
Date: Wed, 9 Oct 2024 06:31:05 +0200
Subject: [PATCH 04/33] Code cleanup and better error handling

---
 crates/store/re_video/src/decode/ffmpeg.rs    | 241 ++++++++++++------
 crates/store/re_video/src/decode/mod.rs       |  15 +-
 crates/viewer/re_renderer/src/video/mod.rs    |   2 +-
 crates/viewer/re_renderer/src/video/player.rs |   2 +-
 4 files changed, 175 insertions(+), 85 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index cf5de2cf3424..3a369ee7b0cd 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -1,15 +1,35 @@
 //! Send video data to `ffmpeg` over CLI to decode it.

-use crossbeam::channel::{Receiver, Sender};
+use crossbeam::channel::{Receiver, Sender, TryRecvError};
 use ffmpeg_sidecar::{
-    child::FfmpegChild,
     command::FfmpegCommand,
     event::{FfmpegEvent, LogLevel},
 };

-use crate::{Time, Timescale};
+use crate::Time;

-use super::{async_decoder_wrapper::SyncDecoder, Error, Frame, Result};
+use super::{async_decoder_wrapper::SyncDecoder, Frame, Result};
+
+#[derive(thiserror::Error, Debug)]
+pub enum Error {
+    #[error("Failed to start ffmpeg: {0}")]
+    FailedToStartFfmpeg(std::io::Error),
+
+    #[error("Failed to get stdin handle")]
+    NoStdin,
+
+    #[error("Failed to get iterator: {0}")]
+    NoIterator(String),
+
+    #[error("There's a bug in Rerun")]
+    NoFrameInfo,
+}
+
+impl From<Error> for super::Error {
+    fn from(err: Error) -> Self {
+        Self::Ffmpeg(std::sync::Arc::new(err))
+    }
+}

/// ffmpeg does not tell us the timestamp/duration of a given frame, so we need to remember it.
struct FrameInfo {
    /// Monotonic index, from start
    frame_num: u32,

    timestamp: Time,
    duration: Time,
}

/// Decode H.264 video via ffmpeg over CLI

pub struct FfmpegCliH264Decoder {
    /// Monotonically increasing
    frame_num: u32,

    /// How we send more data to the ffmpeg process
    ffmpeg_stdin: std::process::ChildStdin,

    /// For sending frame timestamps to the decoder thread
    frame_info_tx: Sender,

    /// How we receive new frames back from ffmpeg
-    frame_rx: Receiver>,
+    frame_rx: Receiver>,

    avcc: re_mp4::Avc1Box,
-    timescale: Timescale,
}

impl FfmpegCliH264Decoder {
-    pub fn new(avcc: re_mp4::Avc1Box, timescale: Timescale) -> Result {
+    pub fn new(avcc: re_mp4::Avc1Box) -> Result {
        re_tracing::profile_function!();

        let mut ffmpeg = {
@@ -56,8 +75,10 @@ impl FfmpegCliH264Decoder {
            .map_err(Error::FailedToStartFfmpeg)?
}; - let ffmpeg_stdin = ffmpeg.take_stdin().unwrap(); - let ffmpeg_iterator = ffmpeg.iter().unwrap(); + let ffmpeg_stdin = ffmpeg.take_stdin().ok_or(Error::NoStdin)?; + let ffmpeg_iterator = ffmpeg + .iter() + .map_err(|err| Error::NoIterator(err.to_string()))?; let (frame_info_tx, frame_info_rx) = crossbeam::channel::unbounded(); let (frame_tx, frame_rx) = crossbeam::channel::unbounded(); @@ -65,62 +86,7 @@ impl FfmpegCliH264Decoder { std::thread::Builder::new() .name("ffmpeg-reader".to_owned()) .spawn(move || { - for event in ffmpeg_iterator { - match event { - FfmpegEvent::Log(LogLevel::Warning, msg) => { - if !msg.contains( - "No accelerated colorspace conversion found from yuv420p to rgb24", - ) { - re_log::warn_once!("{msg}"); - } - } - FfmpegEvent::Log(LogLevel::Error, msg) => re_log::error_once!("{msg}"), // TODO: report errors - FfmpegEvent::Progress(p) => { - re_log::debug!("Progress: {}", p.time); - } - FfmpegEvent::OutputFrame(frame) => { - // The `frame.timestamp` is monotonically increasing, - // so it is not the actual timestamp in the stream. - - let frame_info: FrameInfo = frame_info_rx.recv().unwrap(); - - let ffmpeg_sidecar::event::OutputVideoFrame { - frame_num, - pix_fmt, - width, - height, - data, - .. - } = frame; - - debug_assert_eq!(frame_info.frame_num, frame_num, "We are out-of-sync"); // TODO: fix somehow - - re_log::trace!( - "Received frame {frame_num}: fmt {pix_fmt:?} size {width}x{height}" - ); - - debug_assert_eq!(pix_fmt, "rgb24"); - debug_assert_eq!(width as usize * height as usize * 3, data.len()); - - if frame_tx - .send(Ok(super::Frame { - width, - height, - data, - format: crate::PixelFormat::Rgb8Unorm, - presentation_timestamp: frame_info.timestamp, - duration: frame_info.duration, - })) - .is_err() - { - re_log::debug!("Receiver disconnected"); - break; - } - } - // TODO: handle all events - event => re_log::debug!("Event: {event:?}"), - } - } + read_ffmpeg_output(ffmpeg_iterator, &frame_info_rx, &frame_tx); re_log::debug!("Shutting down ffmpeg"); }) .expect("Failed to spawn ffmpeg thread"); @@ -131,11 +97,142 @@ impl FfmpegCliH264Decoder { frame_info_tx, frame_rx, avcc, - timescale, }) } } +fn read_ffmpeg_output( + ffmpeg_iterator: ffmpeg_sidecar::iter::FfmpegIterator, + frame_info_rx: &Receiver, + frame_tx: &Sender>, +) { + for event in ffmpeg_iterator { + #[allow(clippy::match_same_arms)] + match event { + FfmpegEvent::Log(LogLevel::Info, msg) => { + re_log::debug!("{msg}"); + } + + FfmpegEvent::Log(LogLevel::Warning, msg) => { + if !msg.contains("No accelerated colorspace conversion found from yuv420p to rgb24") + { + re_log::warn_once!("{msg}"); + } + } + + FfmpegEvent::Log(LogLevel::Error, msg) => { + // TODO: report errors + re_log::error_once!("{msg}"); + } + + // Usefuless info in these: + FfmpegEvent::ParsedInput(_) => {} + FfmpegEvent::ParsedOutput(_) => {} + FfmpegEvent::ParsedStreamMapping(_) => {} + + FfmpegEvent::ParsedInputStream(stream) => { + let ffmpeg_sidecar::event::AVStream { + stream_type, + format, + pix_fmt, // Often 'yuv420p' + width, + height, + fps, + .. + } = stream; + + re_log::debug!("ParsedInputStream {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS"); + + debug_assert_eq!(stream_type.to_ascii_lowercase(), "video"); + } + + FfmpegEvent::ParsedOutputStream(stream) => { + // This just repeats what we told ffmpeg to output, e.g. "rawvideo rgb24" + let ffmpeg_sidecar::event::AVStream { + stream_type, + format, + pix_fmt, + width, + height, + fps, + .. 
+ } = stream; + + re_log::debug!("ParsedOutputStream {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS"); + + debug_assert_eq!(stream_type.to_ascii_lowercase(), "video"); + } + + FfmpegEvent::Progress(_) => { + // We can get out frame number etc here to know how far behind we are. + } + + FfmpegEvent::OutputFrame(frame) => { + // NOTE: `frame.timestamp` is monotonically increasing, + // and is not the actual timestamp in the stream. + + let frame_info: FrameInfo = match frame_info_rx.try_recv() { + Ok(frame_info) => frame_info, + + Err(TryRecvError::Disconnected) => { + re_log::debug!("Receiver disconnected"); + return; + } + + Err(TryRecvError::Empty) => { + // This shouldn't happen + if frame_tx.send(Err(Error::NoFrameInfo.into())).is_err() { + re_log::warn!("Got no frame-info, and failed to send error"); + } + return; + } + }; + + let ffmpeg_sidecar::event::OutputVideoFrame { + frame_num, + pix_fmt, + width, + height, + data, + .. + } = frame; + + debug_assert_eq!( + frame_info.frame_num, frame_num, + "We are out-of-sync with ffmpeg" + ); // TODO: fix somehow + + re_log::trace!("Received frame {frame_num}: fmt {pix_fmt:?} size {width}x{height}"); + + debug_assert_eq!(pix_fmt, "rgb24"); + debug_assert_eq!(width as usize * height as usize * 3, data.len()); + + if frame_tx + .send(Ok(super::Frame { + width, + height, + data, + format: crate::PixelFormat::Rgb8Unorm, + presentation_timestamp: frame_info.timestamp, + duration: frame_info.duration, + })) + .is_err() + { + re_log::debug!("Receiver disconnected"); + return; + } + } + + FfmpegEvent::Done => { + re_log::debug!("ffmpeg is Done"); + return; + } + // TODO: handle all events + event => re_log::debug!("Event: {event:?}"), + } + } +} + impl SyncDecoder for FfmpegCliH264Decoder { fn submit_chunk( &mut self, @@ -148,7 +245,7 @@ impl SyncDecoder for FfmpegCliH264Decoder { // NOTE: this assumes each sample/chunk will result in exactly one frame. self.frame_info_tx.send(FrameInfo { frame_num: self.frame_num, - timestamp: chunk.timestamp, + timestamp: chunk.composition_timestamp, duration: chunk.duration, }); @@ -200,12 +297,12 @@ fn write_avc_chunk_to_nalu_stream( // an IDR frame unless the previous frame was an IDR frame. // TODO(andreas): Should we detect this rather from the NALU stream rather than the samples? if chunk.is_sync && !state.previous_frame_was_idr { - for sps in (&avcc.sequence_parameter_sets).iter() { - nalu_stream.write_all(&NAL_START_CODE)?; + for sps in &avcc.sequence_parameter_sets { + nalu_stream.write_all(NAL_START_CODE)?; nalu_stream.write_all(&sps.bytes)?; } - for pps in (&avcc.picture_parameter_sets).iter() { - nalu_stream.write_all(&NAL_START_CODE)?; + for pps in &avcc.picture_parameter_sets { + nalu_stream.write_all(NAL_START_CODE)?; nalu_stream.write_all(&pps.bytes)?; } state.previous_frame_was_idr = true; @@ -248,7 +345,7 @@ fn write_avc_chunk_to_nalu_stream( ); } - nalu_stream.write_all(&NAL_START_CODE)?; + nalu_stream.write_all(NAL_START_CODE)?; let data_start = buffer_offset + length_prefix_size; // Skip the size. 
let data_end = buffer_offset + nal_unit_size + length_prefix_size;
        let data = &chunk.data[data_start..data_end];

        // Note that we don't have to insert "emulation prevention bytes" since mp4 NALU still use them.
        // (unlike the NAL start code, the presentation bytes are part of the NAL spec!)

        nalu_stream.write_all(data)?;

        buffer_offset = data_end;
    }

    Ok(())
}
diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs
index 5a53357f96a3..3877bdb08018 100644
--- a/crates/store/re_video/src/decode/mod.rs
+++ b/crates/store/re_video/src/decode/mod.rs
@@ -90,7 +90,7 @@ mod webcodecs;

use crate::Time;

-#[derive(thiserror::Error, Debug, Clone, PartialEq, Eq)]
+#[derive(thiserror::Error, Debug, Clone)]
pub enum Error {
    #[error("Unsupported codec: {0}")]
    UnsupportedCodec(String),
@@ -116,12 +116,8 @@ pub enum Error {
    WebDecoderError(#[from] webcodecs::Error),

    #[cfg(with_ffmpeg)]
-    #[error("Failed to start ffmpeg: {0}")]
-    FailedToStartFfmpeg(std::io::Error),
-
-    #[cfg(with_ffmpeg)]
-    #[error("Failed to spawn ffmpeg thread: {0}")]
-    FailedToSpawnThread(std::io::Error),
+    #[error(transparent)]
+    Ffmpeg(std::sync::Arc),
}

pub type Result = std::result::Result;
@@ -194,10 +190,7 @@ pub fn new_decoder(
            re_log::trace!("Decoding H.264…");
            return Ok(Box::new(async_decoder_wrapper::AsyncDecoderWrapper::new(
                debug_name.to_owned(),
-                Box::new(ffmpeg::FfmpegCliH264Decoder::new(
-                    avc1_box.clone(),
-                    video.timescale,
-                )?),
+                Box::new(ffmpeg::FfmpegCliH264Decoder::new(avc1_box.clone())?),
                on_output,
            )));
        }
diff --git a/crates/viewer/re_renderer/src/video/mod.rs b/crates/viewer/re_renderer/src/video/mod.rs
index 7404c1cc2d0b..d1398b42b817 100644
--- a/crates/viewer/re_renderer/src/video/mod.rs
+++ b/crates/viewer/re_renderer/src/video/mod.rs
@@ -11,7 +11,7 @@ use re_video::{decode::DecodeHardwareAcceleration, VideoData};
use crate::{resource_managers::GpuTexture2D, RenderContext};

/// Error that can occur during playing videos.
-#[derive(thiserror::Error, Debug, Clone, PartialEq, Eq)]
+#[derive(thiserror::Error, Debug, Clone)]
pub enum VideoPlayerError {
    #[error("The decoder is lagging behind")]
    EmptyBuffer,
diff --git a/crates/viewer/re_renderer/src/video/player.rs b/crates/viewer/re_renderer/src/video/player.rs
index 492032cc66cd..da831dbb3545 100644
--- a/crates/viewer/re_renderer/src/video/player.rs
+++ b/crates/viewer/re_renderer/src/video/player.rs
@@ -280,7 +280,7 @@ impl VideoPlayer {
        );

        if let Err(err) = result {
-            if err == VideoPlayerError::EmptyBuffer {
+            if matches!(err, VideoPlayerError::EmptyBuffer) {
                // No buffered frames

                // Might this be due to an error?

From b25a53980820b23fd7cf50c915ba5d73b78af8d1 Mon Sep 17 00:00:00 2001
From: Emil Ernerfeldt 
Date: Wed, 9 Oct 2024 12:43:33 +0200
Subject: [PATCH 05/33] Better error handling

---
 crates/store/re_video/src/decode/ffmpeg.rs | 125 +++++++++++++++------
 1 file changed, 91 insertions(+), 34 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index 3a369ee7b0cd..2cdea0d4b881 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -1,5 +1,7 @@
 //! Send video data to `ffmpeg` over CLI to decode it.
+use std::sync::atomic::Ordering;
+
use crossbeam::channel::{Receiver, Sender, TryRecvError};
use ffmpeg_sidecar::{
    command::FfmpegCommand,
    event::{FfmpegEvent, LogLevel},
@@ -23,6 +25,12 @@ pub enum Error {

    #[error("There's a bug in Rerun")]
    NoFrameInfo,
+
+    #[error("Failed to write data to ffmpeg: {0}")]
+    FailedToWriteToFfmpeg(std::io::Error),
+
+    #[error("Bad video data: {0}")]
+    BadVideoData(String),
}

impl From<Error> for super::Error {
@@ -67,7 +75,7 @@ pub struct FfmpegCliH264Decoder {
}

impl FfmpegCliH264Decoder {
-    pub fn new(avcc: re_mp4::Avc1Box) -> Result {
+    pub fn new(avcc: re_mp4::Avc1Box) -> Result {
        re_tracing::profile_function!();

        let mut ffmpeg = {
@@ -242,29 +250,53 @@ impl SyncDecoder for FfmpegCliH264Decoder {
    ) {
        re_tracing::profile_function!();

-        // TODO: handle errors
+        // First read any outstanding messages (e.g. error reports),
+        // so they get orderer correctly.
        while let Ok(frame_result) = self.frame_rx.try_recv() {
+            if should_stop.load(Ordering::Relaxed) {
+                return;
+            }
            on_output(frame_result);
        }

+        // We send the information about this chunk first.
+        // This assumes each sample/chunk will result in exactly one frame.
+        // If this assumption is not held, we will get weird errors, like videos playing too slowly.
+        let frame_info = FrameInfo {
            frame_num: self.frame_num,
            timestamp: chunk.composition_timestamp,
            duration: chunk.duration,
-        });
+        };

        // NOTE: a 60 FPS video can go for two years before wrapping a u32.
        self.frame_num = self.frame_num.wrapping_add(1);

-        let mut state = NaluStreamState::default();
-        write_avc_chunk_to_nalu_stream(&self.avcc, &mut self.ffmpeg_stdin, &chunk, &mut state)
-            .unwrap();
-        // consider writing samples while at the same time reading frames, for even lower latency
-        // and maybe reuse the same ffmpeg process.
+        if self.frame_info_tx.send(frame_info).is_err() {
+            // The other thread must be down, e.g. because `ffmpeg` crashed.
+            // It should already have reported that as an error - no need to repeat it here.
+        } else {
+            // Write chunk to ffmpeg:
+            let mut state = NaluStreamState::default(); // TODO: remove state?
+            if let Err(err) = write_avc_chunk_to_nalu_stream(
+                should_stop,
+                &self.avcc,
+                &mut self.ffmpeg_stdin,
+                &chunk,
+                &mut state,
+            ) {
+                on_output(Err(err.into()));
+            }
        }

-        // TODO: handle errors
+        // Read results and/or errors:
        while let Ok(frame_result) = self.frame_rx.try_recv() {
            if should_stop.load(Ordering::Relaxed) {
                return;
            }
            on_output(frame_result);
        }
-
-        // TODO: block until we have processed the frame!
    }

    fn reset(&mut self) {
@@ -285,11 +317,12 @@ struct NaluStreamState {
}

fn write_avc_chunk_to_nalu_stream(
+    should_stop: &std::sync::atomic::AtomicBool,
    avcc: &re_mp4::Avc1Box,
    nalu_stream: &mut dyn std::io::Write,
    chunk: &super::Chunk,
    state: &mut NaluStreamState,
-) -> Result<(), Box> {
+) -> Result<(), Error> {
    re_tracing::profile_function!();
    let avcc = &avcc.avcc;

    // Append SPS (Sequence Parameter Set) & PPS (Picture Parameter Set) NAL unit whenever encountering
    // an IDR frame unless the previous frame was an IDR frame.
    // TODO(andreas): Should we detect this rather from the NALU stream rather than the samples?
if chunk.is_sync && !state.previous_frame_was_idr {
        for sps in &avcc.sequence_parameter_sets {
-            nalu_stream.write_all(NAL_START_CODE)?;
-            nalu_stream.write_all(&sps.bytes)?;
+            nalu_stream
+                .write_all(NAL_START_CODE)
+                .map_err(Error::FailedToWriteToFfmpeg)?;
+            nalu_stream
+                .write_all(&sps.bytes)
+                .map_err(Error::FailedToWriteToFfmpeg)?;
        }
        for pps in &avcc.picture_parameter_sets {
-            nalu_stream.write_all(NAL_START_CODE)?;
-            nalu_stream.write_all(&pps.bytes)?;
+            nalu_stream
+                .write_all(NAL_START_CODE)
+                .map_err(Error::FailedToWriteToFfmpeg)?;
+            nalu_stream
+                .write_all(&pps.bytes)
+                .map_err(Error::FailedToWriteToFfmpeg)?;
        }
        state.previous_frame_was_idr = true;
    } else {
@@ -314,46 +355,62 @@ fn write_avc_chunk_to_nalu_stream(
    // (most of the time it's 1:1, but there might be extra NAL units for info, especially at the start).
    let mut buffer_offset: usize = 0;
    let sample_end = chunk.data.len();
-    while buffer_offset < sample_end {
+    while buffer_offset < sample_end && !should_stop.load(Ordering::Relaxed) {
        re_tracing::profile_scope!("nalu");

        // Each NAL unit in mp4 is prefixed with a length prefix.
        // In Annex B this doesn't exist.
        let length_prefix_size = avcc.length_size_minus_one as usize + 1;

+        if sample_end < buffer_offset + length_prefix_size {
+            return Err(Error::BadVideoData(
+                "Not enough bytes to fit the length prefix".to_owned(),
+            ));
+        }
+
        let nal_unit_size = match length_prefix_size {
-            4 => u32::from_be_bytes(
-                chunk.data[buffer_offset..(buffer_offset + 4)]
-                    .try_into()
-                    .unwrap(),
-            ) as usize,
-            2 => u16::from_be_bytes(
-                chunk.data[buffer_offset..(buffer_offset + 2)]
+            1 => chunk.data[buffer_offset] as usize,
+
+            2 => u16::from_be_bytes(
+                #[allow(clippy::unwrap_used)] // can't fail
+                chunk.data[buffer_offset..(buffer_offset + 2)]
                    .try_into()
                    .unwrap(),
            ) as usize,
-            1 => chunk.data[buffer_offset] as usize,
-            _ => panic!("invalid length prefix size"),
-        };
-        //re_log::debug!("nal unit size: {}", nal_unit_size);
+
+            4 => u32::from_be_bytes(
+                #[allow(clippy::unwrap_used)] // can't fail
+                chunk.data[buffer_offset..(buffer_offset + 4)]
+                    .try_into()
+                    .unwrap(),
+            ) as usize,

-        if chunk.data.len() < nal_unit_size {
-            panic!(
-                "sample size {} is smaller than nal unit size {nal_unit_size}",
-                chunk.data.len()
-            );
-        }
+            _ => {
+                return Err(Error::BadVideoData(format!(
+                    "Bad length prefix size: {length_prefix_size}"
+                )));
+            }
+        };

-        nalu_stream.write_all(NAL_START_CODE)?;
        let data_start = buffer_offset + length_prefix_size; // Skip the size.
        let data_end = buffer_offset + nal_unit_size + length_prefix_size;
+
+        if chunk.data.len() < data_end {
+            return Err(Error::BadVideoData("Not enough bytes to fit the NAL unit".to_owned()));
+        }
+
        let data = &chunk.data[data_start..data_end];

+        nalu_stream
+            .write_all(NAL_START_CODE)
+            .map_err(Error::FailedToWriteToFfmpeg)?;
+
        // Note that we don't have to insert "emulation prevention bytes" since mp4 NALU still use them.
        // (unlike the NAL start code, the presentation bytes are part of the NAL spec!)
nalu_stream
+            .write_all(data)
+            .map_err(Error::FailedToWriteToFfmpeg)?;

        buffer_offset = data_end;
    }

    Ok(())
}

From 32c58460831f2baba67fb5bac71af30ca98cd615 Mon Sep 17 00:00:00 2001
From: Emil Ernerfeldt 
Date: Wed, 9 Oct 2024 13:24:58 +0200
Subject: [PATCH 06/33] Improve log output and thread names

---
 .../src/decode/async_decoder_wrapper.rs       |  2 +-
 crates/store/re_video/src/decode/ffmpeg.rs    | 60 ++++++++++++++++---
 2 files changed, 52 insertions(+), 10 deletions(-)

diff --git a/crates/store/re_video/src/decode/async_decoder_wrapper.rs b/crates/store/re_video/src/decode/async_decoder_wrapper.rs
index d572e1cbc0c6..8bfac6842fb4 100644
--- a/crates/store/re_video/src/decode/async_decoder_wrapper.rs
+++ b/crates/store/re_video/src/decode/async_decoder_wrapper.rs
@@ -73,7 +73,7 @@ impl AsyncDecoderWrapper {
        let comms = Comms::default();

        let thread = std::thread::Builder::new()
-            .name("av1_decoder".into())
+            .name(format!("decoder thread for {debug_name}"))
            .spawn({
                let comms = comms.clone();
                move || {
diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index 2cdea0d4b881..e81e13a8299f 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -31,6 +31,12 @@ pub enum Error {

    #[error("Bad video data: {0}")]
    BadVideoData(String),
+
+    #[error("FFMPEG error: {0}")]
+    Ffmpeg(String),
+
+    #[error("FFMPEG IPC error: {0}")]
+    FfmpegSidecar(String),
}

impl From<Error> for super::Error {
@@ -49,7 +55,6 @@ struct FrameInfo {
}

/// Decode H.264 video via ffmpeg over CLI
-
pub struct FfmpegCliH264Decoder {
    /// Monotonically increasing
    frame_num: u32,
@@ -67,6 +72,8 @@ pub struct FfmpegCliH264Decoder {
}

impl FfmpegCliH264Decoder {
+    // TODO: make this robust against `pkill ffmpeg` somehow.
+    // Maybe `AsyncDecoder` can auto-restart us, or we wrap ourselves in a new struct that restarts us on certain errors?
    pub fn new(avcc: re_mp4::Avc1Box) -> Result {
        re_tracing::profile_function!();
@@ -114,23 +121,51 @@ fn read_ffmpeg_output(
    frame_info_rx: &Receiver,
    frame_tx: &Sender>,
) {
+    /// Ignore some common output from ffmpeg:
+    fn should_ignore_log_msg(msg: &str) -> bool {
+        let patterns = [
+            "Duration: N/A, bitrate: N/A",
+            "frame=    0 fps=0.0 q=0.0 size=       0kB time=N/A bitrate=N/A speed=N/A",
+            "Metadata:",
+            "No accelerated colorspace conversion found from yuv420p to rgb24",
+            "Stream mapping:",
+        ];
+
+        for pattern in patterns {
+            if msg.contains(pattern) {
+                return true;
+            }
+        }
+
+        false
+    }
+
    for event in ffmpeg_iterator {
        #[allow(clippy::match_same_arms)]
        match event {
            FfmpegEvent::Log(LogLevel::Info, msg) => {
-                re_log::debug!("{msg}");
+                if !should_ignore_log_msg(&msg) {
+                    re_log::debug!("{msg}");
+                }
            }

            FfmpegEvent::Log(LogLevel::Warning, msg) => {
-                if !msg.contains("No accelerated colorspace conversion found from yuv420p to rgb24")
-                {
+                if !should_ignore_log_msg(&msg) {
                    re_log::warn_once!("{msg}");
                }
            }

            FfmpegEvent::Log(LogLevel::Error, msg) => {
-                // TODO: report errors
-                re_log::error_once!("{msg}");
+                frame_tx.send(Err(Error::Ffmpeg(msg).into())).ok();
+            }
+
+            FfmpegEvent::LogEOF => {
+                // This event precedes `FfmpegEvent::Done`.
+                // This happens on `pkill ffmpeg`, for instance.
+            }
+
+            FfmpegEvent::Error(error) => {
+                frame_tx.send(Err(Error::FfmpegSidecar(error).into())).ok();
            }

            // Usefuless info in these:
            FfmpegEvent::ParsedInput(_) => {}
            FfmpegEvent::ParsedOutput(_) => {}
            FfmpegEvent::ParsedStreamMapping(_) => {}

            FfmpegEvent::ParsedInputStream(stream) => {
                let ffmpeg_sidecar::event::AVStream {
                    stream_type,
                    format,
                    pix_fmt, // Often 'yuv420p'
                    width,
                    height,
                    fps,
                    ..
} = stream; - re_log::debug!("ParsedInputStream {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS"); + re_log::debug!( + "Input: {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS" + ); debug_assert_eq!(stream_type.to_ascii_lowercase(), "video"); } @@ -166,7 +203,9 @@ fn read_ffmpeg_output( .. } = stream; - re_log::debug!("ParsedOutputStream {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS"); + re_log::debug!( + "Output: {stream_type} {format} {pix_fmt} {width}x{height} @ {fps} FPS" + ); debug_assert_eq!(stream_type.to_ascii_lowercase(), "video"); } @@ -232,9 +271,11 @@ fn read_ffmpeg_output( } FfmpegEvent::Done => { + // This happens on `pkill ffmpeg`, for instance. re_log::debug!("ffmpeg is Done"); return; } + // TODO: handle all events event => re_log::debug!("Event: {event:?}"), } @@ -356,7 +397,7 @@ fn write_avc_chunk_to_nalu_stream( let mut buffer_offset: usize = 0; let sample_end = chunk.data.len(); while buffer_offset < sample_end && !should_stop.load(Ordering::Relaxed) { - re_tracing::profile_scope!("nalu"); + re_tracing::profile_scope!("write_nalu"); // Each NAL unit in mp4 is prefixed with a length prefix. // In Annex B this doesn't exist. @@ -408,6 +449,7 @@ fn write_avc_chunk_to_nalu_stream( // Note that we don't have to insert "emulation prevention bytes" since mp4 NALU still use them. // (unlike the NAL start code, the presentation bytes are part of the NAL spec!) + re_tracing::profile_scope!("write_bytes", data.len().to_string()); nalu_stream .write_all(data) .map_err(Error::FailedToWriteToFfmpeg)?; From 32b673994803592203f290a9ec93e7fda07fe144 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Fri, 25 Oct 2024 17:14:46 +0200 Subject: [PATCH 07/33] reduce ffmpeg decode delay --- crates/store/re_video/src/decode/ffmpeg.rs | 23 +++++++++++++++++++++- 1 file changed, 22 insertions(+), 1 deletion(-) diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs index e81e13a8299f..ceca6a6f26ae 100644 --- a/crates/store/re_video/src/decode/ffmpeg.rs +++ b/crates/store/re_video/src/decode/ffmpeg.rs @@ -82,10 +82,31 @@ impl FfmpegCliH264Decoder { FfmpegCommand::new() .hide_banner() + // "Reduce the latency introduced by buffering during initial input streams analysis." + //.arg("-fflags nobuffer") + // + // .. instead use these more aggressive options found here + // https://stackoverflow.com/a/49273163 + .args([ + "-probesize", + "32", // 32 bytes is the minimum probe size. + "-analyzeduration", + "0", + ]) // Keep in mind that all arguments that are about the input, need to go before! .format("h264") // High risk here: What's is available? .input("-") // stdin is our input! - .rawvideo() // Output rgb24 on stdout. (TODO(emilk) for later: any format we can read directly on re_renderer would be better!) + // TODO: Do we have to do this instead? + // Set constant frame rate. + // We can't properly handle variable frame rate since `rawvideo` output won't report timestamps. + // To work around this we'd first need to establish a mapping of frame numbers to timestamps. + // This isn't entirely trivial since individual chunks may have arbitrary composition & decode timestamps. + //.fps_mode(1) + // + // TODO(andreas): at least do `rgba`. But we could also do `yuv420p` for instance if that's what the video is specifying + // (should be faster overall at no quality loss if the video is in this format). + // Check `ffmpeg -pix_fmts` for full list. + .rawvideo() // Output rgb24 on stdout. 
.spawn()
            .map_err(Error::FailedToStartFfmpeg)?
    };

From 19fe5d0ce3149a9cddb711f7b4f19f3dd6472f22 Mon Sep 17 00:00:00 2001
From: Andreas Reich 
Date: Fri, 25 Oct 2024 17:14:58 +0200
Subject: [PATCH 08/33] fix re_video example build

---
 crates/store/re_video/examples/frames.rs | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/crates/store/re_video/examples/frames.rs b/crates/store/re_video/examples/frames.rs
index 4837a09cf554..18b9c55bd59a 100644
--- a/crates/store/re_video/examples/frames.rs
+++ b/crates/store/re_video/examples/frames.rs
@@ -93,6 +93,9 @@ fn main() {
            re_video::PixelFormat::Rgba8Unorm => {
                write_ppm_rgba32(&mut file, frame.width, frame.height, &frame.data);
            }
+            re_video::PixelFormat::Yuv { .. } => {
+                re_log::error_once!("YUV frame writing is not supported");
+            }
        }
    }
}

From e4d37402138cbefbf9c5299725fdbb24418a5b60 Mon Sep 17 00:00:00 2001
From: Andreas Reich 
Date: Fri, 25 Oct 2024 17:31:39 +0200
Subject: [PATCH 09/33] add decode timestamp, nal header parsing, various
 comments, todo notes

---
 crates/store/re_video/src/decode/ffmpeg.rs    | 97 ++++++++++++++++---
 crates/store/re_video/src/decode/mod.rs       |  8 ++
 crates/store/re_video/src/demux/mod.rs        |  1 +
 crates/viewer/re_renderer/src/video/player.rs |  3 +-
 4 files changed, 97 insertions(+), 12 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index ceca6a6f26ae..e68cb4fd207e 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -1,6 +1,6 @@
 //! Send video data to `ffmpeg` over CLI to decode it.

-use std::sync::atomic::Ordering;
+use std::{io::Write, sync::atomic::Ordering};

use crossbeam::channel::{Receiver, Sender, TryRecvError};
use ffmpeg_sidecar::{
    command::FfmpegCommand,
@@ -23,7 +23,7 @@ pub enum Error {
    #[error("Failed to get iterator: {0}")]
    NoIterator(String),

-    #[error("There's a bug in Rerun")]
+    #[error("No frame info received, this is likely a bug in Rerun")]
    NoFrameInfo,

    #[error("Failed to write data to ffmpeg: {0}")]
    FailedToWriteToFfmpeg(std::io::Error),
@@ -236,9 +236,6 @@ fn read_ffmpeg_output(
            }

            FfmpegEvent::OutputFrame(frame) => {
-                // NOTE: `frame.timestamp` is monotonically increasing,
-                // and is not the actual timestamp in the stream.
-
                let frame_info: FrameInfo = match frame_info_rx.try_recv() {
@@ -313,7 +311,7 @@ impl SyncDecoder for FfmpegCliH264Decoder {
        re_tracing::profile_function!();

        // First read any outstanding messages (e.g. error reports),
-        // so they get orderer correctly.
+        // so they get ordered correctly.
        while let Ok(frame_result) = self.frame_rx.try_recv() {
            if should_stop.load(Ordering::Relaxed) {
                return;
            }
            on_output(frame_result);
        }

        // We send the information about this chunk first.
        // This assumes each sample/chunk will result in exactly one frame.
        // If this assumption is not held, we will get weird errors, like videos playing too slowly.
+        // TODO: this also assumes that the frame comes back in this order.
+        // Which is definitely wrong, as we know that frames are not necessarily in composition time stamp order!
let frame_info = FrameInfo { frame_num: self.frame_num, timestamp: chunk.composition_timestamp, @@ -348,17 +348,16 @@ impl SyncDecoder for FfmpegCliH264Decoder { ) { on_output(Err(err.into())); } + + self.ffmpeg_stdin.flush().ok(); } - // Read results and/or errors: while let Ok(frame_result) = self.frame_rx.try_recv() { if should_stop.load(Ordering::Relaxed) { return; } on_output(frame_result); } - - // TODO: block until we have processed the frame! } fn reset(&mut self) { @@ -413,7 +412,7 @@ fn write_avc_chunk_to_nalu_stream( state.previous_frame_was_idr = false; } - // A single cjhunk may consist of multiple NAL units, each of which need our special treatment. + // A single chunk may consist of multiple NAL units, each of which need our special treatment. // (most of the time it's 1:1, but there might be extra NAL units for info, especially at the start). let mut buffer_offset: usize = 0; let sample_end = chunk.data.len(); @@ -461,6 +460,13 @@ fn write_avc_chunk_to_nalu_stream( return Err(Error::BadVideoData("Not enough bytes to".to_owned())); } + let nal_header = NalHeader(chunk.data[data_start]); + re_log::trace!( + "nal_header: {:?}, {}", + nal_header.unit_type(), + nal_header.ref_idc() + ); + let data = &chunk.data[data_start..data_end]; nalu_stream @@ -480,3 +486,72 @@ fn write_avc_chunk_to_nalu_stream( Ok(()) } + +/// Possible values for `nal_unit_type` field in `nal_unit`. +/// +/// Encodes to 5 bits. +/// Via: https://docs.rs/less-avc/0.1.5/src/less_avc/nal_unit.rs.html#232 +#[derive(PartialEq, Eq)] +#[non_exhaustive] +#[repr(u8)] +#[derive(Copy, Clone, Debug)] +pub enum NalUnitType { + /// Unspecified + Unspecified = 0, + + /// Coded slice of a non-IDR picture + CodedSliceOfANonIDRPicture = 1, + + /// Coded slice data partition A + CodedSliceDataPartitionA = 2, + + /// Coded slice data partition B + CodedSliceDataPartitionB = 3, + + /// Coded slice data partition C + CodedSliceDataPartitionC = 4, + + /// Coded slice of an IDR picture + CodedSliceOfAnIDRPicture = 5, + + /// Supplemental enhancement information (SEI) + SupplementalEnhancementInformation = 6, + + /// Sequence parameter set + SequenceParameterSet = 7, + + /// Picture parameter set + PictureParameterSet = 8, + + /// Header type not listed here. + Other, +} + +/// Header of the "Network Abstraction Layer" unit that is used by H.264/AVC & H.265/HEVC. +#[derive(Copy, Clone, Debug, PartialEq, Eq)] +struct NalHeader(pub u8); + +impl NalHeader { + pub fn unit_type(self) -> NalUnitType { + match self.0 & 0b111 { + 0 => NalUnitType::Unspecified, + 1 => NalUnitType::CodedSliceOfANonIDRPicture, + 2 => NalUnitType::CodedSliceDataPartitionA, + 3 => NalUnitType::CodedSliceDataPartitionB, + 4 => NalUnitType::CodedSliceDataPartitionC, + 5 => NalUnitType::CodedSliceOfAnIDRPicture, + 6 => NalUnitType::SupplementalEnhancementInformation, + 7 => NalUnitType::SequenceParameterSet, + 8 => NalUnitType::PictureParameterSet, + _ => NalUnitType::Other, + } + } + + /// Ref idc is a value from 0-3 that tells us how "important" the frame/sample is. + /// + /// For details see: + /// + fn ref_idc(self) -> u8 { + (self.0 >> 5) & 0b11 + } +} diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs index 3877bdb08018..bcc49ffddffb 100644 --- a/crates/store/re_video/src/decode/mod.rs +++ b/crates/store/re_video/src/decode/mod.rs @@ -208,8 +208,16 @@ pub struct Chunk { pub data: Vec, + /// Decode timestamp of this sample. + /// Chunks are expected to be submitted in the order of decode timestamp. 
+ /// + /// `decode_timestamp <= composition_timestamp` + pub decode_timestamp: Time, + /// Presentation/composition timestamp for the sample in this chunk. /// *not* decode timestamp. + /// + /// `decode_timestamp <= composition_timestamp` pub composition_timestamp: Time, pub duration: Time, diff --git a/crates/store/re_video/src/demux/mod.rs b/crates/store/re_video/src/demux/mod.rs index 4a642113e39b..672d024d1b05 100644 --- a/crates/store/re_video/src/demux/mod.rs +++ b/crates/store/re_video/src/demux/mod.rs @@ -310,6 +310,7 @@ impl Sample { .to_vec(); Some(Chunk { data, + decode_timestamp: self.decode_timestamp, composition_timestamp: self.composition_timestamp, duration: self.duration, is_sync: self.is_sync, diff --git a/crates/viewer/re_renderer/src/video/player.rs b/crates/viewer/re_renderer/src/video/player.rs index da831dbb3545..a6c17d4d7904 100644 --- a/crates/viewer/re_renderer/src/video/player.rs +++ b/crates/viewer/re_renderer/src/video/player.rs @@ -188,8 +188,9 @@ impl VideoPlayer { // = determines the decoding order of samples // // Note: `decode <= composition` for any given sample. - // For some codecs, the two timestamps are the same. + // For some codecs & videos, the two timestamps are the same. // We must enqueue samples in decode order, but show them in composition order. + // In the presence of b-frames this order may be different! // 1. Find the latest sample where `decode_timestamp <= presentation_timestamp`. // Because `decode <= composition`, we never have to look further ahead in the From 6aa86939210726fd5a8ba54bb9c066de5c5ef2c1 Mon Sep 17 00:00:00 2001 From: Andreas Reich Date: Fri, 25 Oct 2024 18:07:04 +0200 Subject: [PATCH 10/33] better timestamp syncing strategy? --- crates/store/re_video/src/decode/av1.rs | 4 +- crates/store/re_video/src/decode/ffmpeg.rs | 73 +++++++++++-------- crates/store/re_video/src/decode/mod.rs | 10 +-- crates/store/re_video/src/demux/mod.rs | 11 +-- crates/store/re_video/src/demux/mp4.rs | 4 +- crates/viewer/re_renderer/src/video/player.rs | 4 +- 6 files changed, 58 insertions(+), 48 deletions(-) diff --git a/crates/store/re_video/src/decode/av1.rs b/crates/store/re_video/src/decode/av1.rs index 61e821622388..a1c8528d5c5a 100644 --- a/crates/store/re_video/src/decode/av1.rs +++ b/crates/store/re_video/src/decode/av1.rs @@ -76,14 +76,14 @@ impl SyncDav1dDecoder { re_tracing::profile_function!(); econtext::econtext_function_data!(format!( "chunk timestamp: {:?}", - chunk.composition_timestamp + chunk.presentation_timestamp )); re_tracing::profile_scope!("send_data"); match self.decoder.send_data( chunk.data, None, - Some(chunk.composition_timestamp.0), + Some(chunk.presentation_timestamp.0), Some(chunk.duration.0), ) { Ok(()) => {} diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs index e68cb4fd207e..863b01350fcb 100644 --- a/crates/store/re_video/src/decode/ffmpeg.rs +++ b/crates/store/re_video/src/decode/ffmpeg.rs @@ -1,8 +1,8 @@ //! Send video data to `ffmpeg` over CLI to decode it. -use std::{io::Write, sync::atomic::Ordering}; +use std::{collections::BTreeMap, io::Write, sync::atomic::Ordering}; -use crossbeam::channel::{Receiver, Sender, TryRecvError}; +use crossbeam::channel::{Receiver, Sender}; use ffmpeg_sidecar::{ command::FfmpegCommand, event::{FfmpegEvent, LogLevel}, @@ -47,10 +47,8 @@ impl From for super::Error { /// ffmpeg does not tell us the timestamp/duration of a given frame, so we need to remember it. 
struct FrameInfo {
-    /// Monotonic index, from start
-    frame_num: u32,
-
-    timestamp: Time,
+    decode_timestamp: Time,
+    presentation_timestamp: Time,
    duration: Time,
}

/// Decode H.264 video via ffmpeg over CLI
@@ -139,6 +139,8 @@ fn read_ffmpeg_output(
        false
    }

+    let mut pending_frames = BTreeMap::new();
+
    for event in ffmpeg_iterator {
        #[allow(clippy::match_same_arms)]
        match event {
@@ -236,25 +238,37 @@ fn read_ffmpeg_output(
            FfmpegEvent::OutputFrame(frame) => {
-                let frame_info: FrameInfo = match frame_info_rx.try_recv() {
-                    Ok(frame_info) => frame_info,
-
-                    Err(TryRecvError::Disconnected) => {
-                        re_log::debug!("Receiver disconnected");
-                        return;
-                    }
-
-                    Err(TryRecvError::Empty) => {
-                        // This shouldn't happen
-                        if frame_tx.send(Err(Error::NoFrameInfo.into())).is_err() {
-                            re_log::warn!("Got no frame-info, and failed to send error");
-                        }
-                        return;
-                    }
-                };
+                let frame_info = match pending_frames.pop_first() {
+                    Some((_, frame_info)) => frame_info,
+                    None => {
+                        // Retrieve frame infos until decode timestamp is no longer behind composition timestamp.
+                        // This is important because frame infos do not come in composition order,
+                        // but ffmpeg will report frames in composition order!
+                        loop {
+                            let Ok(frame_info) = frame_info_rx.try_recv() else {
+                                re_log::debug!("Receiver disconnected");
+                                return;
+                            };
+
+                            // Example of how presentation timestamps and decode timestamps can play out:
+                            // PTS: 1 4 2 3
+                            // DTS: 1 2 3 4
+                            // Stream: I P B B
+                            //
+                            // Essentially we need to wait until the dts has "caught up" with the pts!
+                            let highest_pts = pending_frames
+                                .last_key_value()
+                                .map_or(frame_info.presentation_timestamp, |(pts, _)| *pts);
+                            if frame_info.decode_timestamp <= highest_pts {
+                                break frame_info;
+                            }
+                            pending_frames.insert(frame_info.presentation_timestamp, frame_info);
+                        }
+                    }
+                };

                let ffmpeg_sidecar::event::OutputVideoFrame {
-                    frame_num,
+                    frame_num: _, // This is made up by ffmpeg sidecar.
                    pix_fmt,
                    width,
                    height,
                    data,
                    output_index: _, // This is the stream index. for all we do it's always 0.
                    timestamp: _, // This is a timestamp made up by ffmpeg_sidecar based on limited information it has.
                } = frame;

-                debug_assert_eq!(
-                    frame_info.frame_num, frame_num,
-                    "We are out-of-sync with ffmpeg"
-                ); // TODO: fix somehow
-
-                re_log::trace!("Received frame {frame_num}: fmt {pix_fmt:?} size {width}x{height}");
+                re_log::trace!(
+                    "Received frame: dts {:?} cts {:?} fmt {pix_fmt:?} size {width}x{height}",
+                    frame_info.decode_timestamp,
+                    frame_info.presentation_timestamp
+                );

                debug_assert_eq!(pix_fmt, "rgb24");
                debug_assert_eq!(width as usize * height as usize * 3, data.len());

                if frame_tx
                    .send(Ok(super::Frame {
                        width,
                        height,
                        data,
                        format: crate::PixelFormat::Rgb8Unorm,
-                        presentation_timestamp: frame_info.timestamp,
+                        presentation_timestamp: frame_info.presentation_timestamp,
                        duration: frame_info.duration,
                    }))
                    .is_err()
@@ -329,9 +333,9 @@ impl SyncDecoder for FfmpegCliH264Decoder {
        // We send the information about this chunk first.
        // This assumes each sample/chunk will result in exactly one frame.
        // If this assumption is not held, we will get weird errors, like videos playing too slowly.
         let frame_info = FrameInfo {
-            frame_num: self.frame_num,
-            timestamp: chunk.composition_timestamp,
+            presentation_timestamp: chunk.presentation_timestamp,
+            decode_timestamp: chunk.decode_timestamp,
             duration: chunk.duration,
         };
@@ -490,7 +499,7 @@
 /// Possible values for `nal_unit_type` field in `nal_unit`.
 ///
 /// Encodes to 5 bits.
-/// Via: https://docs.rs/less-avc/0.1.5/src/less_avc/nal_unit.rs.html#232
+/// Via: <https://docs.rs/less-avc/0.1.5/src/less_avc/nal_unit.rs.html#232>
 #[derive(PartialEq, Eq)]
 #[non_exhaustive]
 #[repr(u8)]
diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs
index bcc49ffddffb..3483aaaa0988 100644
--- a/crates/store/re_video/src/decode/mod.rs
+++ b/crates/store/re_video/src/decode/mod.rs
@@ -211,14 +211,14 @@ pub struct Chunk {
     /// Decode timestamp of this sample.
     /// Chunks are expected to be submitted in the order of decode timestamp.
     ///
-    /// `decode_timestamp <= composition_timestamp`
+    /// `decode_timestamp <= presentation_timestamp`
     pub decode_timestamp: Time,

-    /// Presentation/composition timestamp for the sample in this chunk.
-    /// *not* decode timestamp.
+    /// Presentation timestamp for the sample in this chunk.
+    /// Often synonymous with `composition_timestamp`.
     ///
-    /// `decode_timestamp <= composition_timestamp`
-    pub composition_timestamp: Time,
+    /// `decode_timestamp <= presentation_timestamp`
+    pub presentation_timestamp: Time,

     pub duration: Time,
 }
diff --git a/crates/store/re_video/src/demux/mod.rs b/crates/store/re_video/src/demux/mod.rs
index 672d024d1b05..1f4fd189991b 100644
--- a/crates/store/re_video/src/demux/mod.rs
+++ b/crates/store/re_video/src/demux/mod.rs
@@ -238,7 +238,7 @@ impl VideoData {
         self.gops.iter().flat_map(|seg| {
             self.samples[seg.range()]
                 .iter()
-                .map(|sample| sample.composition_timestamp.into_nanos(self.timescale))
+                .map(|sample| sample.presentation_timestamp.into_nanos(self.timescale))
                 .sorted()
         })
     }
@@ -276,15 +276,16 @@ pub struct Sample {
     ///
     /// Samples should be decoded in this order.
     ///
-    /// `decode_timestamp <= composition_timestamp`
+    /// `decode_timestamp <= presentation_timestamp`
     pub decode_timestamp: Time,

     /// Time at which this sample appears in the frame stream, in time units.
+    /// Often synonymous with `composition_timestamp`.
     ///
     /// The frame should be shown at this time.
     ///
-    /// `decode_timestamp <= composition_timestamp`
-    pub composition_timestamp: Time,
+    /// `decode_timestamp <= presentation_timestamp`
+    pub presentation_timestamp: Time,

     /// Duration of the sample, in time units.
     pub duration: Time,
@@ -311,7 +312,7 @@ impl Sample {
         Some(Chunk {
             data,
             decode_timestamp: self.decode_timestamp,
-            composition_timestamp: self.composition_timestamp,
+            presentation_timestamp: self.presentation_timestamp,
             duration: self.duration,
             is_sync: self.is_sync,
         })
diff --git a/crates/store/re_video/src/demux/mp4.rs b/crates/store/re_video/src/demux/mp4.rs
index 3bff80f0a63e..a886dd7429e2 100644
--- a/crates/store/re_video/src/demux/mp4.rs
+++ b/crates/store/re_video/src/demux/mp4.rs
@@ -54,7 +54,7 @@ impl VideoData {
             }

             let decode_timestamp = Time::new(sample.decode_timestamp as i64);
-            let composition_timestamp = Time::new(sample.composition_timestamp as i64);
+            let presentation_timestamp = Time::new(sample.composition_timestamp as i64);
             let duration = Time::new(sample.duration as i64);

             let byte_offset = sample.offset as u32;
@@ -63,7 +63,7 @@
             samples.push(Sample {
                 is_sync: sample.is_sync,
                 decode_timestamp,
-                composition_timestamp,
+                presentation_timestamp,
                 duration,
                 byte_offset,
                 byte_length,
diff --git a/crates/viewer/re_renderer/src/video/player.rs b/crates/viewer/re_renderer/src/video/player.rs
index a6c17d4d7904..0dc30812cf4e 100644
--- a/crates/viewer/re_renderer/src/video/player.rs
+++ b/crates/viewer/re_renderer/src/video/player.rs
@@ -204,11 +204,11 @@ impl VideoPlayer {
         };

         // 2. Search _backwards_, starting at `decode_sample_idx`, looking for
-        //    the first sample where `sample.composition_timestamp <= presentation_timestamp`.
+        //    the first sample where `sample.presentation_timestamp <= presentation_timestamp`.
         //    This is the sample which when decoded will be presented at the timestamp the user requested.
         let Some(requested_sample_idx) = self.data.samples[..=decode_sample_idx]
             .iter()
-            .rposition(|sample| sample.composition_timestamp <= presentation_timestamp)
+            .rposition(|sample| sample.presentation_timestamp <= presentation_timestamp)
         else {
             return Err(VideoPlayerError::EmptyVideo);
         };

From 84d0a55e9176c9732fd3fde8e7fe89e705081c81 Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Mon, 28 Oct 2024 11:11:18 +0100
Subject: [PATCH 11/33] make ffmpeg an async decoder

---
 crates/store/re_video/src/decode/ffmpeg.rs | 96 +++++++++-------------
 crates/store/re_video/src/decode/mod.rs    | 14 ++--
 2 files changed, 47 insertions(+), 63 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index 863b01350fcb..9c6681941aab 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -1,6 +1,6 @@
 //! Send video data to `ffmpeg` over CLI to decode it.

-use std::{collections::BTreeMap, io::Write, sync::atomic::Ordering};
+use std::{collections::BTreeMap, io::Write, sync::Arc};

 use crossbeam::channel::{Receiver, Sender};
 use ffmpeg_sidecar::{
@@ -10,7 +10,7 @@ use ffmpeg_sidecar::{

 use crate::Time;

-use super::{async_decoder_wrapper::SyncDecoder, Frame, Result};
+use super::{AsyncDecoder, Frame, OutputCallback};

 #[derive(thiserror::Error, Debug)]
 pub enum Error {
@@ -63,16 +63,18 @@ pub struct FfmpegCliH264Decoder {
     /// For sending frame timestamps to the decoder thread
     frame_info_tx: Sender<FrameInfo>,

-    /// How we receive new frames back from ffmpeg
-    frame_rx: Receiver<Result<Frame>>,
-
     avcc: re_mp4::Avc1Box,
+
+    on_output: Arc<OutputCallback>,
 }

 impl FfmpegCliH264Decoder {
     // TODO: make this robust against `pkill ffmpeg` somehow.
     // Maybe `AsyncDecoder` can auto-restart us, or we wrap ourselves in a new struct that restarts us on certain errors?
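One way the auto-restart idea floated above could take shape is a wrapper that resets and retries once on error. This is a hedged sketch with hypothetical names (`Decoder` here is not the crate's real trait, and the error type is simplified):

    trait Decoder {
        fn submit_chunk(&mut self, chunk: &[u8]) -> Result<(), String>;
        fn reset(&mut self) -> Result<(), String>;
    }

    struct RestartOnError<D: Decoder>(D);

    impl<D: Decoder> RestartOnError<D> {
        fn submit_chunk(&mut self, chunk: &[u8]) -> Result<(), String> {
            self.0.submit_chunk(chunk).or_else(|_| {
                // e.g. the ffmpeg process was killed: restart it and retry once.
                self.0.reset()?;
                self.0.submit_chunk(chunk)
            })
        }
    }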
-    pub fn new(avcc: re_mp4::Avc1Box) -> Result<Self> {
+    pub fn new(
+        avcc: re_mp4::Avc1Box,
+        on_output: impl Fn(super::Result<Frame>) + Send + Sync + 'static,
+    ) -> Result<Self> {
         re_tracing::profile_function!();

         let mut ffmpeg = {
@@ -115,13 +117,17 @@
             .map_err(|err| Error::NoIterator(err.to_string()))?;

         let (frame_info_tx, frame_info_rx) = crossbeam::channel::unbounded();
-        let (frame_tx, frame_rx) = crossbeam::channel::unbounded();
+
+        let on_output = Arc::new(on_output);

         std::thread::Builder::new()
             .name("ffmpeg-reader".to_owned())
-            .spawn(move || {
-                read_ffmpeg_output(ffmpeg_iterator, &frame_info_rx, &frame_tx);
-                re_log::debug!("Shutting down ffmpeg");
+            .spawn({
+                let on_output = on_output.clone();
+                move || {
+                    read_ffmpeg_output(ffmpeg_iterator, &frame_info_rx, on_output.as_ref());
+                    re_log::debug!("Shutting down ffmpeg");
+                }
             })
             .expect("Failed to spawn ffmpeg thread");

@@ -129,8 +135,8 @@
             frame_num: 0,
             ffmpeg_stdin,
             frame_info_tx,
-            frame_rx,
             avcc,
+            on_output,
         })
     }
 }

@@ -138,7 +144,7 @@
 fn read_ffmpeg_output(
     ffmpeg_iterator: ffmpeg_sidecar::iter::FfmpegIterator,
     frame_info_rx: &Receiver<FrameInfo>,
-    frame_tx: &Sender<super::Result<Frame>>,
+    on_output: &OutputCallback,
 ) {
     /// Ignore some common output from ffmpeg:
     fn should_ignore_log_msg(msg: &str) -> bool {
@@ -177,7 +183,7 @@
             }

             FfmpegEvent::Log(LogLevel::Error, msg) => {
-                frame_tx.send(Err(Error::Ffmpeg(msg).into())).ok();
+                on_output(Err(Error::Ffmpeg(msg).into()));
             }

             FfmpegEvent::LogEOF => {
@@ -186,7 +192,7 @@
             }

             FfmpegEvent::Error(error) => {
-                frame_tx.send(Err(Error::FfmpegSidecar(error).into())).ok();
+                on_output(Err(Error::FfmpegSidecar(error).into()));
             }

             // Useful info in these:
@@ -284,20 +290,14 @@
                 debug_assert_eq!(pix_fmt, "rgb24");
                 debug_assert_eq!(width as usize * height as usize * 3, data.len());

-                if frame_tx
-                    .send(Ok(super::Frame {
-                        width,
-                        height,
-                        data,
-                        format: crate::PixelFormat::Rgb8Unorm,
-                        presentation_timestamp: frame_info.presentation_timestamp,
-                        duration: frame_info.duration,
-                    }))
-                    .is_err()
-                {
-                    re_log::debug!("Receiver disconnected");
-                    return;
-                }
+                on_output(Ok(super::Frame {
+                    width,
+                    height,
+                    data,
+                    format: crate::PixelFormat::Rgb8Unorm,
+                    presentation_timestamp: frame_info.presentation_timestamp,
+                    duration: frame_info.duration,
+                }));
             }

             FfmpegEvent::Done => {
@@ -312,24 +312,10 @@
     }
 }

-impl SyncDecoder for FfmpegCliH264Decoder {
-    fn submit_chunk(
-        &mut self,
-        should_stop: &std::sync::atomic::AtomicBool,
-        chunk: super::Chunk,
-        on_output: &super::OutputCallback,
-    ) {
+impl AsyncDecoder for FfmpegCliH264Decoder {
+    fn submit_chunk(&mut self, chunk: super::Chunk) -> super::Result<()> {
         re_tracing::profile_function!();

-        // First read any outstanding messages (e.g. error reports),
-        // so they get ordered correctly.
-        while let Ok(frame_result) = self.frame_rx.try_recv() {
-            if should_stop.load(Ordering::Relaxed) {
-                return;
-            }
-            on_output(frame_result);
-        }
-
         // We send the information about this chunk first.
         // This assumes each sample/chunk will result in exactly one frame.
         // If this assumption is not held, we will get weird errors, like videos playing too slowly.
@@ -349,28 +335,29 @@
         // Write chunk to ffmpeg:
         let mut state = NaluStreamState::default(); // TODO: remove state?
         if let Err(err) = write_avc_chunk_to_nalu_stream(
-            should_stop,
             &self.avcc,
             &mut self.ffmpeg_stdin,
             &chunk,
             &mut state,
         ) {
-            on_output(Err(err.into()));
+            (self.on_output)(Err(err.into()));
         }

         self.ffmpeg_stdin.flush().ok();

-        while let Ok(frame_result) = self.frame_rx.try_recv() {
-            if should_stop.load(Ordering::Relaxed) {
-                return;
-            }
-            on_output(frame_result);
-        }
+        Ok(())
     }

-    fn reset(&mut self) {
+    fn reset(&mut self) -> super::Result<()> {
         // TODO: restart ffmpeg process
+        Ok(())
+    }
+}
+
+impl Drop for FfmpegCliH264Decoder {
+    fn drop(&mut self) {
+        // TODO: stop ffmpeg thread
     }
 }
@@ -387,7 +374,6 @@
 struct NaluStreamState {
 }

 fn write_avc_chunk_to_nalu_stream(
-    should_stop: &std::sync::atomic::AtomicBool,
     avcc: &re_mp4::Avc1Box,
     nalu_stream: &mut dyn std::io::Write,
     chunk: &super::Chunk,
@@ -425,7 +411,7 @@
     // (most of the time it's 1:1, but there might be extra NAL units for info, especially at the start).
     let mut buffer_offset: usize = 0;
     let sample_end = chunk.data.len();
-    while buffer_offset < sample_end && !should_stop.load(Ordering::Relaxed) {
+    while buffer_offset < sample_end {
         re_tracing::profile_scope!("write_nalu");

         // Each NAL unit in mp4 is prefixed with a length prefix.
diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs
index 3483aaaa0988..e79bd1736d72 100644
--- a/crates/store/re_video/src/decode/mod.rs
+++ b/crates/store/re_video/src/decode/mod.rs
@@ -77,14 +77,12 @@
 //! supporting HDR content at which point more properties will be important!
 //!

-#[cfg(any(with_dav1d, with_ffmpeg))]
+#[cfg(with_dav1d)]
 mod async_decoder_wrapper;
 #[cfg(with_dav1d)]
 mod av1;
-
 #[cfg(with_ffmpeg)]
-pub mod ffmpeg;
-
+mod ffmpeg;
 #[cfg(target_arch = "wasm32")]
 mod webcodecs;
@@ -187,12 +185,12 @@ pub fn new_decoder(
         #[cfg(with_ffmpeg)]
         re_mp4::StsdBoxContent::Avc1(avc1_box) => {
+            // TODO: check if we have ffmpeg ONCE, and remember
             re_log::trace!("Decoding H.264…");
-            return Ok(Box::new(async_decoder_wrapper::AsyncDecoderWrapper::new(
-                debug_name.to_owned(),
-                Box::new(ffmpeg::FfmpegCliH264Decoder::new(avc1_box.clone())?),
+            Ok(Box::new(ffmpeg::FfmpegCliH264Decoder::new(
+                avc1_box.clone(),
                 on_output,
-            )));
+            )?))
         }

         _ => Err(Error::UnsupportedCodec(video.human_readable_codec_string())),

From 4897f1964435f7fd7de56a6bb731fc007a570c55 Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Mon, 28 Oct 2024 12:54:02 +0100
Subject: [PATCH 12/33] set fps mode to passthrough

---
 crates/store/re_video/src/decode/ffmpeg.rs | 13 +++++--------
 1 file changed, 5 insertions(+), 8 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index 9c6681941aab..2d770c9a8aac 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -94,15 +94,12 @@ impl FfmpegCliH264Decoder {
                 "0",
             ])
             // Keep in mind that all arguments that are about the input, need to go before!
-            .format("h264") // High risk here: What's is available?
+            .format("h264") // TODO(andreas): should we check ahead of time whether this is available?
+            //.fps_mode("0")
             .input("-") // stdin is our input!
-            // TODO: Do we have to do this instead?
-            // Set constant frame rate.
-            // We can't properly handle variable frame rate since `rawvideo` output won't report timestamps.
-            // To work around this we'd first need to establish a mapping of frame numbers to timestamps.
-            // This isn't entirely trivial since individual chunks may have arbitrary composition & decode timestamps.
-            //.fps_mode(1)
-            //
+            // h264 bitstreams don't have timestamp information. Whatever ffmpeg tries to make up about timestamps is wrong.
+            // If we don't tell it to just pass the frames through, variable framerate (VFR) video will just not play at all.
+            .fps_mode("passthrough")
             // TODO(andreas): at least do `rgba`. But we could also do `yuv420p` for instance if that's what the video is specifying
             // (should be faster overall at no quality loss if the video is in this format).
             // Check `ffmpeg -pix_fmts` for full list.
             .rawvideo() // Output rgb24 on stdout.
             .spawn()
             .map_err(Error::FailedToStartFfmpeg)?
     };

From f8c70fcfb0e74c6ea3ba746cc30f59f9829c288f Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Mon, 28 Oct 2024 14:40:33 +0100
Subject: [PATCH 13/33] comments & debug output

---
 crates/store/re_video/src/decode/ffmpeg.rs | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index 2d770c9a8aac..d1445df324ea 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -54,9 +54,6 @@
 /// Decode H.264 video via ffmpeg over CLI
 pub struct FfmpegCliH264Decoder {
-    /// Monotonically increasing
-    frame_num: u32,
-
     /// How we send more data to the ffmpeg process
     ffmpeg_stdin: std::process::ChildStdin,
@@ -97,7 +94,7 @@
             .format("h264") // TODO(andreas): should we check ahead of time whether this is available?
             //.fps_mode("0")
             .input("-") // stdin is our input!
-            // h264 bitstreams don't have timestamp information. Whatever ffmpeg tries to make up about timestamps is wrong.
+            // h264 bitstreams don't have timestamp information. Whatever ffmpeg tries to make up about timing & framerates is wrong!
             // If we don't tell it to just pass the frames through, variable framerate (VFR) video will just not play at all.
             .fps_mode("passthrough")
@@ -129,7 +126,6 @@
         Ok(Self {
-            frame_num: 0,
             ffmpeg_stdin,
             frame_info_tx,
             avcc,
             on_output,
         })
@@ -193,8 +189,13 @@
             }

             // Useful info in these:
-            FfmpegEvent::ParsedInput(_) => {}
-            FfmpegEvent::ParsedOutput(_) => {}
+            FfmpegEvent::ParsedInput(input) => {
+                re_log::debug!("{input:?}");
+            }
+            FfmpegEvent::ParsedOutput(output) => {
+                re_log::debug!("{output:?}");
+            }
+
             FfmpegEvent::ParsedStreamMapping(_) => {}

             FfmpegEvent::ParsedInputStream(stream) => {
@@ -236,6 +237,7 @@
             FfmpegEvent::Progress(_) => {
                 // We can get our frame number etc. here to know how far behind we are.
+                // By default this triggers every 0.5s.
             }
@@ -322,9 +324,7 @@
             duration: chunk.duration,
         };

-        // NOTE: a 60 FPS video can go for two years before wrapping a u32.
-        self.frame_num = self.frame_num.wrapping_add(1);
-
+        // TODO: schedule this.
         if self.frame_info_tx.send(frame_info).is_err() {
             // The other thread must be down, e.g. because `ffmpeg` crashed.
             // It should already have reported that as an error - no need to repeat it here.
From edceed6af69d59e571ed739d667a097cef360fc2 Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Mon, 28 Oct 2024 15:02:25 +0100
Subject: [PATCH 14/33] crude reset implementation

---
 crates/store/re_video/src/decode/ffmpeg.rs | 107 +++++++++++----------
 1 file changed, 58 insertions(+), 49 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index d1445df324ea..edc7bfcffd41 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -59,6 +59,7 @@ pub struct FfmpegCliH264Decoder {
     /// For sending frame timestamps to the decoder thread
     frame_info_tx: Sender<FrameInfo>,
+    frame_info_rx: Receiver<FrameInfo>,

     avcc: re_mp4::Avc1Box,

     on_output: Arc<OutputCallback>,
@@ -74,66 +75,70 @@ impl FfmpegCliH264Decoder {
     ) -> Result<Self> {
         re_tracing::profile_function!();

-        let mut ffmpeg = {
-            re_tracing::profile_scope!("spawn-ffmpeg");
-
-            FfmpegCommand::new()
-                .hide_banner()
-                // "Reduce the latency introduced by buffering during initial input streams analysis."
-                //.arg("-fflags nobuffer")
-                //
-                // .. instead use these more aggressive options found here
-                // https://stackoverflow.com/a/49273163
-                .args([
-                    "-probesize",
-                    "32", // 32 bytes is the minimum probe size.
-                    "-analyzeduration",
-                    "0",
-                ])
-                // Keep in mind that all arguments that are about the input, need to go before!
-                .format("h264") // TODO(andreas): should we check ahead of time whether this is available?
-                //.fps_mode("0")
-                .input("-") // stdin is our input!
-                // h264 bitstreams don't have timestamp information. Whatever ffmpeg tries to make up about timing & framerates is wrong!
-                // If we don't tell it to just pass the frames through, variable framerate (VFR) video will just not play at all.
-                .fps_mode("passthrough")
-                // TODO(andreas): at least do `rgba`. But we could also do `yuv420p` for instance if that's what the video is specifying
-                // (should be faster overall at no quality loss if the video is in this format).
-                // Check `ffmpeg -pix_fmts` for full list.
-                .rawvideo() // Output rgb24 on stdout.
-                .spawn()
-                .map_err(Error::FailedToStartFfmpeg)?
-        };
-
-        let ffmpeg_stdin = ffmpeg.take_stdin().ok_or(Error::NoStdin)?;
-        let ffmpeg_iterator = ffmpeg
-            .iter()
-            .map_err(|err| Error::NoIterator(err.to_string()))?;
-
-        let (frame_info_tx, frame_info_rx) = crossbeam::channel::unbounded();
         let on_output = Arc::new(on_output);
+        let (frame_info_tx, frame_info_rx) = crossbeam::channel::unbounded();

-        std::thread::Builder::new()
-            .name("ffmpeg-reader".to_owned())
-            .spawn({
-                let on_output = on_output.clone();
-                move || {
-                    read_ffmpeg_output(ffmpeg_iterator, &frame_info_rx, on_output.as_ref());
-                    re_log::debug!("Shutting down ffmpeg");
-                }
-            })
-            .expect("Failed to spawn ffmpeg thread");
+        let ffmpeg_stdin = start_ffmpeg_process(on_output.clone(), frame_info_rx.clone())?;

         Ok(Self {
             ffmpeg_stdin,
             frame_info_tx,
             avcc,
             on_output,
+            frame_info_rx,
         })
     }
 }

+fn start_ffmpeg_process(
+    on_output: Arc<OutputCallback>,
+    frame_info_rx: Receiver<FrameInfo>,
+) -> Result<std::process::ChildStdin> {
+    let mut ffmpeg = {
+        re_tracing::profile_scope!("spawn-ffmpeg");
+
+        FfmpegCommand::new()
+            .hide_banner()
+            // "Reduce the latency introduced by buffering during initial input streams analysis."
+            //.arg("-fflags nobuffer")
+            //
+            // .. instead use these more aggressive options found here
+            // https://stackoverflow.com/a/49273163
+            .args([
+                "-probesize",
+                "32", // 32 bytes is the minimum probe size.
+                "-analyzeduration",
+                "0",
+            ])
+            // Keep in mind that all arguments that are about the input, need to go before!
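+            // For reference, the invocation built here corresponds roughly to this
+            // command line (assumed equivalent, modulo ffmpeg-sidecar defaults):
+            //   ffmpeg -hide_banner -probesize 32 -analyzeduration 0 \
+            //          -f h264 -i - -fps_mode passthrough -f rawvideo -pix_fmt rgb24 -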
+            .format("h264") // TODO(andreas): should we check ahead of time whether this is available?
+            //.fps_mode("0")
+            .input("-") // stdin is our input!
+            // h264 bitstreams don't have timestamp information. Whatever ffmpeg tries to make up about timing & framerates is wrong!
+            // If we don't tell it to just pass the frames through, variable framerate (VFR) video will just not play at all.
+            .fps_mode("passthrough")
+            // TODO(andreas): at least do `rgba`. But we could also do `yuv420p` for instance if that's what the video is specifying
+            // (should be faster overall at no quality loss if the video is in this format).
+            // Check `ffmpeg -pix_fmts` for full list.
+            .rawvideo() // Output rgb24 on stdout.
+            .spawn()
+            .map_err(Error::FailedToStartFfmpeg)?
+    };
+
+    let ffmpeg_stdin = ffmpeg.take_stdin().ok_or(Error::NoStdin)?;
+    let ffmpeg_iterator = ffmpeg
+        .iter()
+        .map_err(|err| Error::NoIterator(err.to_string()))?;
+
+    std::thread::Builder::new()
+        .name("ffmpeg-reader".to_owned())
+        .spawn(move || {
+            read_ffmpeg_output(ffmpeg_iterator, &frame_info_rx, on_output.as_ref());
+        })
+        .expect("Failed to spawn ffmpeg thread");
+
+    Ok(ffmpeg_stdin)
+}
+
 fn read_ffmpeg_output(
     ffmpeg_iterator: ffmpeg_sidecar::iter::FfmpegIterator,
     frame_info_rx: &Receiver<FrameInfo>,
@@ -347,13 +352,17 @@
     }

     fn reset(&mut self) -> super::Result<()> {
-        // TODO: restart ffmpeg process
+        re_log::debug!("Resetting ffmpeg decoder");
+        // TODO: ensure previous ffmpeg process is dead and thread has stopped.
+        self.ffmpeg_stdin =
+            start_ffmpeg_process(self.on_output.clone(), self.frame_info_rx.clone())?;
         Ok(())
     }
 }

 impl Drop for FfmpegCliH264Decoder {
     fn drop(&mut self) {
+        re_log::debug!("Dropping ffmpeg decoder");
         // TODO: stop ffmpeg thread
     }
 }

From 3f21b3dfecfce80fb48dd78c0c2e9d45898181cf Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Mon, 28 Oct 2024 17:30:32 +0100
Subject: [PATCH 15/33] fix frame reordering

---
 crates/store/re_video/src/decode/ffmpeg.rs | 69 +++++++++++---------
 1 file changed, 40 insertions(+), 29 deletions(-)

diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index edc7bfcffd41..0070472a81b8 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -163,7 +163,9 @@ fn read_ffmpeg_output(
         false
     }

-    let mut pending_frames = BTreeMap::new();
+    // Pending frames, sorted by their presentation timestamp.
+    let mut pending_frame_infos = BTreeMap::new();
+    let mut highest_dts = Time(i64::MIN); // Highest DTS encountered so far.

     for event in ffmpeg_iterator {
         #[allow(clippy::match_same_arms)]
         match event {
@@ -242,36 +244,43 @@
             FfmpegEvent::Progress(_) => {
                 // We can get our frame number etc. here to know how far behind we are.
-                // By default this triggers every 0.5s.
+                // By default this triggers every 5s.
             }

             FfmpegEvent::OutputFrame(frame) => {
-                let frame_info = match pending_frames.pop_first() {
-                    Some((_, frame_info)) => frame_info,
-                    None => {
-                        // Retrieve frame infos until the decode timestamp has caught up with the composition timestamp.
-                        // This is important because frame infos do not arrive in composition order,
-                        // but ffmpeg reports frames in composition order!
-                        loop {
-                            let Ok(frame_info) = frame_info_rx.try_recv() else {
-                                re_log::debug!("Receiver disconnected");
-                                return;
-                            };
-
-                            // Example of how presentation timestamps and decode timestamps can play out:
-                            //    PTS: 1 4 2 3
-                            //    DTS: 1 2 3 4
-                            // Stream: I P B B
-                            //
-                            // Essentially we need to wait until the DTS has "caught up" with the PTS!
-                            let highest_pts = pending_frames
-                                .last_key_value()
-                                .map_or(frame_info.presentation_timestamp, |(pts, _)| *pts);
-                            if frame_info.decode_timestamp <= highest_pts {
-                                break frame_info;
-                            }
-                            pending_frames.insert(frame_info.presentation_timestamp, frame_info);
-                        }
+                // DTS <= PTS, and chunks are submitted sorted by DTS.
+                //
+                // Frames arrive in PTS order, but "frame info" arrives in DTS order!
+                //
+                // Whenever the highest known DTS is behind the PTS, we need to wait until the DTS catches up.
+                // Otherwise, we'd assign the wrong PTS to the frame that just came in.
+                //
+                // Example of how presentation timestamps and decode timestamps
+                // can play out in the presence of B-frames to illustrate this:
+                //    PTS: 1 4 2 3
+                //    DTS: 1 2 3 4
+                // Stream: I P B B
+                let frame_info = loop {
+                    if pending_frame_infos
+                        .first_key_value()
+                        .map_or(true, |(pts, _)| *pts > highest_dts)
+                    {
+                        let Ok(frame_info) = frame_info_rx.try_recv() else {
+                            re_log::debug!("Receiver disconnected");
+                            return;
+                        };
+
+                        debug_assert!(
+                            frame_info.decode_timestamp > highest_dts,
+                            "Decode timestamps are expected to increase monotonically"
+                        );
+                        highest_dts = frame_info.decode_timestamp;
+                        pending_frame_infos.insert(frame_info.presentation_timestamp, frame_info);
+                    } else {
+                        // There must be an element here, otherwise we wouldn't be in this branch.
+                        #[allow(clippy::unwrap_used)]
+                        break pending_frame_infos.pop_first().unwrap().1;
+                    }
+                };

         };

-        // TODO: schedule this.
+        // TODO: schedule this in a thread.
         if self.frame_info_tx.send(frame_info).is_err() {

         buffer_offset = data_end;
     }

+    // TODO: Write an Access Unit Delimiter (AUD) NAL unit to the stream?
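+    // (An Access Unit Delimiter is a NAL unit of type 9 that marks the boundary
+    // between access units; emitting one after each sample might let the decoder
+    // flush a frame sooner. Left here as a possible follow-up, not implemented.)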
+
     Ok(())
 }

From 67843f706eff5d0e273b2d9e1be3c5280d4c930e Mon Sep 17 00:00:00 2001
From: Andreas Reich
Date: Wed, 30 Oct 2024 11:57:17 +0100
Subject: [PATCH 16/33] expose DTS through frame info

---
 crates/store/re_video/src/decode/av1.rs    |  1 +
 crates/store/re_video/src/decode/ffmpeg.rs |  1 +
 crates/store/re_video/src/decode/mod.rs    |  6 ++++++
 crates/viewer/re_data_ui/src/video.rs      | 10 +++++++++-
 4 files changed, 17 insertions(+), 1 deletion(-)

diff --git a/crates/store/re_video/src/decode/av1.rs b/crates/store/re_video/src/decode/av1.rs
index eae47c2a2a67..422aa9e55aec 100644
--- a/crates/store/re_video/src/decode/av1.rs
+++ b/crates/store/re_video/src/decode/av1.rs
@@ -237,6 +237,7 @@ fn output_picture(
         info: FrameInfo {
             presentation_timestamp: Time(picture.timestamp().unwrap_or(0)),
             duration: Time(picture.duration()),
+            ..Default::default()
         },
     };
     on_output(Ok(frame));
diff --git a/crates/store/re_video/src/decode/ffmpeg.rs b/crates/store/re_video/src/decode/ffmpeg.rs
index a07848c63e30..4aad8d17b4cb 100644
--- a/crates/store/re_video/src/decode/ffmpeg.rs
+++ b/crates/store/re_video/src/decode/ffmpeg.rs
@@ -313,6 +313,7 @@ fn read_ffmpeg_output(
                     info: super::FrameInfo {
                         presentation_timestamp: frame_info.presentation_timestamp,
                         duration: frame_info.duration,
+                        latest_decode_timestamp: Some(frame_info.decode_timestamp),
                     },
                 }));
             }
diff --git a/crates/store/re_video/src/decode/mod.rs b/crates/store/re_video/src/decode/mod.rs
index e46edee2f98d..dfc1dc262d48 100644
--- a/crates/store/re_video/src/decode/mod.rs
+++ b/crates/store/re_video/src/decode/mod.rs
@@ -249,6 +249,11 @@ pub struct FrameInfo {
     /// A duration of [`Time::MAX`] indicates that the frame is invalid or not yet available.
     // Implementation note: unlike with the presentation timestamp, we may be fine with making this optional.
     pub duration: Time,
+
+    /// The decode timestamp of the last chunk that was needed to decode this frame.
+    ///
+    /// None indicates that the information is not available.
+    pub latest_decode_timestamp: Option<Time>,