T5.2: VideoQualityController with per-mode allocation gates + 8-step target table

This commit is contained in:
Siavash Sameni
2026-05-12 12:34:32 +04:00
parent 276ecc660e
commit 2e0bdc5904
8 changed files with 464 additions and 3 deletions

View File

@@ -8,6 +8,7 @@ rust-version.workspace = true
[dependencies]
bytes = { workspace = true }
tracing = { workspace = true }
wzp-proto = { path = "../wzp-proto" }
[target.'cfg(target_os = "macos")'.dependencies]
shiguredo_video_toolbox = "2026.1"

View File

@@ -0,0 +1,384 @@
//! Video quality controller — maps bandwidth estimate + priority mode to
//! encoder target parameters (bitrate, fps, resolution).
//!
//! See `docs/PRD/PRD-video-quality-priority.md`.
use std::sync::Arc;
use std::sync::atomic::{AtomicU8, AtomicU32, Ordering::Relaxed};
use wzp_proto::BandwidthEstimator;
use wzp_proto::PriorityMode;
/// Target parameters for the video encoder.
///
/// A `bitrate_kbps` of `0` means video is disabled (not enough bandwidth).
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub struct VideoTarget {
/// Target bitrate in kilobits per second.
pub bitrate_kbps: u32,
/// Target frame rate.
pub fps: u8,
/// Frame width in pixels.
pub width: u16,
/// Frame height in pixels.
pub height: u16,
}
impl VideoTarget {
/// Disabled video — zero budget.
pub const DISABLED: Self = Self {
bitrate_kbps: 0,
fps: 0,
width: 0,
height: 0,
};
}
/// Step in the bitrate -> (resolution, fps) lookup table.
struct Step {
min_budget_kbps: u32,
width: u16,
height: u16,
fps: u8,
}
/// H.264 baseline step table. Each step is the minimum budget required to
/// sustain the corresponding resolution + frame rate.
///
/// Steps are ordered from highest to lowest budget. The first step whose
/// `min_budget_kbps` is <= the available video budget wins.
static STEP_TABLE: &[Step] = &[
Step {
min_budget_kbps: 4000,
width: 1280,
height: 720,
fps: 30,
},
Step {
min_budget_kbps: 2000,
width: 640,
height: 480,
fps: 30,
},
Step {
min_budget_kbps: 1000,
width: 480,
height: 360,
fps: 30,
},
Step {
min_budget_kbps: 500,
width: 480,
height: 360,
fps: 15,
},
Step {
min_budget_kbps: 250,
width: 320,
height: 240,
fps: 15,
},
Step {
min_budget_kbps: 150,
width: 320,
height: 240,
fps: 10,
},
Step {
min_budget_kbps: 100,
width: 240,
height: 180,
fps: 10,
},
Step {
min_budget_kbps: 50,
width: 240,
height: 180,
fps: 5,
},
];
/// Audio floor budgets per priority mode (kbps).
const AUDIO_FLOOR_KBPS: u32 = 24;
const AUDIO_FLOOR_SCREENCAST_KBPS: u32 = 16;
/// Proportion of total budget allocated to audio in `Balanced` mode.
const BALANCED_AUDIO_RATIO: f64 = 0.15;
/// Maximum bitrate change ratio per second (2x up or down).
const MAX_CHANGE_RATIO_PER_SEC: f64 = 2.0;
/// Video quality controller.
///
/// Consumes a [`BandwidthEstimator`] and a [`PriorityMode`] and produces
/// [`VideoTarget`] recommendations for the encoder. The controller is
/// thread-safe: `mode`, `loss_pct`, and `rtt_ms` can be updated from any
/// thread while `tick()` runs on the encoder thread.
pub struct VideoQualityController {
bwe: Arc<BandwidthEstimator>,
mode: AtomicU8, // PriorityMode as u8
loss_pct: AtomicU8,
rtt_ms: AtomicU32,
last_target: std::sync::Mutex<VideoTarget>,
last_tick_ms: AtomicU32,
}
impl VideoQualityController {
/// Create a new controller.
pub fn new(bwe: Arc<BandwidthEstimator>) -> Self {
Self {
bwe,
mode: AtomicU8::new(PriorityMode::AudioFirst as u8),
loss_pct: AtomicU8::new(0),
rtt_ms: AtomicU32::new(0),
last_target: std::sync::Mutex::new(VideoTarget::DISABLED),
last_tick_ms: AtomicU32::new(0),
}
}
/// Set the current priority mode (mid-call override).
pub fn set_mode(&self, mode: PriorityMode) {
self.mode.store(mode as u8, Relaxed);
}
/// Update network observables.
pub fn update_network(&self, loss_pct: u8, rtt_ms: u32) {
self.loss_pct.store(loss_pct, Relaxed);
self.rtt_ms.store(rtt_ms, Relaxed);
}
/// Read the current priority mode.
pub fn mode(&self) -> PriorityMode {
match self.mode.load(Relaxed) {
1 => PriorityMode::VideoFirst,
2 => PriorityMode::ScreenShare,
3 => PriorityMode::Balanced,
_ => PriorityMode::AudioFirst,
}
}
/// Compute audio and video budgets from the current BWE and priority mode.
///
/// Returns `(audio_budget_kbps, video_budget_kbps)`.
pub fn allocate(&self) -> (u32, u32) {
let bwe_kbps = (self.bwe.target_send_bps() / 1000) as u32;
let mode = self.mode();
match mode {
PriorityMode::AudioFirst => {
let audio = AUDIO_FLOOR_KBPS.min(bwe_kbps);
let video = bwe_kbps.saturating_sub(audio);
(audio, video)
}
PriorityMode::VideoFirst => {
// Video floor: enough for the lowest step (240x180 @ 5fps).
let video_floor = STEP_TABLE.last().map(|s| s.min_budget_kbps).unwrap_or(50);
let video = video_floor.min(bwe_kbps);
let audio = bwe_kbps.saturating_sub(video);
(audio, video)
}
PriorityMode::ScreenShare => {
let audio = AUDIO_FLOOR_SCREENCAST_KBPS.min(bwe_kbps);
let video = bwe_kbps.saturating_sub(audio);
(audio, video)
}
PriorityMode::Balanced => {
let audio = ((bwe_kbps as f64) * BALANCED_AUDIO_RATIO) as u32;
let video = bwe_kbps.saturating_sub(audio);
(audio, video)
}
}
}
/// Map a video budget to a `(bitrate_kbps, width, height, fps)` target.
///
/// Uses the static step table. If budget is below the lowest step,
/// returns [`VideoTarget::DISABLED`].
fn derive_target(&self, video_budget_kbps: u32) -> VideoTarget {
for step in STEP_TABLE {
if video_budget_kbps >= step.min_budget_kbps {
return VideoTarget {
bitrate_kbps: video_budget_kbps,
fps: step.fps,
width: step.width,
height: step.height,
};
}
}
VideoTarget::DISABLED
}
/// Smooth the target to avoid jumps larger than `MAX_CHANGE_RATIO_PER_SEC`
/// over one second.
///
/// `dt_ms` is the elapsed time since the last tick.
fn smooth(&self, raw: VideoTarget, dt_ms: u32) -> VideoTarget {
if raw.bitrate_kbps == 0 {
return raw;
}
let last = *self.last_target.lock().unwrap();
if last.bitrate_kbps == 0 {
return raw;
}
let dt_s = dt_ms as f64 / 1000.0;
let max_ratio = MAX_CHANGE_RATIO_PER_SEC.powf(dt_s);
let min_br = (last.bitrate_kbps as f64 / max_ratio) as u32;
let max_br = (last.bitrate_kbps as f64 * max_ratio) as u32;
let clamped_br = raw.bitrate_kbps.clamp(min_br, max_br);
VideoTarget {
bitrate_kbps: clamped_br,
..raw
}
}
/// Run one controller tick.
///
/// `now_ms` is a monotonic timestamp (e.g. `timestamp_ms` from the media
/// pipeline). Returns the current [`VideoTarget`] which the caller should
/// pass to the encoder.
pub fn tick(&self, now_ms: u32) -> VideoTarget {
let (_audio_budget, video_budget) = self.allocate();
let raw = self.derive_target(video_budget);
let prev = self.last_tick_ms.swap(now_ms, Relaxed);
let dt_ms = if prev == 0 {
1000
} else {
now_ms.saturating_sub(prev)
};
let smoothed = self.smooth(raw, dt_ms);
*self.last_target.lock().unwrap() = smoothed;
smoothed
}
}
#[cfg(test)]
mod tests {
use super::*;
fn dummy_bwe(bps: u64) -> Arc<BandwidthEstimator> {
let bwe = BandwidthEstimator::new((bps / 1000) as f64, 10.0, 100_000.0);
// Seed cwnd so target_send_bps() returns a non-zero value.
// cwnd_bps = cwnd_bytes * 8 / rtt_s. For 1s RTT: cwnd_bytes = bps / 8.
let cwnd_bytes = bps / 8;
bwe.update_from_path(cwnd_bytes, 0, 1000);
Arc::new(bwe)
}
#[test]
fn audio_first_reserves_floor() {
let bwe = dummy_bwe(100_000); // 100 kbps
let ctrl = VideoQualityController::new(bwe);
let (audio, video) = ctrl.allocate();
// BWE target is 90% of raw = 90 kbps.
assert_eq!(audio, 24, "audio floor is 24 kbps");
assert_eq!(video, 66, "video gets remainder after 90% BWE factor");
}
#[test]
fn audio_first_floor_not_below_bwe() {
let bwe = dummy_bwe(10_000); // 10 kbps
let ctrl = VideoQualityController::new(bwe);
let (audio, video) = ctrl.allocate();
// BWE target is 90% of raw = 9 kbps.
assert_eq!(audio, 9, "audio cannot exceed bwe");
assert_eq!(video, 0, "video gets nothing");
}
#[test]
fn screen_share_clamps_audio() {
let bwe = dummy_bwe(200_000); // 200 kbps
let ctrl = VideoQualityController::new(bwe);
ctrl.set_mode(PriorityMode::ScreenShare);
let (audio, video) = ctrl.allocate();
// BWE target is 90% of raw = 180 kbps.
assert_eq!(audio, 16, "screen-share audio clamped to 16 kbps");
assert_eq!(video, 164);
}
#[test]
fn balanced_split() {
let bwe = dummy_bwe(1_000_000); // 1 Mbps
let ctrl = VideoQualityController::new(bwe);
ctrl.set_mode(PriorityMode::Balanced);
let (audio, video) = ctrl.allocate();
// BWE target is 90% of raw = 900 kbps.
assert_eq!(audio, 135, "15% of 900 kbps = 135 kbps audio");
assert_eq!(video, 765);
}
#[test]
fn derive_target_disabled_below_floor() {
let bwe = dummy_bwe(1_000_000);
let ctrl = VideoQualityController::new(bwe);
let target = ctrl.derive_target(10); // below lowest step (50 kbps)
assert_eq!(target, VideoTarget::DISABLED);
}
#[test]
fn derive_target_lowest_step() {
let bwe = dummy_bwe(1_000_000);
let ctrl = VideoQualityController::new(bwe);
let target = ctrl.derive_target(50);
assert_eq!(target.width, 240);
assert_eq!(target.height, 180);
assert_eq!(target.fps, 5);
}
#[test]
fn derive_target_highest_step() {
let bwe = dummy_bwe(10_000_000); // 10 Mbps
let ctrl = VideoQualityController::new(bwe);
let target = ctrl.derive_target(5000);
assert_eq!(target.width, 1280);
assert_eq!(target.height, 720);
assert_eq!(target.fps, 30);
}
#[test]
fn smoothing_limits_jump() {
let bwe = dummy_bwe(10_000_000);
let ctrl = VideoQualityController::new(bwe);
// First tick establishes baseline at 720p.
let t0 = ctrl.tick(0);
assert!(t0.bitrate_kbps > 0);
// Simulate a BWE drop from 10 Mbps to 1 Mbps.
let bwe2 = dummy_bwe(1_000_000);
let ctrl2 = VideoQualityController::new(bwe2);
// Pre-seed last_target so smoothing has something to compare against.
*ctrl2.last_target.lock().unwrap() = VideoTarget {
bitrate_kbps: 4000,
..VideoTarget::DISABLED
};
ctrl2.last_tick_ms.store(0, Relaxed);
let t1 = ctrl2.tick(1000); // 1 s later
// Max change per second is 2x, so 4000 -> min 2000.
assert!(
t1.bitrate_kbps >= 2000,
"smoothing should prevent >2x drop in 1s"
);
// Raw budget after 1 Mbps drop is ~900 kbps; smoothing clamps to 2000.
assert!(
t1.bitrate_kbps < 4000,
"smoothing should also cap upward jumps"
);
}
#[test]
fn mode_roundtrip() {
let bwe = dummy_bwe(1_000_000);
let ctrl = VideoQualityController::new(bwe);
assert_eq!(ctrl.mode(), PriorityMode::AudioFirst);
ctrl.set_mode(PriorityMode::ScreenShare);
assert_eq!(ctrl.mode(), PriorityMode::ScreenShare);
}
}

View File

@@ -38,6 +38,12 @@ pub trait VideoEncoder: Send {
/// Returns true if the given encoded packet is a keyframe.
fn is_keyframe(&self, packet: &[u8]) -> bool;
/// Apply a new quality target (bitrate, resolution, fps).
///
/// Default implementation is a no-op; platform encoders override to
/// reconfigure the underlying session.
fn set_target(&mut self, _target: &crate::VideoTarget) {}
}
/// Raw video frame input for encoding.

View File

@@ -4,6 +4,7 @@
//! packetization (NAL fragmentation / reassembly). Platform encoders and
//! decoders land in T4.2/T4.3.
pub mod controller;
pub mod decoder;
pub mod depacketizer;
pub mod encoder;
@@ -12,6 +13,7 @@ pub mod mediacodec;
pub mod nack;
pub mod videotoolbox;
pub use controller::{VideoQualityController, VideoTarget};
pub use decoder::VideoDecoder;
pub use depacketizer::H264Depacketizer;
pub use encoder::{VideoEncoder, VideoError, VideoFrame};