// Copyright (c) the JPEG XL Project Authors. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
use std::{
cmp::min,
collections::{BTreeMap, BTreeSet},
fmt::Debug,
ops::Range,
sync::atomic::{AtomicUsize, Ordering},
};
use crate::{
bit_reader::BitReader,
error::{Error, Result},
frame::{
ColorCorrelationParams, HfMetadata,
block_context_map::BlockContextMap,
quantizer::{self, LfQuantFactors, QuantizerParams},
},
headers::{
ImageMetadata, JxlHeader,
bit_depth::BitDepth,
frame_header::FrameHeader,
modular::{GroupHeader, TransformId},
},
image::{Image, Rect},
util::{AtomicRefCell, CeilLog2, SmallVec, tracing_wrappers::*},
};
use jxl_transforms::transform_map::*;
mod borrowed_buffers;
pub(crate) mod decode;
mod predict;
mod transforms;
mod tree;
use borrowed_buffers::with_buffers;
pub use decode::ModularStreamId;
use decode::decode_modular_subbitstream;
pub use predict::Predictor;
use transforms::{TransformStepChunk, make_grids};
pub use tree::Tree;
// Two rows on top, two pixels to the left, two pixels to the right.
const IMAGE_PADDING: (usize, usize) = (4, 2);
const IMAGE_OFFSET: (usize, usize) = (2, 2);
#[derive(Clone, PartialEq, Eq, Copy)]
struct ChannelInfo {
// The index of the output channel in the render pipeline.
output_channel_idx: Option<usize>,
// width, height
size: (usize, usize),
shift: Option<(usize, usize)>, // None for meta-channels
bit_depth: BitDepth,
}
impl Debug for ChannelInfo {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
write!(f, "{}x{}", self.size.0, self.size.1)?;
if let Some(shift) = self.shift {
write!(f, "(shift {},{})", shift.0, shift.1)?;
} else {
write!(f, "(meta)")?;
}
write!(f, "{:?}", self.bit_depth)?;
if let Some(oc) = self.output_channel_idx {
write!(f, "(output channel {})", oc)?;
}
Ok(())
}
}
impl ChannelInfo {
fn is_meta(&self) -> bool {
self.shift.is_none()
}
fn is_meta_or_small(&self, group_dim: usize) -> bool {
self.is_meta() || (self.size.0 <= group_dim && self.size.1 <= group_dim)
}
fn is_shift_in_range(&self, min: usize, max: usize) -> bool {
// This might be called with max < min, in which case we just return false.
// This matches libjxl behaviour.
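// Example (illustrative): a channel with shift (1, 2) has effective shift
// min(1, 2) == 1, so is_shift_in_range(0, 3) holds while
// is_shift_in_range(2, 3) does not.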
self.shift.is_some_and(|(a, b)| {
let shift = a.min(b);
min <= shift && shift <= max
})
}
fn is_equivalent(&self, other: &ChannelInfo) -> bool {
self.size == other.size && self.shift == other.shift && self.bit_depth == other.bit_depth
}
}
#[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Clone, Copy)]
enum ModularGridKind {
// Single big channel.
None,
// 2048x2048 image-pixels (if modular_group_shift == 1).
Lf,
// 256x256 image-pixels (if modular_group_shift == 1).
Hf,
}
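// For example (assuming the default modular_group_shift of 1): an Hf grid
// cell covers 256x256 image pixels, so per `grid_dim` below a channel with
// shift (1, 1) gets cells of 128x128 channel pixels.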
impl ModularGridKind {
fn grid_dim(&self, frame_header: &FrameHeader, shift: (usize, usize)) -> (usize, usize) {
let group_dim = match self {
ModularGridKind::None => 0,
ModularGridKind::Lf => frame_header.lf_group_dim(),
ModularGridKind::Hf => frame_header.group_dim(),
};
(group_dim >> shift.0, group_dim >> shift.1)
}
fn grid_shape(&self, frame_header: &FrameHeader) -> (usize, usize) {
match self {
ModularGridKind::None => (1, 1),
ModularGridKind::Lf => frame_header.size_lf_groups(),
ModularGridKind::Hf => frame_header.size_groups(),
}
}
}
// All the information on a specific buffer needed by Modular decoding.
#[derive(Debug)]
pub(crate) struct ModularChannel {
// Actual pixel buffer.
pub data: Image<i32>,
// Holds additional information, such as the last row of the weighted predictor's error channel,
// for the transform chunk that produced this buffer.
auxiliary_data: Option<Image<i32>>,
// Shift of the channel (None if this is a meta-channel).
shift: Option<(usize, usize)>,
bit_depth: BitDepth,
}
impl ModularChannel {
pub fn new(size: (usize, usize), bit_depth: BitDepth) -> Result<Self> {
Self::new_with_shift(size, Some((0, 0)), bit_depth)
}
fn new_with_shift(
size: (usize, usize),
shift: Option<(usize, usize)>,
bit_depth: BitDepth,
) -> Result<Self> {
Ok(ModularChannel {
data: Image::new_with_padding(size, IMAGE_OFFSET, IMAGE_PADDING)?,
auxiliary_data: None,
shift,
bit_depth,
})
}
fn try_clone(&self) -> Result<Self> {
Ok(ModularChannel {
data: self.data.try_clone()?,
auxiliary_data: self
.auxiliary_data
.as_ref()
.map(Image::try_clone)
.transpose()?,
shift: self.shift,
bit_depth: self.bit_depth,
})
}
fn channel_info(&self) -> ChannelInfo {
ChannelInfo {
output_channel_idx: None,
size: self.data.size(),
shift: self.shift,
bit_depth: self.bit_depth,
}
}
}
const BUFFER_STATUS_NOT_RENDERED: usize = 0;
const BUFFER_STATUS_PARTIAL_RENDER: usize = 1;
const BUFFER_STATUS_FINAL_RENDER: usize = 2;
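// Render status of a buffer: not rendered yet, rendered from data that may
// still change (partial or progressive decode), or rendered from final data.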
// Note: this type uses interior mutability to hand out mutable references to multiple buffers at
// once. In principle this could be done with `unsafe` instead, but the overhead of the checked
// approach should be minimal, so the `unsafe` is probably not worth it.
#[derive(Debug)]
struct ModularBuffer {
data: AtomicRefCell<Option<ModularChannel>>,
// Number of times this buffer will be used, *including* when it is used for output.
remaining_uses: AtomicUsize,
// Transform steps that "strongly" or "weakly" use the image data in this buffer.
// A "strong" usage always triggers a re-render if the image data changes.
// A "weak" usage only triggers a re-render if the buffer is final, or if the
// current re-render was not itself caused solely by weak usages.
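// (In `process_output` below, weak edges are only followed on a buffer's first
// render, on its final render, or when the change itself arrived over a strong
// edge.)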
used_by_transforms_strong: Vec<usize>,
used_by_transforms_weak: Vec<usize>,
size: (usize, usize),
status: AtomicUsize,
}
impl ModularBuffer {
fn get_status(&self) -> usize {
self.status.load(Ordering::Relaxed)
}
fn set_status(&self, val: usize) {
self.status.store(val, Ordering::Relaxed);
}
// Iterator over (transform_id, is_strong_use)
fn users(&self, include_weak: bool) -> impl Iterator<Item = (usize, bool)> {
let strong = self.used_by_transforms_strong.iter().map(|x| (*x, true));
let weak = if include_weak {
&self.used_by_transforms_weak[..]
} else {
&[]
}
.iter()
.map(|x| (*x, false));
strong.chain(weak)
}
// Gives out a copy of the buffer + auxiliary buffer, marking the buffer as used.
// If this is the last usage of the buffer, it is moved out instead of copied.
fn get_buffer(&self, can_consume: bool) -> Result<ModularChannel> {
if !can_consume {
return ModularChannel::try_clone(self.data.borrow().as_ref().unwrap());
}
let mut ret = None;
let _ = self.remaining_uses.fetch_update(
Ordering::Release,
Ordering::Acquire,
|remaining_pre| {
let remaining = remaining_pre.checked_sub(1).unwrap();
if ret.is_none() {
if remaining == 0 {
ret = Some(Ok(self.data.borrow_mut().take().unwrap()))
} else {
ret = self.data.borrow().as_ref().map(ModularChannel::try_clone);
}
} else if remaining == 0 {
*self.data.borrow_mut() = None;
}
Some(remaining)
},
);
Ok(ret.transpose()?.unwrap())
}
fn mark_used(&self, can_consume: bool) {
if !can_consume {
return;
}
let _ = self.remaining_uses.fetch_update(
Ordering::Release,
Ordering::Acquire,
|remaining_pre: usize| {
let remaining = remaining_pre.checked_sub(1).unwrap();
if remaining == 0 {
*self.data.borrow_mut() = None;
}
Some(remaining)
},
);
}
}
#[derive(Debug)]
struct ModularBufferInfo {
info: ChannelInfo,
// The index of the coded channel in the bitstream, or -1 for non-coded channels.
coded_channel_id: isize,
#[cfg_attr(not(feature = "tracing"), allow(dead_code))]
description: String,
grid_kind: ModularGridKind,
grid_shape: (usize, usize),
buffer_grid: Vec<ModularBuffer>,
}
impl ModularBufferInfo {
fn get_grid_idx(
&self,
output_grid_kind: ModularGridKind,
output_grid_pos: (usize, usize),
) -> usize {
let grid_pos = match (output_grid_kind, self.grid_kind) {
(_, ModularGridKind::None) => (0, 0),
(ModularGridKind::Lf, ModularGridKind::Lf)
| (ModularGridKind::Hf, ModularGridKind::Hf) => output_grid_pos,
(ModularGridKind::Hf, ModularGridKind::Lf) => {
(output_grid_pos.0 / 8, output_grid_pos.1 / 8)
}
_ => unreachable!("invalid combination of output grid kind and buffer grid kind"),
};
self.grid_shape.0 * grid_pos.1 + grid_pos.0
}
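// Example: an Hf-grid output at position (9, 4) reading from an Lf-gridded
// buffer maps to Lf cell (9 / 8, 4 / 8) == (1, 0), i.e. index
// grid_shape.0 * 0 + 1.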
fn get_grid_rect(
&self,
frame_header: &FrameHeader,
output_grid_kind: ModularGridKind,
output_grid_pos: (usize, usize),
) -> Rect {
let chan_size = self.info.size;
if output_grid_kind == ModularGridKind::None {
assert_eq!(self.grid_kind, output_grid_kind);
return Rect {
origin: (0, 0),
size: chan_size,
};
}
let shift = self.info.shift.unwrap();
let grid_dim = output_grid_kind.grid_dim(frame_header, shift);
let bx = output_grid_pos.0 * grid_dim.0;
let by = output_grid_pos.1 * grid_dim.1;
let size = (
(chan_size.0 - bx).min(grid_dim.0),
(chan_size.1 - by).min(grid_dim.1),
);
let origin = match (output_grid_kind, self.grid_kind) {
(ModularGridKind::Lf, ModularGridKind::Lf)
| (ModularGridKind::Hf, ModularGridKind::Hf) => (0, 0),
(_, ModularGridKind::None) => (bx, by),
(ModularGridKind::Hf, ModularGridKind::Lf) => {
let lf_grid_dim = self.grid_kind.grid_dim(frame_header, shift);
(bx % lf_grid_dim.0, by % lf_grid_dim.1)
}
_ => unreachable!("invalid combination of output grid kind and buffer grid kind"),
};
if size.0 == 0 || size.1 == 0 {
Rect {
origin: (0, 0),
size: (0, 0),
}
} else {
Rect { origin, size }
}
}
}
/// A modular image is a sequence of channels to which one or more transforms might have been
/// applied. We represent a modular image as a list of buffers, some of which are coded in the
/// bitstream; other buffers are obtained as the output of one of the transformation steps.
/// Some buffers are marked as `output`: those are the buffers corresponding to the pre-transform
/// image channels.
/// The buffers are internally divided into grids, matching the sizes of the groups they are coded
/// in (with appropriate shifts), or the size of the data produced by applying the appropriate
/// transforms to each of the groups in the transforms' input.
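///
/// A sketch of the decode flow (illustrative and simplified; `num_lf_groups`
/// and `pass_to_pipeline` are placeholders for caller-provided values):
/// ```ignore
/// let mut modular = FullModularImage::read(frame_header, image_metadata, 3, br)?;
/// modular.read_section0(frame_header, &global_tree, br, /*allow_partial=*/ false)?;
/// for group in 0..num_lf_groups {
///     modular.mark_group_to_be_read(/*section_id=*/ 1, group); // section 1 == ModularLF
///     modular.read_stream(ModularStreamId::ModularLF(group), frame_header, &global_tree, br)?;
/// }
/// // A dry run is required before each real run (see `process_output`).
/// modular.process_output(frame_header, /*dry_run=*/ true, &mut pass_to_pipeline)?;
/// modular.process_output(frame_header, /*dry_run=*/ false, &mut pass_to_pipeline)?;
/// ```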
#[derive(Debug)]
pub struct FullModularImage {
buffer_info: Vec<ModularBufferInfo>,
transform_steps: Vec<TransformStepChunk>,
// List of buffer indices of the channels of the modular image encoded in each kind of section.
// In order, LfGlobal, LfGroup, HfGroup(pass 0), ..., HfGroup(last pass).
section_buffer_indices: Vec<Vec<usize>>,
modular_color_channels: usize,
can_do_partial_render: bool,
can_do_early_partial_render: bool,
decoded_section0_channels: usize,
needed_section0_channels_for_early_render: usize,
global_header: Option<GroupHeader>,
buffers_for_channels: Vec<usize>,
// Buffers to _start rendering from_ on the next call to process_output.
// This is initially set to LF global and LF buffers, and populated with HF buffers
// just before we start decoding them.
ready_buffers_dry_run: BTreeSet<(usize, usize)>,
ready_buffers: BTreeSet<(usize, usize)>,
// Whether each channel is used or not by the render pipeline.
pipeline_used_channels: Vec<bool>,
}
impl FullModularImage {
pub fn can_do_partial_render(&self) -> bool {
self.can_do_partial_render
}
pub fn can_do_early_partial_render(&self) -> bool {
self.can_do_early_partial_render
// Avoid "green martians": don't render early before enough channels are decoded.
&& self.decoded_section0_channels >= self.needed_section0_channels_for_early_render
}
pub fn set_pipeline_used_channels(&mut self, used: &[bool]) {
self.pipeline_used_channels = used.to_vec();
}
#[instrument(level = "debug", skip_all)]
pub fn read(
frame_header: &FrameHeader,
image_metadata: &ImageMetadata,
modular_color_channels: usize,
br: &mut BitReader,
) -> Result<Self> {
let mut channels = vec![];
for c in 0..modular_color_channels {
let shift = (frame_header.hshift(c), frame_header.vshift(c));
let size = frame_header.size();
channels.push(ChannelInfo {
output_channel_idx: Some(c),
size: (size.0.div_ceil(1 << shift.0), size.1.div_ceil(1 << shift.1)),
shift: Some(shift),
bit_depth: image_metadata.bit_depth,
});
}
for (idx, ecups) in frame_header.ec_upsampling.iter().enumerate() {
let shift_ec = ecups.ceil_log2();
let shift_color = frame_header.upsampling.ceil_log2();
let shift = shift_ec
.checked_sub(shift_color)
.expect("ec_upsampling >= upsampling should be checked in frame header")
as usize;
let size = frame_header.size_upsampled();
let size = (
size.0.div_ceil(*ecups as usize),
size.1.div_ceil(*ecups as usize),
);
channels.push(ChannelInfo {
output_channel_idx: Some(3 + idx),
size,
shift: Some((shift, shift)),
bit_depth: image_metadata.bit_depth,
});
}
#[cfg(feature = "tracing")]
for (i, ch) in channels.iter().enumerate() {
trace!("Modular channel {i}: {ch:?}");
}
if channels.is_empty() {
return Ok(Self {
buffer_info: vec![],
transform_steps: vec![],
section_buffer_indices: vec![vec![]; 2 + frame_header.passes.num_passes as usize],
modular_color_channels,
can_do_partial_render: true,
can_do_early_partial_render: false,
decoded_section0_channels: 0,
needed_section0_channels_for_early_render: 0,
global_header: None,
buffers_for_channels: vec![],
ready_buffers_dry_run: BTreeSet::new(),
ready_buffers: BTreeSet::new(),
pipeline_used_channels: vec![],
});
}
trace!("reading modular header");
let header = GroupHeader::read(br)?;
// Disallow progressive rendering with multi-channel palette transforms
// or delta-palette.
let has_problematic_palette_transform = header.transforms.iter().any(|x| {
x.id == TransformId::Palette
&& (x.num_channels > 1 || x.predictor_id != Predictor::Zero as u32)
});
let has_squeeze_transform = header
.transforms
.iter()
.any(|x| x.id == TransformId::Squeeze);
let (mut buffer_info, transform_steps) =
transforms::apply::meta_apply_transforms(&channels, &header)?;
// Assign each (channel, group) pair present in the bitstream to the section in which it
// will be decoded.
let mut section_buffer_indices: Vec<Vec<usize>> = vec![];
let mut sorted_buffers: Vec<_> = buffer_info
.iter()
.enumerate()
.filter_map(|(i, b)| {
if b.coded_channel_id >= 0 {
Some((b.coded_channel_id, i))
} else {
None
}
})
.collect();
sorted_buffers.sort_by_key(|x| x.0);
section_buffer_indices.push(
sorted_buffers
.iter()
.take_while(|x| {
buffer_info[x.1]
.info
.is_meta_or_small(frame_header.group_dim())
})
.map(|x| x.1)
.collect(),
);
section_buffer_indices.push(
sorted_buffers
.iter()
.skip_while(|x| {
buffer_info[x.1]
.info
.is_meta_or_small(frame_header.group_dim())
})
.filter(|x| buffer_info[x.1].info.is_shift_in_range(3, usize::MAX))
.map(|x| x.1)
.collect(),
);
for pass in 0..frame_header.passes.num_passes as usize {
let (min_shift, max_shift) = frame_header.passes.downsampling_bracket(pass);
section_buffer_indices.push(
sorted_buffers
.iter()
.skip_while(|x| {
buffer_info[x.1]
.info
.is_meta_or_small(frame_header.group_dim())
})
.filter(|x| {
buffer_info[x.1]
.info
.is_shift_in_range(min_shift, max_shift)
})
.map(|x| x.1)
.collect(),
);
}
// Ensure that the channel list in each group is sorted by actual channel ID.
for list in section_buffer_indices.iter_mut() {
list.sort_by_key(|x| buffer_info[*x].coded_channel_id);
}
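// Resulting layout: section 0 (LfGlobal) holds the meta channels and channels
// no larger than one group; section 1 (LfGroup) holds the remaining channels
// with effective shift >= 3; sections 2.. hold, per pass, the channels whose
// shift falls in that pass's downsampling bracket.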
trace!(?section_buffer_indices);
#[cfg(feature = "tracing")]
for (section, indices) in section_buffer_indices.iter().enumerate() {
let section_name = match section {
0 => "LF global".to_string(),
1 => "LF groups".to_string(),
_ => format!("HF groups, pass {}", section - 2),
};
trace!("Coded modular channels in {section_name}");
for i in indices {
let bi = &buffer_info[*i];
trace!(
"Channel {i} {:?} coded id: {}",
bi.info, bi.coded_channel_id
);
}
}
let transform_steps = make_grids(
frame_header,
transform_steps,
§ion_buffer_indices,
&mut buffer_info,
);
#[cfg(feature = "tracing")]
for (i, bi) in buffer_info.iter().enumerate() {
trace!(
"Channel {i} {:?} coded_id: {} '{}' {:?} grid {:?}",
bi.info, bi.coded_channel_id, bi.description, bi.grid_kind, bi.grid_shape
);
for (pos, buf) in bi.buffer_grid.iter().enumerate() {
trace!(
"Channel {i} grid {pos} ({}, {}) size: {:?}, uses: {:?}, used_by: s {:?} w {:?}",
pos % bi.grid_shape.0,
pos / bi.grid_shape.0,
buf.size,
buf.remaining_uses,
buf.used_by_transforms_strong,
buf.used_by_transforms_weak,
);
}
}
#[cfg(feature = "tracing")]
for (i, ts) in transform_steps.iter().enumerate() {
trace!("Transform {i}: {ts:?}");
}
let mut buffers_for_channels = vec![];
for (i, c) in buffer_info.iter().enumerate() {
if let Some(c) = c.info.output_channel_idx {
if buffers_for_channels.len() <= c {
buffers_for_channels.resize(c + 1, 0);
}
buffers_for_channels[c] = i;
}
}
let num_meta_channels = buffer_info
.iter()
.filter(|b| b.coded_channel_id >= 0 && b.info.is_meta())
.count();
Ok(FullModularImage {
buffer_info,
transform_steps,
section_buffer_indices,
modular_color_channels,
can_do_partial_render: !has_problematic_palette_transform,
can_do_early_partial_render: !has_problematic_palette_transform
&& has_squeeze_transform,
decoded_section0_channels: 0,
needed_section0_channels_for_early_render: buffers_for_channels.len()
+ num_meta_channels,
global_header: Some(header),
buffers_for_channels,
ready_buffers_dry_run: BTreeSet::new(),
ready_buffers: BTreeSet::new(),
pipeline_used_channels: vec![],
})
}
pub fn read_section0(
&mut self,
frame_header: &FrameHeader,
global_tree: &Option<Tree>,
br: &mut BitReader,
allow_partial: bool,
) -> Result<()> {
let mut decoded_if_partial = 0;
let ret = with_buffers(
&self.buffer_info,
&self.section_buffer_indices[0],
0,
|bufs| {
decode_modular_subbitstream(
bufs,
ModularStreamId::GlobalData.get_id(frame_header),
self.global_header.clone(),
global_tree,
br,
Some(&mut decoded_if_partial),
)
},
);
match (ret, allow_partial) {
(Ok(_), _) => {
// Decoded section completely.
self.decoded_section0_channels = self.section_buffer_indices[0].len();
}
(Err(_), true) => {
self.decoded_section0_channels = decoded_if_partial;
}
(Err(e), false) => {
return Err(e);
}
}
for b in self.section_buffer_indices[0]
.iter()
.take(self.decoded_section0_channels)
{
if self.buffer_info[*b].buffer_grid[0].get_status() == BUFFER_STATUS_FINAL_RENDER {
continue;
}
// If we did a partial decode, we cannot be 100% sure that all the channels were
// correctly decoded. Thus, mark the buffers as only partially decoded.
self.buffer_info[*b].buffer_grid[0].set_status(if allow_partial {
BUFFER_STATUS_PARTIAL_RENDER
} else {
BUFFER_STATUS_FINAL_RENDER
});
self.ready_buffers_dry_run.insert((*b, 0));
}
Ok(())
}
pub fn mark_group_to_be_read(&mut self, section_id: usize, group: usize) {
for b in self.section_buffer_indices[section_id].iter() {
self.buffer_info[*b].buffer_grid[group].set_status(BUFFER_STATUS_FINAL_RENDER);
self.ready_buffers_dry_run.insert((*b, group));
}
}
#[allow(clippy::type_complexity)]
#[instrument(level = "debug", skip(self, frame_header, global_tree, br), ret)]
pub fn read_stream(
&mut self,
stream: ModularStreamId,
frame_header: &FrameHeader,
global_tree: &Option<Tree>,
br: &mut BitReader,
) -> Result<()> {
if self.buffer_info.is_empty() {
info!("No modular channels to decode");
return Ok(());
}
let (section_id, grid) = match stream {
ModularStreamId::ModularLF(group) => (1, group),
ModularStreamId::ModularHF { pass, group } => (2 + pass, group),
_ => {
unreachable!(
"read_stream should only be used for streams that are part of the main Modular image"
);
}
};
with_buffers(
&self.buffer_info,
&self.section_buffer_indices[section_id],
grid,
|bufs| {
decode_modular_subbitstream(
bufs,
stream.get_id(frame_header),
None,
global_tree,
br,
None,
)?;
Ok(())
},
)?;
Ok(())
}
fn maybe_output(
&self,
buf: usize,
grid: usize,
dry_run: bool,
pass_to_pipeline: &mut dyn FnMut(usize, usize, bool, Option<Image<i32>>) -> Result<()>,
) -> Result<()> {
if let Some(chan) = self.buffer_info[buf].info.output_channel_idx {
let is_final =
self.buffer_info[buf].buffer_grid[grid].get_status() == BUFFER_STATUS_FINAL_RENDER;
let all_final = self.buffers_for_channels.iter().all(|x| {
self.buffer_info[*x].buffer_grid[grid].get_status() == BUFFER_STATUS_FINAL_RENDER
});
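// With a single modular color channel (grayscale), channel 0 feeds all the
// color channels used by the pipeline; otherwise a buffer maps to exactly one
// output channel.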
let channels: SmallVec<usize, 3> = if chan == 0 && self.modular_color_channels == 1 {
(0..3).filter(|x| self.pipeline_used_channels[*x]).collect()
} else {
self.pipeline_used_channels[chan]
.then_some(chan)
.into_iter()
.collect()
};
if channels.is_empty() {
return Ok(());
}
if dry_run {
for c in channels.iter() {
pass_to_pipeline(*c, grid, is_final, None)?;
}
} else {
debug!("Rendering channel {chan:?}, grid position {grid}");
let buf = self.buffer_info[buf].buffer_grid[grid].get_buffer(all_final)?;
for c in channels[1..].iter() {
pass_to_pipeline(*c, grid, is_final, Some(buf.data.try_clone()?))?;
}
pass_to_pipeline(channels[0], grid, is_final, Some(buf.data))?;
}
}
Ok(())
}
// If `dry_run` is true, this call does not modify any buffer contents or statuses (only the
// internal ready-buffer bookkeeping), and the calls to `pass_to_pipeline` will have None as an
// image. Otherwise, the image will always be `Some(..)`.
// It is *required* to do a dry run before doing an actual run after any event that might have
// readied some buffers.
pub fn process_output(
&mut self,
frame_header: &FrameHeader,
dry_run: bool,
pass_to_pipeline: &mut dyn FnMut(usize, usize, bool, Option<Image<i32>>) -> Result<()>,
) -> Result<()> {
// TODO(veluca): consider using `used_channel_mask` to avoid running transforms that produce
// channels that are not used.
// layer -> (transform -> is_strong)
let mut to_process_by_layer = BTreeMap::<usize, BTreeMap<usize, bool>>::new();
let mut buffers_to_output = vec![];
let ready_buffers = if dry_run {
std::mem::take(&mut self.ready_buffers_dry_run)
} else {
assert!(self.ready_buffers_dry_run.is_empty());
std::mem::take(&mut self.ready_buffers)
};
for (buf, grid) in ready_buffers {
if self.buffer_info[buf].info.output_channel_idx.is_some() {
buffers_to_output.push((buf, grid));
}
for (t, is_strong_dep) in self.buffer_info[buf].buffer_grid[grid].users(true) {
let layer = self.transform_steps[t].layer;
let layer = to_process_by_layer.entry(layer).or_default();
let is_strong = layer.entry(t).or_default();
*is_strong |= is_strong_dep;
}
if dry_run {
self.ready_buffers.insert((buf, grid));
}
}
// When doing a dry run, run the same logic as the real execution, but
// without modifying the actual buffer status -- instead, we use local
// overrides.
// This allows us to know what buffers will be produced before producing any.
let mut status_overrides = BTreeMap::new();
let get_status =
|status_overrides: &mut BTreeMap<(usize, usize), usize>, b: usize, g: usize| {
if let Some(s) = status_overrides.get(&(b, g)) {
*s
} else {
self.buffer_info[b].buffer_grid[g].get_status()
}
};
let mut new_dirty_transforms = vec![];
while let Some((_, transforms)) = to_process_by_layer.pop_first() {
trace!("{transforms:?}");
for (t, is_strong) in transforms {
let tfm = &self.transform_steps[t];
trace!("{:?}", tfm);
let dependency_status = tfm
.deps
.iter()
.map(|(b, g)| get_status(&mut status_overrides, *b, *g))
.min()
.unwrap_or(BUFFER_STATUS_FINAL_RENDER);
if dependency_status == BUFFER_STATUS_NOT_RENDERED {
continue;
}
let is_final = dependency_status == BUFFER_STATUS_FINAL_RENDER;
let mut previous_output_status = None;
for (b, g) in tfm.outputs(&self.buffer_info) {
let status = get_status(&mut status_overrides, b, g);
if previous_output_status.is_none() {
previous_output_status = Some(status);
}
assert_eq!(Some(status), previous_output_status);
if dry_run {
status_overrides.insert((b, g), dependency_status);
} else {
self.buffer_info[b].buffer_grid[g].set_status(dependency_status);
}
}
let previous_output_status = previous_output_status.unwrap();
if !dry_run {
tfm.do_run(frame_header, &self.buffer_info, is_final)?;
}
// If this was the first _or_ the final render, trigger a re-render across weak edges
// even if the render was caused by a weak edge.
// This is necessary for those renders to complete correctly.
let is_strong = is_strong
|| (previous_output_status == BUFFER_STATUS_NOT_RENDERED
|| dependency_status == BUFFER_STATUS_FINAL_RENDER);
for (buf, grid) in self.transform_steps[t].outputs(&self.buffer_info) {
if self.buffer_info[buf].info.output_channel_idx.is_some() {
buffers_to_output.push((buf, grid));
}
for (t, is_strong_dep) in
self.buffer_info[buf].buffer_grid[grid].users(is_strong)
{
new_dirty_transforms.push((t, is_strong_dep));
}
}
}
for (t, is_strong_dep) in new_dirty_transforms.drain(..) {
let layer = self.transform_steps[t].layer;
let layer = to_process_by_layer.entry(layer).or_default();
let is_strong = layer.entry(t).or_default();
*is_strong |= is_strong_dep;
}
}
// Pass all the output buffers to the render pipeline.
for (buf, grid) in buffers_to_output {
self.maybe_output(buf, grid, dry_run, pass_to_pipeline)?;
}
Ok(())
}
pub fn channel_range(&self) -> Range<usize> {
if self.modular_color_channels != 0 {
0..self.buffers_for_channels.len()
} else {
// VarDCT image.
3..self.buffers_for_channels.len()
}
}
pub fn flush_output(
&mut self,
group: usize,
chan: usize,
pass_to_pipeline: &mut dyn FnMut(usize, usize, bool, Image<i32>) -> Result<()>,
) -> Result<()> {
if !self.can_do_partial_render() {
return Ok(());
}
let buf_idx = self.buffers_for_channels[chan];
// Skip channels that don't have a real buffer assignment.
// buffers_for_channels is zero-filled on resize, so intermediate channels
// (e.g. G/B when modular_color_channels==1) may alias buffer 0 incorrectly.
if self.buffer_info[buf_idx].info.output_channel_idx != Some(chan) {
return Ok(());
}
self.maybe_output(buf_idx, group, false, &mut |chan, grid, complete, img| {
pass_to_pipeline(chan, grid, complete, img.unwrap())
})
}
pub fn zero_fill_empty_channels(
&mut self,
num_passes: usize,
num_groups: usize,
num_lf_groups: usize,
) -> Result<()> {
if !self.can_do_partial_render() {
return Ok(());
}
if self.buffer_info.is_empty() {
return Ok(());
}
let mut fill_buffer = |section: usize, grid| -> Result<()> {
// TODO(veluca): consider filling these buffers with placeholders instead of real images.
with_buffers(
&self.buffer_info,
&self.section_buffer_indices[section],
grid,
|_| Ok(()),
)?;
for b in self.section_buffer_indices[section].iter() {
if self.buffer_info[*b].buffer_grid[grid].get_status() == BUFFER_STATUS_NOT_RENDERED
{
self.buffer_info[*b].buffer_grid[grid].set_status(BUFFER_STATUS_PARTIAL_RENDER);
self.ready_buffers.insert((*b, grid));
}
}
Ok(())
};
fill_buffer(0, 0)?;
for grid in 0..num_lf_groups {
fill_buffer(1, grid)?;
}
for pass in 0..num_passes {
for grid in 0..num_groups {
fill_buffer(2 + pass, grid)?;
}
}
Ok(())
}
}
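// Dequantizes the LF image. Each quantized LF coefficient is scaled by
// lf_quant.quant_factors[c] * GLOBAL_SCALE_DENOM / (global_scale * quant_lf),
// times `mul` (which undoes the extra-precision bits); in the 4:4:4 case,
// chroma-from-luma is then applied: X += Y * y_to_x_lf, B += Y * y_to_b_lf.
// Finally, `quant_lf` is filled with per-pixel LF block-context buckets.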
#[allow(clippy::too_many_arguments)]
fn dequant_lf(
r: Rect,
lf: &mut [Image<f32>; 3],
quant_lf: &mut Image<u8>,
input: [&Image<i32>; 3],
color_correlation_params: &ColorCorrelationParams,
quant_params: &QuantizerParams,
lf_quant: &LfQuantFactors,
mul: f32,
frame_header: &FrameHeader,
bctx: &BlockContextMap,
) -> Result<()> {
let inv_quant_lf = (quantizer::GLOBAL_SCALE_DENOM as f32)
/ (quant_params.global_scale as f32 * quant_params.quant_lf as f32);
let lf_factors = lf_quant.quant_factors.map(|factor| factor * inv_quant_lf);
if frame_header.is444() {
let [lf0, lf1, lf2] = lf;
let mut lf_rects = (
lf0.get_rect_mut(r),
lf1.get_rect_mut(r),
lf2.get_rect_mut(r),
);
let fac_x = lf_factors[0] * mul;
let fac_y = lf_factors[1] * mul;
let fac_b = lf_factors[2] * mul;
let cfl_fac_x = color_correlation_params.y_to_x_lf();
let cfl_fac_b = color_correlation_params.y_to_b_lf();
for y in 0..r.size.1 {
let quant_row_x = input[1].row(y);
let quant_row_y = input[0].row(y);
let quant_row_b = input[2].row(y);
let dec_row_x = lf_rects.0.row(y);
let dec_row_y = lf_rects.1.row(y);
let dec_row_b = lf_rects.2.row(y);
for x in 0..r.size.0 {
let in_x = quant_row_x[x] as f32 * fac_x;
let in_y = quant_row_y[x] as f32 * fac_y;
let in_b = quant_row_b[x] as f32 * fac_b;
dec_row_y[x] = in_y;
dec_row_x[x] = in_y * cfl_fac_x + in_x;
dec_row_b[x] = in_y * cfl_fac_b + in_b;
}
}
} else {
for (c, lf_rect) in lf.iter_mut().enumerate() {
let rect = Rect {
origin: (
r.origin.0 >> frame_header.hshift(c),
r.origin.1 >> frame_header.vshift(c),
),
size: (
r.size.0 >> frame_header.hshift(c),
r.size.1 >> frame_header.vshift(c),
),
};
let mut lf_rect = lf_rect.get_rect_mut(rect);
let fac = lf_factors[c] * mul;
let ch = input[if c < 2 { c ^ 1 } else { c }];
for y in 0..rect.size.1 {
let quant_row = ch.row(y);
let row = lf_rect.row(y);
for x in 0..rect.size.0 {
row[x] = quant_row[x] as f32 * fac;
}
}
}
}
let mut quant_lf_rect = quant_lf.get_rect_mut(r);
if bctx.num_lf_contexts <= 1 {
for y in 0..r.size.1 {
quant_lf_rect.row(y).fill(0);
}
} else {
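// The bucket index is mixed-radix:
// bucket = (bucket_x * (|thr_b| + 1) + bucket_b) * (|thr_y| + 1) + bucket_y,
// where bucket_c counts how many of channel c's thresholds are exceeded.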
for y in 0..r.size.1 {
let qlf_row_val = quant_lf_rect.row(y);
let quant_row_x = input[1].row(y >> frame_header.vshift(0));
let quant_row_y = input[0].row(y >> frame_header.vshift(1));
let quant_row_b = input[2].row(y >> frame_header.vshift(2));
for x in 0..r.size.0 {
let bucket_x = bctx.lf_thresholds[0]
.iter()
.filter(|&t| quant_row_x[x >> frame_header.hshift(0)] > *t)
.count();
let bucket_y = bctx.lf_thresholds[1]
.iter()
.filter(|&t| quant_row_y[x >> frame_header.hshift(1)] > *t)
.count();
let bucket_b = bctx.lf_thresholds[2]
.iter()
.filter(|&t| quant_row_b[x >> frame_header.hshift(2)] > *t)
.count();
let mut bucket = bucket_x;
bucket *= bctx.lf_thresholds[2].len() + 1;
bucket += bucket_b;
bucket *= bctx.lf_thresholds[1].len() + 1;
bucket += bucket_y;
qlf_row_val[x] = bucket as u8;
}
}
}
Ok(())
}
#[allow(clippy::too_many_arguments)]
pub fn decode_vardct_lf(
group: usize,
frame_header: &FrameHeader,
image_metadata: &ImageMetadata,
global_tree: &Option<Tree>,
color_correlation_params: &ColorCorrelationParams,
quant_params: &QuantizerParams,
lf_quant: &LfQuantFactors,
bctx: &BlockContextMap,
lf_image: &mut [Image<f32>; 3],
quant_lf: &mut Image<u8>,
br: &mut BitReader,
) -> Result<()> {
let extra_precision = br.read(2)?;
debug!(?extra_precision);
let mul = 1.0 / (1 << extra_precision) as f32;
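// `extra_precision` (0..=3) gives the number of extra fractional bits in the
// coded LF values; `mul` rescales them back.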
let stream_id = ModularStreamId::VarDCTLF(group).get_id(frame_header);
debug!(?stream_id);
let r = frame_header.lf_group_rect(group);
debug!(?r);
let shrink_rect = |size: (usize, usize), c| {
(
size.0 >> frame_header.hshift(c),
size.1 >> frame_header.vshift(c),
)
};
let mut buffers = [
ModularChannel::new(shrink_rect(r.size, 1), image_metadata.bit_depth)?,
ModularChannel::new(shrink_rect(r.size, 0), image_metadata.bit_depth)?,
ModularChannel::new(shrink_rect(r.size, 2), image_metadata.bit_depth)?,
];
decode_modular_subbitstream(
buffers.iter_mut().collect(),
stream_id,
None,
global_tree,
br,
None,
)?;
dequant_lf(
r,
lf_image,
quant_lf,
[&buffers[0].data, &buffers[1].data, &buffers[2].data],
color_correlation_params,
quant_params,
lf_quant,
mul,
frame_header,
bctx,
)
}
pub fn decode_hf_metadata(
group: usize,
frame_header: &FrameHeader,
image_metadata: &ImageMetadata,
global_tree: &Option<Tree>,
hf_meta: &mut HfMetadata,
br: &mut BitReader,
) -> Result<()> {
let stream_id = ModularStreamId::LFMeta(group).get_id(frame_header);
debug!(?stream_id);
let r = frame_header.lf_group_rect(group);
debug!(?r);
let upper_bound = r.size.0 * r.size.1;
let count_num_bits = upper_bound.ceil_log2();
let count: usize = br.read(count_num_bits)? as usize + 1;
debug!(?count);
let cr = Rect {
origin: (r.origin.0 >> 3, r.origin.1 >> 3),
size: (r.size.0.div_ceil(8), r.size.1.div_ceil(8)),
};
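// The HF metadata stream codes four channels (summarizing their use below):
// the X and B chroma-from-luma maps at 1/8 resolution, a (count x 2) channel
// of (transform type, raw quant) values, and the per-block EPF sharpness map.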
let mut buffers = [
ModularChannel::new_with_shift(cr.size, Some((3, 3)), image_metadata.bit_depth)?,
ModularChannel::new_with_shift(cr.size, Some((3, 3)), image_metadata.bit_depth)?,
ModularChannel::new((count, 2), image_metadata.bit_depth)?,
ModularChannel::new(r.size, image_metadata.bit_depth)?,
];
decode_modular_subbitstream(
buffers.iter_mut().collect(),
stream_id,
None,
global_tree,
br,
None,
)?;
let ytox_image = &buffers[0].data;
let ytob_image = &buffers[1].data;
let mut ytox_map_rect = hf_meta.ytox_map.get_rect_mut(cr);
let mut ytob_map_rect = hf_meta.ytob_map.get_rect_mut(cr);
let i8min: i32 = i8::MIN.into();
let i8max: i32 = i8::MAX.into();
for y in 0..cr.size.1 {
let row_in_x = ytox_image.row(y);
let row_in_b = ytob_image.row(y);
let row_out_x = ytox_map_rect.row(y);
let row_out_b = ytob_map_rect.row(y);
for x in 0..cr.size.0 {
row_out_x[x] = row_in_x[x].clamp(i8min, i8max) as i8;
row_out_b[x] = row_in_b[x].clamp(i8min, i8max) as i8;
}
}
let transform_image = &buffers[2].data;
let epf_image = &buffers[3].data;
let mut transform_map_rect = hf_meta.transform_map.get_rect_mut(r);
let mut raw_quant_map_rect = hf_meta.raw_quant_map.get_rect_mut(r);
let mut epf_map_rect = hf_meta.epf_map.get_rect_mut(r);
let mut num: usize = 0;
let mut used_hf_types: u32 = 0;
for y in 0..r.size.1 {
let epf_row_in = epf_image.row(y);
let epf_row_out = epf_map_rect.row(y);
for x in 0..r.size.0 {
let epf_val = epf_row_in[x];
if !(0..8).contains(&epf_val) {
return Err(Error::InvalidEpfValue(epf_val));
}
epf_row_out[x] = epf_val as u8;
if transform_map_rect.row(y)[x] != HfTransformType::INVALID_TRANSFORM {
continue;
}
if num >= count {
return Err(Error::InvalidVarDCTTransformMap);
}
let raw_transform = transform_image.row(0)[num];
let raw_quant = 1 + transform_image.row(1)[num].clamp(0, 255);
let transform_type = HfTransformType::from_usize(raw_transform as usize)
.ok_or(Error::InvalidVarDCTTransform(raw_transform as usize))?;
used_hf_types |= 1 << raw_transform;
let cx = covered_blocks_x(transform_type) as usize;
let cy = covered_blocks_y(transform_type) as usize;
if (cx > 1 || cy > 1) && !frame_header.is444() {
return Err(Error::InvalidBlockSizeForChromaSubsampling);
}
let next_group = ((x / 32 + 1) * 32, (y / 32 + 1) * 32);
if x + cx > min(r.size.0, next_group.0) || y + cy > min(r.size.1, next_group.1) {
return Err(Error::HFBlockOutOfBounds);
}
let transform_id = raw_transform as u8;
for iy in 0..cy {
for ix in 0..cx {
transform_map_rect.row(y + iy)[x + ix] = if iy == 0 && ix == 0 {
transform_id + 128 // Set highest bit to signal first block.
} else {
transform_id
};
raw_quant_map_rect.row(y + iy)[x + ix] = raw_quant;
}
}
num += 1;
}
}
hf_meta.used_hf_types |= used_hf_types;
Ok(())
}