From 77108936901a11cd8275a818bd98453f2d9e31e7 Mon Sep 17 00:00:00 2001 From: Martin Bruse Date: Wed, 27 Nov 2024 14:14:20 +0100 Subject: [PATCH] Added noise stage. --- jxl/resources/test/8x8_noise.jxl | Bin 0 -> 69 bytes jxl/src/features/mod.rs | 1 + jxl/src/features/noise.rs | 20 ++ jxl/src/frame.rs | 50 ++++- jxl/src/image.rs | 10 + jxl/src/render/stages/mod.rs | 1 + jxl/src/render/stages/noise.rs | 357 +++++++++++++++++++++++++++++++ 7 files changed, 433 insertions(+), 6 deletions(-) create mode 100644 jxl/resources/test/8x8_noise.jxl create mode 100644 jxl/src/features/noise.rs create mode 100644 jxl/src/render/stages/noise.rs diff --git a/jxl/resources/test/8x8_noise.jxl b/jxl/resources/test/8x8_noise.jxl new file mode 100644 index 0000000000000000000000000000000000000000..78462eab3490adde1f8bf21cdfaf1d6efcabb31f GIT binary patch literal 69 zcmey*<>=s4s3@Vp!SH~AfyID Result { + let mut noise = Noise::default(); + for l in &mut noise.lut { + *l = (br.read(10)? as f32) / ((1 << 10) as f32); + } + Ok(noise) + } +} diff --git a/jxl/src/frame.rs b/jxl/src/frame.rs index 6f4a5c8..c2f7c5b 100644 --- a/jxl/src/frame.rs +++ b/jxl/src/frame.rs @@ -6,7 +6,7 @@ use crate::{ bit_reader::BitReader, error::Result, - features::spline::Splines, + features::{noise::Noise, spline::Splines}, headers::{ color_encoding::ColorSpace, encodings::UnconditionalCoder, @@ -35,7 +35,7 @@ pub struct LfGlobalState { // TODO(veluca93): patches // TODO(veluca93): splines splines: Option, - // TODO(veluca93): noise + noise: Option, lf_quant: LfQuantFactors, // TODO(veluca93), VarDCT: HF quant matrices // TODO(veluca93), VarDCT: block context map @@ -145,10 +145,11 @@ impl Frame { None }; - if self.header.has_noise() { - info!("decoding noise"); - todo!("noise not implemented"); - } + let noise = if self.header.has_noise() { + Some(Noise::read(br)?) + } else { + None + }; let lf_quant = LfQuantFactors::new(br)?; debug!(?lf_quant); @@ -180,6 +181,7 @@ impl Frame { self.lf_global = Some(LfGlobalState { splines, + noise, lf_quant, tree, modular_global, @@ -188,3 +190,39 @@ impl Frame { Ok(()) } } + +#[cfg(test)] +mod test_frame { + use crate::{ + bit_reader::BitReader, + container::ContainerParser, + error::Error, + headers::{FileHeader, JxlHeader}, + util::test::assert_almost_eq, + }; + + use super::Frame; + + fn read_frame(image: &[u8]) -> Result { + let codestream = ContainerParser::collect_codestream(image).unwrap(); + let mut br = BitReader::new(&codestream); + let file_header = FileHeader::read(&mut br).unwrap(); + let mut result = Frame::new(&mut br, &file_header)?; + result.decode_lf_global(&mut br)?; + return Ok(result); + } + + #[test] + fn noise() -> Result<(), Error> { + let frame = read_frame(include_bytes!("../resources/test/8x8_noise.jxl"))?; + let lf_global = frame.lf_global.unwrap(); + let noise = lf_global.noise.unwrap(); + let want_noise = [ + 0.000000, 0.000977, 0.002930, 0.003906, 0.005859, 0.006836, 0.008789, 0.010742, + ]; + for (index, noise_param) in want_noise.iter().enumerate() { + assert_almost_eq!(noise.lut[index], *noise_param, 1e-6f32); + } + Ok(()) + } +} diff --git a/jxl/src/image.rs b/jxl/src/image.rs index 7e2c93d..417f8ce 100644 --- a/jxl/src/image.rs +++ b/jxl/src/image.rs @@ -184,6 +184,16 @@ impl Image { Ok(img) } + #[cfg(test)] + pub fn new_range(size: (usize, usize), start: f32, step: f32) -> Result> { + let mut img = Self::new(size)?; + img.data + .iter_mut() + .enumerate() + .for_each(|(index, x)| *x = T::from_f64((start + step * index as f32) as f64)); + Ok(img) + } + #[cfg(test)] pub fn new_constant(size: (usize, usize), val: T) -> Result> { let mut img = Self::new(size)?; diff --git a/jxl/src/render/stages/mod.rs b/jxl/src/render/stages/mod.rs index bf8c96d..dc89a11 100644 --- a/jxl/src/render/stages/mod.rs +++ b/jxl/src/render/stages/mod.rs @@ -6,6 +6,7 @@ mod chroma_upsample; mod convert; mod nearest_neighbor; +mod noise; mod save; mod upsample; diff --git a/jxl/src/render/stages/noise.rs b/jxl/src/render/stages/noise.rs new file mode 100644 index 0000000..1732572 --- /dev/null +++ b/jxl/src/render/stages/noise.rs @@ -0,0 +1,357 @@ +// Copyright (c) the JPEG XL Project Authors. All rights reserved. +// +// Use of this source code is governed by a BSD-style +// license that can be found in the LICENSE file. + +// TODO(zond): remove once we use this! +#![allow(dead_code, unused_variables)] + +use crate::{ + features::noise::Noise, + render::{RenderPipelineInOutStage, RenderPipelineInPlaceStage, RenderPipelineStage}, +}; + +pub struct ConvolveNoiseStage { + first_channel: usize, +} + +impl ConvolveNoiseStage { + pub fn new(first_channel: usize) -> ConvolveNoiseStage { + ConvolveNoiseStage { first_channel } + } +} + +impl std::fmt::Display for ConvolveNoiseStage { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!( + f, + "convolve noise for channels [{},{},{}]", + self.first_channel, + self.first_channel + 1, + self.first_channel + 2 + ) + } +} + +impl RenderPipelineStage for ConvolveNoiseStage { + type Type = RenderPipelineInOutStage; + + fn uses_channel(&self, c: usize) -> bool { + c >= self.first_channel && c < self.first_channel + 3 + } + + fn process_row_chunk( + &mut self, + position: (usize, usize), + xsize: usize, + row: &mut [(&[&[f32]], &mut [&mut [f32]])], + ) { + for (input, output) in row { + for x in 0..xsize { + let mut others = 0.0; + for i in 0..5 { + let offset = (x as i32 + i) as usize; + others += input[0][offset]; + others += input[1][offset]; + others += input[3][offset]; + others += input[4][offset]; + } + others += input[2][x]; + others += input[2][x + 1]; + others += input[2][x + 3]; + others += input[2][x + 4]; + output[0][x] = others * 0.16 + input[2][x + 2] * -3.84; + } + } + } +} + +pub struct AddNoiseStage { + noise: Noise, + // TODO(zond): color_correlation + first_channel: usize, +} + +impl AddNoiseStage { + pub fn new(noise: Noise, first_channel: usize) -> AddNoiseStage { + AddNoiseStage { + noise, + first_channel, + } + } +} + +impl std::fmt::Display for AddNoiseStage { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!( + f, + "add noise for channels [{},{},{}]", + self.first_channel, + self.first_channel + 1, + self.first_channel + 2 + ) + } +} + +struct StrengthEvalLut<'a> { + noise: &'a Noise, +} + +impl StrengthEvalLut<'_> { + fn eval(&self, vx: f32) -> f32 { + let k_scale = (self.noise.lut.len() - 2) as f32; + let scaled_vx = f32::max(0.0, vx * k_scale); + let pre_floor_x = scaled_vx.floor(); + let pre_frac_x = scaled_vx / pre_floor_x; + let floor_x = if scaled_vx >= k_scale + 1.0 { + k_scale + } else { + pre_floor_x + }; + let frac_x = if scaled_vx >= k_scale + 1.0 { + 1.0 + } else { + pre_frac_x + }; + let floor_x_int = floor_x as usize; + let low = self.noise.lut[floor_x_int]; + let hi = self.noise.lut[floor_x_int + 1]; + (hi - low) * frac_x + low + } +} + +fn noise_strength(noise_model: &StrengthEvalLut, x: f32) -> f32 { + // clamp doesn't handle NaN the same way as min/max. + #[allow(clippy::manual_clamp)] + f32::max(0.0, f32::min(noise_model.eval(x), 1.0)) +} + +impl RenderPipelineStage for AddNoiseStage { + type Type = RenderPipelineInPlaceStage; + + fn uses_channel(&self, c: usize) -> bool { + c >= self.first_channel && c < self.first_channel + 3 + } + + fn process_row_chunk( + &mut self, + position: (usize, usize), + xsize: usize, + row: &mut [&mut [f32]], + ) { + let noise_model = StrengthEvalLut { noise: &self.noise }; + let norm_const = 0.22; + // TODO(zond): use self.color_correlation. + let ytox = 0.0; + // TODO(zond): use self.color_correlation. + let ytob = 1.0; + for x in 0..xsize { + let row_rnd_r = row[self.first_channel][x]; + let row_rnd_g = row[self.first_channel + 1][x]; + let row_rnd_c = row[self.first_channel + 2][x]; + let vx = row[0][x]; + let vy = row[1][x]; + let in_g = vy - vx; + let in_r = vy + vx; + let noise_strength_g = noise_strength(&noise_model, in_g * 0.5); + let noise_strength_r = noise_strength(&noise_model, in_r * 0.5); + let addit_rnd_noise_red = row_rnd_r * norm_const; + let addit_rnd_noise_green = row_rnd_g * norm_const; + let addit_rnd_noise_correlated = row_rnd_c * norm_const; + println!( + "{}, {}, {}, {}, {}, {}, {}", + addit_rnd_noise_red, + addit_rnd_noise_green, + addit_rnd_noise_correlated, + noise_strength_g, + noise_strength_r, + ytox, + ytob + ); + let k_rg_corr = 0.9921875f32; + let k_rgn_corr = 0.0078125f32; + let red_noise = noise_strength_r + * (k_rgn_corr * addit_rnd_noise_red + k_rg_corr * addit_rnd_noise_correlated); + let green_noise = noise_strength_g + * (k_rgn_corr * addit_rnd_noise_green + k_rg_corr * addit_rnd_noise_correlated); + let rg_noise = red_noise + green_noise; + row[0][x] += ytox * rg_noise + red_noise - green_noise; + row[1][x] += rg_noise; + row[2][x] += ytob * rg_noise; + } + } +} + +#[cfg(test)] +mod test { + use crate::{ + error::Result, + features::noise::Noise, + image::Image, + render::{ + stages::noise::{AddNoiseStage, ConvolveNoiseStage}, + test::make_and_run_simple_pipeline, + RenderPipelineStage, + }, + util::test::assert_almost_eq, + }; + use test_log::test; + + #[test] + fn convolve_noise_uses_channels() -> Result<()> { + let stage = ConvolveNoiseStage::new(1); + assert!( + !stage.uses_channel(0), + "shouldn't use channel < first_channel" + ); + for c in 1..=3 { + assert!( + stage.uses_channel(c), + "should use first_channel <= channel < first_channel + 3" + ); + } + assert!( + !stage.uses_channel(4), + "shouldn't use channel > first_channel + 3" + ); + Ok(()) + } + + #[test] + fn convolve_noise_process_row_chunk() -> Result<()> { + let input_c0: Image = Image::new_range((2, 2), 0.0f32, 1.0f32)?; + let input_c1: Image = Image::new_range((2, 2), 0.0f32, 1.0f32)?; + let input_c2: Image = Image::new_range((2, 2), 0.0f32, 1.0f32)?; + let stage = ConvolveNoiseStage::new(0); + let output: Vec> = + make_and_run_simple_pipeline(stage, &[input_c0, input_c1, input_c2], (2, 2), 256)?.1; + let rect = output[0].as_rect(); + assert_almost_eq!(rect.row(0)[0], 7.2f32, 1e-6f32); + assert_almost_eq!(rect.row(0)[1], 2.4f32, 1e-6f32); + assert_almost_eq!(rect.row(1)[0], -2.4f32, 1e-6f32); + assert_almost_eq!(rect.row(1)[1], -7.2f32, 1e-6f32); + Ok(()) + } + + #[test] + fn add_noise_uses_channels() -> Result<()> { + let stage = AddNoiseStage::new( + Noise { + lut: [ + 0.0f32, 0.0f32, 0.0f32, 0.0f32, 0.0f32, 0.0f32, 0.0f32, 0.0f32, + ], + }, + 1, + ); + assert!( + !stage.uses_channel(0), + "shouldn't use channel < first_channel" + ); + assert!(stage.uses_channel(1), "should use channel == first_channel"); + assert!( + !stage.uses_channel(4), + "shouldn't use channel > first_channel + 3" + ); + Ok(()) + } + + #[test] + fn add_noise_process_row_chunk() -> Result<()> { + let xsize = 8; + let ysize = 8; + let input_c0: Image = Image::new_range((xsize, ysize), 0.1f32, 0.1f32)?; + let input_c1: Image = Image::new_range((xsize, ysize), 0.1f32, 0.1f32)?; + let input_c2: Image = Image::new_range((xsize, ysize), 0.1f32, 0.1f32)?; + let stage = AddNoiseStage::new( + Noise { + lut: [1f32, 2f32, 3f32, 4f32, 5f32, 6f32, 7f32, 8f32], + }, + 0, + ); + let output: Vec> = make_and_run_simple_pipeline( + stage, + &[input_c0, input_c1, input_c2], + (xsize, ysize), + 256, + )? + .1; + // Golden data generated by libjxl. + let want_out = [ + [ + [ + 0.100000, 0.200000, 0.300000, 0.400000, 0.500000, 0.600000, 0.700000, 0.800000, + ], + [0.900000, 1.000000, 1.1, 1.2, 1.3, 1.4, 1.5, 1.6], + [1.7, 1.8, 1.9, 2.000000, 2.1, 2.2, 2.3, 2.4], + [ + 2.5, 2.6, 2.7, 2.799999, 2.899999, 2.999999, 3.099999, 3.199999, + ], + [ + 3.299999, 3.399999, 3.499999, 3.599999, 3.699999, 3.799999, 3.899998, 3.999998, + ], + [ + 4.099998, 4.199998, 4.299998, 4.399998, 4.499998, 4.599998, 4.699998, 4.799998, + ], + [ + 4.899998, 4.999998, 5.099998, 5.199997, 5.299997, 5.399997, 5.499997, 5.599997, + ], + [ + 5.699997, 5.799997, 5.899997, 5.999997, 6.099997, 6.199996, 6.299996, 6.399996, + ], + ], + [ + [ + 0.144000, 0.288000, 0.432000, 0.576000, 0.720000, 0.864000, 1.008, 1.152, + ], + [1.296, 1.44, 1.584, 1.728, 1.872, 2.016, 2.16, 2.304], + [2.448, 2.592, 2.736001, 2.88, 3.024, 3.168, 3.312, 3.456], + [ + 3.6, 3.743999, 3.888, 4.031999, 4.175999, 4.319999, 4.463999, 4.607999, + ], + [ + 4.751998, 4.895998, 5.039998, 5.183998, 5.327998, 5.471998, 5.615998, 5.759997, + ], + [ + 5.903998, 6.047997, 6.191998, 6.335998, 6.479997, 6.623997, 6.767997, 6.911997, + ], + [ + 7.055997, 7.199996, 7.343997, 7.487996, 7.631996, 7.775996, 7.919996, 8.063995, + ], + [ + 8.207995, 8.351995, 8.495996, 8.639996, 8.783995, 8.927995, 9.071995, 9.215995, + ], + ], + [ + [ + 0.144000, 0.288000, 0.432000, 0.576000, 0.720000, 0.864000, 1.008, 1.152, + ], + [1.296, 1.44, 1.584, 1.728, 1.872, 2.016, 2.16, 2.304], + [2.448, 2.592, 2.736001, 2.88, 3.024, 3.168, 3.312, 3.456], + [ + 3.6, 3.743999, 3.888, 4.031999, 4.175999, 4.319999, 4.463999, 4.607999, + ], + [ + 4.751998, 4.895998, 5.039998, 5.183998, 5.327998, 5.471998, 5.615998, 5.759997, + ], + [ + 5.903998, 6.047997, 6.191998, 6.335998, 6.479997, 6.623997, 6.767997, 6.911997, + ], + [ + 7.055997, 7.199996, 7.343997, 7.487996, 7.631996, 7.775996, 7.919996, 8.063995, + ], + [ + 8.207995, 8.351995, 8.495996, 8.639996, 8.783995, 8.927995, 9.071995, 9.215995, + ], + ], + ]; + for c in 0..3 { + let rect = output[c].as_rect(); + for y in 0..rect.size().1 { + for x in 0..rect.size().0 { + assert_almost_eq!(rect.row(y)[x], want_out[c][y][x], 1e-5f32); + } + } + } + Ok(()) + } +}