// Copyright 2021 The libgav1 Authors // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "src/dsp/film_grain.h" #include #include #include #include #include #include #include #include #include #include #include #include "absl/strings/match.h" #include "absl/strings/str_format.h" #include "absl/time/clock.h" #include "absl/time/time.h" #include "gtest/gtest.h" #include "src/dsp/common.h" #include "src/dsp/dsp.h" #include "src/dsp/film_grain_common.h" #include "src/film_grain.h" #include "src/utils/array_2d.h" #include "src/utils/common.h" #include "src/utils/constants.h" #include "src/utils/cpu.h" #include "src/utils/memory.h" #include "src/utils/threadpool.h" #include "src/utils/types.h" #include "tests/block_utils.h" #include "tests/third_party/libvpx/acm_random.h" #include "tests/utils.h" namespace libgav1 { namespace dsp { namespace film_grain { namespace { constexpr int kNumSpeedTests = 50; constexpr int kNumFilmGrainTestParams = 10; constexpr size_t kLumaBlockSize = kLumaWidth * kLumaHeight; constexpr size_t kChromaBlockSize = kMaxChromaWidth * kMaxChromaHeight; // Dimensions for unit tests concerning applying grain to the whole frame. constexpr size_t kNumTestStripes = 64; constexpr int kNoiseStripeHeight = 34; constexpr size_t kFrameWidth = 1921; constexpr size_t kFrameHeight = (kNumTestStripes - 1) * 32 + 1; /* The film grain parameters for 10 frames were generated with the following command line: aomenc --end-usage=q --cq-level=20 --cpu-used=8 -w 1920 -h 1080 \ --denoise-noise-level=50 --ivf breaking_bad_21m23s_10frames.1920_1080.yuv \ -o breaking_bad_21m23s_10frames.1920_1080.noise50.ivf */ constexpr FilmGrainParams kFilmGrainParams[10] = { {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/8, /*num_v_points=*/8, /*point_y_value=*/{0, 13, 27, 40, 54, 121, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{71, 71, 91, 99, 98, 100, 100, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 27, 40, 54, 67, 94, 255, 0, 0}, /*point_u_scaling=*/{37, 37, 43, 48, 48, 50, 51, 51, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 107, 255, 0, 0}, /*point_v_scaling=*/{48, 48, 43, 33, 32, 33, 34, 34, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 10, 3, -2, 1, -4, 5, -1, -25, -13, 3, -1, 0, 7, -20, 103, 26, -2, 1, 14, -49, 117}, /*auto_regression_coeff_u=*/{-2, 1, -3, 4, -4, 0, 3, 5, -5, -17, 17, 0, -10, -5, -3, -30, 14, 70, 29, 9, -2, -10, 50, 71, -11}, /*auto_regression_coeff_v=*/{3, -2, -7, 6, -7, -8, 3, 1, -12, -15, 28, 5, -11, -2, -7, -27, 32, 62, 31, 18, -2, -6, 61, 43, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/7391, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/8, /*num_u_points=*/7, /*num_v_points=*/8, /*point_y_value=*/{0, 13, 27, 40, 54, 94, 134, 255, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 91, 99, 97, 100, 102, 102, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 134, 255, 0, 0, 0}, /*point_u_scaling=*/{38, 38, 50, 49, 51, 53, 53, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 255, 0, 0}, /*point_v_scaling=*/{50, 50, 45, 34, 33, 35, 37, 37, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 10, 3, -1, 1, -3, 3, 1, -27, -12, 2, -1, 1, 7, -17, 100, 27, 0, -1, 13, -50, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 2, 5, -3, -16, 16, -2, -10, -2, -1, -31, 14, 70, 29, 9, -1, -10, 47, 70, -11}, /*auto_regression_coeff_v=*/{1, 0, -5, 5, -6, -6, 2, 1, -10, -14, 26, 4, -10, -3, -5, -26, 29, 63, 31, 17, -1, -6, 55, 47, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/10772, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/8, /*num_u_points=*/7, /*num_v_points=*/8, /*point_y_value=*/{0, 13, 27, 40, 54, 94, 134, 255, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{71, 71, 91, 99, 98, 101, 103, 103, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 81, 107, 255, 0, 0, 0}, /*point_u_scaling=*/{37, 37, 49, 48, 51, 52, 52, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 255, 0, 0}, /*point_v_scaling=*/{49, 49, 44, 34, 32, 34, 36, 36, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{1, -2, -2, 10, 3, -1, 1, -4, 4, 1, -26, -12, 2, -1, 1, 7, -18, 101, 26, -1, 0, 13, -49, 116}, /*auto_regression_coeff_u=*/{-3, 1, -3, 4, -3, -1, 2, 5, -4, -16, 17, -2, -10, -3, -2, -31, 15, 70, 28, 9, -1, -10, 48, 70, -11}, /*auto_regression_coeff_v=*/{1, -1, -6, 5, -6, -7, 2, 2, -11, -14, 27, 5, -11, -3, -6, -26, 30, 62, 30, 18, -2, -6, 58, 45, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/14153, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/5, /*num_v_points=*/7, /*point_y_value=*/{0, 13, 27, 40, 54, 121, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{71, 71, 90, 99, 98, 100, 100, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 107, 255, 0, 0, 0, 0, 0}, /*point_u_scaling=*/{37, 37, 48, 51, 51, 0, 0, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 94, 255, 0, 0, 0}, /*point_v_scaling=*/{49, 49, 43, 33, 32, 34, 34, 0, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 10, 3, -1, 1, -4, 6, 0, -26, -13, 3, -1, 1, 6, -20, 103, 26, -2, 1, 13, -48, 117}, /*auto_regression_coeff_u=*/{-3, 1, -2, 4, -4, -1, 2, 5, -5, -16, 18, -1, -10, -3, -2, -30, 16, 69, 28, 9, -2, -10, 50, 68, -11}, /*auto_regression_coeff_v=*/{2, -1, -6, 5, -6, -7, 2, 2, -11, -15, 29, 4, -10, -3, -6, -26, 30, 62, 31, 18, -3, -6, 59, 45, 3}, /*auto_regression_shift=*/8, /*grain_seed=*/17534, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/8, /*num_u_points=*/7, /*num_v_points=*/7, /*point_y_value=*/{0, 13, 27, 40, 54, 94, 134, 255, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{71, 71, 91, 99, 98, 101, 103, 103, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 81, 107, 255, 0, 0, 0}, /*point_u_scaling=*/{37, 37, 49, 49, 52, 53, 53, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 94, 255, 0, 0, 0}, /*point_v_scaling=*/{50, 50, 44, 34, 33, 36, 37, 0, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 10, 3, -1, 1, -4, 3, 1, -26, -12, 2, -1, 1, 7, -17, 101, 26, 0, 0, 13, -50, 116}, /*auto_regression_coeff_u=*/{-2, 1, -2, 3, -3, -1, 2, 5, -4, -16, 16, -2, -10, -3, -1, -31, 14, 70, 28, 9, -1, -10, 48, 70, -11}, /*auto_regression_coeff_v=*/{1, 0, -5, 5, -6, -6, 2, 2, -10, -14, 26, 4, -10, -3, -5, -26, 29, 63, 30, 17, -1, -6, 56, 47, 3}, /*auto_regression_shift=*/8, /*grain_seed=*/20915, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/7, /*num_v_points=*/7, /*point_y_value=*/{0, 13, 27, 40, 54, 134, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 91, 99, 97, 101, 101, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 107, 255, 0, 0, 0}, /*point_u_scaling=*/{38, 38, 51, 50, 52, 53, 54, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 94, 255, 0, 0, 0}, /*point_v_scaling=*/{51, 51, 45, 35, 33, 36, 36, 0, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 9, 3, -1, 1, -3, 2, 2, -27, -12, 2, 0, 1, 7, -16, 100, 27, 0, -1, 13, -51, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 1, 4, -2, -17, 14, -3, -10, -2, 0, -31, 14, 71, 29, 8, -2, -10, 45, 71, -11}, /*auto_regression_coeff_v=*/{0, -1, -5, 4, -6, -5, 2, 1, -9, -14, 24, 3, -10, -3, -4, -25, 29, 63, 31, 16, -1, -7, 54, 48, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/24296, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/7, /*num_v_points=*/8, /*point_y_value=*/{0, 13, 27, 40, 54, 134, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 91, 99, 97, 101, 101, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 134, 255, 0, 0, 0}, /*point_u_scaling=*/{38, 38, 50, 50, 51, 53, 53, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 255, 0, 0}, /*point_v_scaling=*/{50, 50, 45, 34, 33, 35, 36, 36, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{2, -2, -2, 10, 3, -1, 1, -3, 3, 2, -27, -12, 2, 0, 1, 7, -17, 100, 27, 0, -1, 13, -51, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 1, 5, -3, -16, 15, -2, -10, -2, -1, -31, 14, 70, 29, 8, -1, -10, 46, 71, -11}, /*auto_regression_coeff_v=*/{1, 0, -5, 5, -6, -5, 2, 1, -9, -14, 25, 4, -10, -3, -5, -25, 29, 63, 31, 17, -1, -7, 55, 47, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/27677, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/7, /*num_v_points=*/8, /*point_y_value=*/{0, 13, 27, 40, 54, 121, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 92, 99, 97, 101, 101, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 174, 255, 0, 0, 0}, /*point_u_scaling=*/{38, 38, 51, 50, 52, 54, 54, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 255, 0, 0}, /*point_v_scaling=*/{51, 51, 46, 35, 33, 35, 37, 37, 0, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{1, -1, -2, 9, 3, -1, 1, -3, 2, 2, -28, -12, 2, 0, 1, 8, -16, 99, 27, 0, -1, 13, -51, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 2, 4, -2, -16, 14, -3, -10, -2, 0, -31, 13, 71, 29, 8, -2, -11, 44, 72, -11}, /*auto_regression_coeff_v=*/{0, -1, -5, 4, -6, -4, 2, 1, -9, -13, 23, 3, -10, -3, -4, -25, 28, 63, 32, 16, -1, -7, 54, 49, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/31058, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/7, /*num_v_points=*/9, /*point_y_value=*/{0, 13, 27, 40, 54, 121, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 92, 99, 98, 100, 98, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 228, 255, 0, 0, 0}, /*point_u_scaling=*/{38, 38, 51, 51, 52, 54, 54, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 201, 255, 0}, /*point_v_scaling=*/{51, 51, 46, 35, 34, 35, 37, 37, 37, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{1, -1, -2, 9, 3, -1, 1, -3, 2, 2, -28, -12, 2, 0, 1, 8, -16, 99, 27, 0, -1, 13, -52, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 1, 4, -2, -16, 13, -3, -10, -2, 0, -31, 13, 71, 29, 8, -2, -11, 44, 72, -11}, /*auto_regression_coeff_v=*/{0, -1, -5, 4, -6, -4, 2, 2, -8, -13, 23, 3, -10, -3, -4, -25, 28, 63, 32, 16, -1, -7, 54, 49, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/34439, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}, {/*apply_grain=*/true, /*update_grain=*/true, /*chroma_scaling_from_luma=*/false, /*overlap_flag=*/true, /*clip_to_restricted_range=*/false, /*num_y_points=*/7, /*num_u_points=*/7, /*num_v_points=*/9, /*point_y_value=*/{0, 13, 27, 40, 54, 121, 255, 0, 0, 0, 0, 0, 0, 0}, /*point_y_scaling=*/{72, 72, 92, 99, 98, 99, 95, 0, 0, 0, 0, 0, 0, 0}, /*point_u_value=*/{0, 13, 40, 54, 67, 228, 255, 0, 0, 0}, /*point_u_scaling=*/{39, 39, 51, 51, 52, 54, 54, 0, 0, 0}, /*point_v_value=*/{0, 13, 27, 40, 54, 67, 121, 201, 255, 0}, /*point_v_scaling=*/{51, 51, 46, 35, 34, 35, 36, 35, 35, 0}, /*chroma_scaling=*/11, /*auto_regression_coeff_lag=*/3, /*auto_regression_coeff_y=*/{1, -1, -2, 9, 3, -1, 1, -3, 2, 2, -28, -11, 2, 0, 1, 8, -16, 99, 27, 0, -1, 13, -52, 116}, /*auto_regression_coeff_u=*/{-3, 1, -2, 3, -3, -1, 1, 4, -2, -16, 13, -3, -10, -2, 0, -30, 13, 71, 29, 8, -2, -10, 43, 72, -11}, /*auto_regression_coeff_v=*/{0, -1, -5, 3, -6, -4, 2, 2, -8, -13, 23, 3, -10, -3, -4, -25, 28, 64, 32, 16, -1, -7, 53, 49, 2}, /*auto_regression_shift=*/8, /*grain_seed=*/37820, /*reference_index=*/0, /*grain_scale_shift=*/0, /*u_multiplier=*/0, /*u_luma_multiplier=*/64, /*u_offset=*/0, /*v_multiplier=*/0, /*v_luma_multiplier=*/64, /*v_offset=*/0}}; const char* GetTestDigestLuma(int bitdepth, int param_index) { static const char* const kTestDigestsLuma8bpp[10] = { "80da8e849110a10c0a73f9dec0d9a2fb", "54352f02aeda541e17a4c2d208897e2b", "2ad9021124c82aca3e7c9517d00d1236", "f6c5f64513925b09ceba31e92511f8a1", "46c6006578c68c3c8619f7a389c7de45", "fcddbd27545254dc50f1c333c8b7e313", "c6d4dc181bf7f2f93ae099b836685151", "2949ef836748271195914fef9acf4e46", "524e79bb87ed550e123d00a61df94381", "182222470d7b7a80017521d0261e4474", }; static const char* const kTestDigestsLuma10bpp[10] = { "27a49a2131fb6d4dd4b8c34da1b7642e", "4ea9134f6831dd398545c85b2a68e31f", "4e12232a18a2b06e958d7ab6b953faad", "0ede12864ddaced2d8062ffa4225ce24", "5fee492c4a430b2417a64aa4920b69e9", "39af842a3f9370d796e8ef047c0c42a8", "0efbad5f9dc07391ad243232b8df1787", "2bd41882cd82960019aa2b87d5fb1fbc", "1c66629c0c4e7b6f9b0a7a6944fbad50", "2c633a50ead62f8e844a409545f46244", }; static const char* const kTestDigestsLuma12bpp[10] = { "1dc9b38a93454a85eb924f25346ae369", "5f9d311ee5384a5a902f8e2d1297319e", "cf1a35878720564c7a741f91eef66565", "47a0608fe0f6f7ccae42a5ca05783cbf", "dbc28da0178e3c18a036c3f2203c300f", "04911d2074e3252119ee2d80426b8c01", "df19ab8103c40b726c842ccf7772208b", "39276967eb16710d98f82068c3eeba41", "b83100f18abb2062d9c9969f07182b86", "b39a69515491329698cf66f6d4fa371f", }; switch (bitdepth) { case 8: return kTestDigestsLuma8bpp[param_index]; case 10: return kTestDigestsLuma10bpp[param_index]; case 12: return kTestDigestsLuma12bpp[param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetTestDigestChromaU(int bitdepth, int param_index) { static const char* const kTestDigestsChromaU8bpp[10] = { "e56b7bbe9f39bf987770b18aeca59514", "d0b3fd3cf2901dae31b73f20c510d83e", "800c01d58d9fb72136d21ec2bb07899a", "4cd0badba679e8edbcd60a931fce49a1", "cabec236cc17f91f3f08d8cde867aa72", "380a2205cf2d40c6a27152585f61a3b0", "3813526234dc7f90f80f6684772c729a", "97a43a73066d88f9cbd915d56fc9c196", "5b70b27a43dd63b03e23aecd3a935071", "d5cc98685582ffd47a41a97d2e377ac8", }; static const char* const kTestDigestsChromaU10bpp[10] = { "9a6d0369ba86317598e65913276dae6d", "2512bdc4c88f21f8185b040b7752d1db", "1e86b779ce6555fcf5bd0ade2af67e73", "5ad463a354ffce522c52b616fb122024", "290d53c22c2143b0882acb887da3fdf1", "54622407d865371d7e70bbf29fdda626", "be306c6a94c55dbd9ef514f0ad4a0011", "904602329b0dec352b3b177b0a2554d2", "58afc9497d968c67fdf2c0cf23b33aa3", "74fee7be6f62724bf901fdd04a733b46", }; static const char* const kTestDigestsChromaU12bpp[10] = { "846d608050fe7c19d6cabe2d53cb7821", "2caf4665a26aad50f68497e4b1326417", "ce40f0f8f8c207c7c985464c812fea33", "820de51d07a21da5c00833bab546f1fa", "5e7bedd8933cd274af03babb4dbb94dd", "d137cf584eabea86387460a6d3f62bfe", "f206e0c6ed35b3ab35c6ff37e151e963", "55d87981b7044df225b3b5935185449b", "6a655c8bf4df6af0e80ae6d004a73a25", "6234ae36076cc77161af6e6e3c04449a", }; switch (bitdepth) { case 8: return kTestDigestsChromaU8bpp[param_index]; case 10: return kTestDigestsChromaU10bpp[param_index]; case 12: return kTestDigestsChromaU12bpp[param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetTestDigestChromaV(int bitdepth, int param_index) { static const char* const kTestDigestsChromaV8bpp[10] = { "7205ed6c07ed27b7b52d871e0559b8fa", "fad033b1482dba0ed2d450b461fa310e", "6bb39798ec6a0f7bda0b0fcb0a555734", "08c19856e10123ae520ccfc63e2fbe7b", "a7695a6b69fba740a50310dfa6cf1c00", "ac2eac2d13fc5b21c4f2995d5abe14b9", "be35cb30062db628a9e1304fca8b75dc", "f5bfc7a910c76bcd5b32c40772170879", "aca07b37d63f978d76df5cd75d0cea5e", "107c7c56d4ec21f346a1a02206301b0d", }; static const char* const kTestDigestsChromaV10bpp[10] = { "910724a77710996c90e272f1c1e9ff8e", "d293f861580770a89f1e266931a012ad", "9e4f0c85fb533e51238586f9c3e68b6e", "a5ff4478d9eeb2168262c2e955e17a4f", "fba6b1e8f28e4e90c836d41f28a0c154", "50b9a93f9a1f3845e6903bff9270a3e6", "7b1624c3543badf5fadaee4d1e602e6b", "3be074e4ca0eec5770748b15661aaadd", "639197401032f272d6c30666a2d08f43", "28075dd34246bf9d5e6197b1944f646a", }; static const char* const kTestDigestsChromaV12bpp[10] = { "4957ec919c20707d594fa5c2138c2550", "3f07c65bfb42c81768b1f5ad9611d1ce", "665d9547171c99faba95ac81a35c9a0c", "1b5d032e0cefdb4041ad51796de8a45e", "18fa974579a4f1ff8cd7df664fc339d5", "2ffaa4f143495ff73c06a580a97b6321", "4fd1f562bc47a68dbfaf7c566c7c4da6", "4d37c80c9caf110c1d3d20bd1a1875b3", "8ea29759640962613166dc5154837d14", "5ca4c10f42d0906c72ebee90fae6ce7d", }; switch (bitdepth) { case 8: return kTestDigestsChromaV8bpp[param_index]; case 10: return kTestDigestsChromaV10bpp[param_index]; case 12: return kTestDigestsChromaV12bpp[param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetARTestDigestLuma(int bitdepth, int coeff_lag, int param_index) { static const char* const kTestDigestsLuma8bpp[3][kNumFilmGrainTestParams] = { {"a835127918f93478b45f1ba4d20d81bd", "a835127918f93478b45f1ba4d20d81bd", "e5db4da626e214bb17bcc7ecffa76303", "a835127918f93478b45f1ba4d20d81bd", "a835127918f93478b45f1ba4d20d81bd", "e5db4da626e214bb17bcc7ecffa76303", "a835127918f93478b45f1ba4d20d81bd", "1da62b7233de502123a18546b6c97da2", "1da62b7233de502123a18546b6c97da2", "1da62b7233de502123a18546b6c97da2"}, {"11464b880de3ecd6e6189c5c4e7f9b28", "dfe411762e283b5f49bece02ec200951", "5c534d92afdf0a5b53dbe4fe7271929c", "2e1a68a18aca96c31320ba7ceab59be9", "584c0323e6b276cb9acb1a294d462d58", "9571eb8f1cbaa96ea3bf64a820a8d9f0", "305285ff0df87aba3c59e3fc0818697d", "0066d35c8818cf20230114dcd3765a4d", "0066d35c8818cf20230114dcd3765a4d", "16d61b046084ef2636eedc5a737cb6f6"}, {"0c9e2cf1b6c3cad0f7668026e8ea0516", "7d094855292d0eded9e0d1b5bab1990b", "fbf28860a5f1285dcc6725a45256a86a", "dccb906904160ccabbd2c9a7797a4bf9", "46f645e17f08a3260b1ae70284e5c5b8", "124fdc90bed11a7320a0cbdee8b94400", "8d2978651dddeaef6282191fa146f0a0", "28b4d5aa33f05b3fb7f9323a11936bdc", "6a8ea684f6736a069e3612d1af6391a8", "2781ea40a63704dbfeb3a1ac5db6f2fc"}, }; static const char* const kTestDigestsLuma10bpp[3][kNumFilmGrainTestParams] = { {"5e6bc8444ece2d38420f51d82238d812", "5e6bc8444ece2d38420f51d82238d812", "2bfaec768794af33d60a9771f971f68d", "5e6bc8444ece2d38420f51d82238d812", "5e6bc8444ece2d38420f51d82238d812", "c880807a368c4e82c23bea6f035ad23f", "5e6bc8444ece2d38420f51d82238d812", "c576667da5286183ec3aab9a76f53a2e", "c576667da5286183ec3aab9a76f53a2e", "c576667da5286183ec3aab9a76f53a2e"}, {"095c2dd4d4d52aff9696df9bfdb70062", "983d14afa497060792d472a449a380c7", "c5fdc0f7c594b2b36132cec6f45a79bd", "acff232ac5597c1712213150552281d1", "4dd7341923b1d260092853553b6b6246", "0ca8afd71a4f564ea1ce69c4af14e9ab", "9bc7565e5359d09194fcee28e4bf7b94", "6fea7805458b9d149f238a30e2dc3f13", "6fea7805458b9d149f238a30e2dc3f13", "681dff5fc7a7244ba4e4a582ca7ecb14"}, {"cb99352c9c6300e7e825188bb4adaee0", "7e40674de0209bd72f8e9c6e39ee6f7c", "3e475572f6b4ecbb2730fd16751ad7ed", "e6e4c63abc9cb112d9d1f23886cd1415", "1a1c953b175c105c604902877e2bab18", "380a53072530223d4ee622e014ee4bdb", "6137394ea1172fb7ea0cbac237ff1703", "85ab0c813e46f97cb9f42542f44c01ad", "68c8ac462f0e28cb35402c538bee32f1", "0038502ffa4760c8feb6f9abd4de7250"}, }; static const char* const kTestDigestsLuma12bpp[3][kNumFilmGrainTestParams] = { {"d618bbb0e337969c91b1805f39561520", "d618bbb0e337969c91b1805f39561520", "678f6e911591daf9eca4e305dabdb2b3", "d618bbb0e337969c91b1805f39561520", "d618bbb0e337969c91b1805f39561520", "3b26f49612fd587c7360790d40adb5de", "d618bbb0e337969c91b1805f39561520", "33f77d3ff50cfc64c6bc9a896b567377", "33f77d3ff50cfc64c6bc9a896b567377", "33f77d3ff50cfc64c6bc9a896b567377"}, {"362fd67050fb7abaf57c43a92d993423", "e014ae0eb9e697281015c38905cc46ef", "82b867e57151dc08afba31eccf5ccf69", "a94ba736cdce7bfa0b550285f59e47a9", "3f1b0b7dd3b10e322254d35e4e185b7c", "7929708e5f017d58c53513cb79b35fda", "6d26d31a091cbe642a7070933bd7de5a", "dc29ac40a994c0a760bfbad0bfc15b3a", "dc29ac40a994c0a760bfbad0bfc15b3a", "399b919db5190a5311ce8d166580827b"}, {"6116d1f569f5b568eca4dc1fbf255086", "7e9cf31ea74e8ea99ffd12094ce6cd05", "bb982c4c39e82a333d744defd16f4388", "7c6e584b082dc6b97ed0d967def3993f", "fb234695353058f03c8e128f2f8de130", "9218c6ca67bf6a9237f98aa1ce7acdfd", "d1fb834bbb388ed066c5cbc1c79b5bdf", "d6f630daedc08216fcea12012e7408b5", "dd7fe49299e6f113a98debc7411c8db8", "8b89e45a5101a28c24209ae119eafeb8"}, }; switch (bitdepth) { case 8: return kTestDigestsLuma8bpp[coeff_lag - 1][param_index]; case 10: return kTestDigestsLuma10bpp[coeff_lag - 1][param_index]; case 12: return kTestDigestsLuma12bpp[coeff_lag - 1][param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetARTestDigestChromaU(int bitdepth, int coeff_lag, int subsampling_x, int subsampling_y) { static const char* const kTestDigestsChromaU8bpp[12] = { "11ced66de0eaf55c1ff9bad18d7b8ed7", "0c3b77345dd4ab0915ef53693ab93ce4", "b0645044ba080b3ceb8f299e269377d6", "50590ad5d895f0b4bc6694d878e9cd32", "85e1bf3741100135062f5b4abfe7639b", "76955b70dde61ca5c7d079c501b90906", "3f0995e1397fd9efd9fc46b67f7796b3", "0a0d6c3e4e1649eb101395bc97943a07", "1878855ed8db600ccae1d39abac52ec6", "13ab2b28320ed3ac2b820f08fdfd424d", "f3e95544a86ead5387e3dc4e043fd0f0", "ff8f5d2d97a6689e16a7e4f482f69f0b", }; static const char* const kTestDigestsChromaU10bpp[12] = { "707f2aa5aa7e77bc6e83ab08287d748d", "0bcf40c7fead9ac3a5d71b4cc1e21549", "0c1df27053e5da7cf1276a122a8f4e8b", "782962f7425eb38923a4f87e7ab319d9", "b4a709ae5967afef55530b9ea8ef0062", "70a971a0b9bf06212d510b396f0f9095", "d033b89d6e31f8b13c83d94c840b7d54", "40bbe804bf3f90cee667d3b275e3c964", "90bb2b9d518b945adcfd1b1807f7d170", "4bc34aa157fe5ad4270c611afa75e878", "e2688d7286cd43fe0a3ea734d2ad0f77", "853193c4981bd882912171061327bdf2", }; static const char* const kTestDigestsChromaU12bpp[12] = { "04c23b01d01c0e3f3247f3741581b383", "9f8ea1d66e44f6fe93d765ce56b2b0f3", "5dda44b128d6c244963f1e8e17cc1d22", "9dd0a79dd2f772310a95762d445bface", "0dbd40d930e4873d72ea72b9e3d62440", "d7d83c207c6b435a164206d5f457931f", "e8d04f6e63ed63838adff965275a1ff1", "fc09a903e941fcff8bad67a84f705775", "9cd706606a2aa40d0957547756f7abd9", "258b37e7b8f48db77dac7ea24073fe69", "80149b8bb05308da09c1383d8b79d3da", "e993f3bffae53204a1942feb1af42074", }; assert(!(subsampling_x == 0 && subsampling_y == 1)); const int base_index = 3 * coeff_lag + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigestsChromaU8bpp[base_index]; case 10: return kTestDigestsChromaU10bpp[base_index]; case 12: return kTestDigestsChromaU12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetARTestDigestChromaV(int bitdepth, int coeff_lag, int subsampling_x, int subsampling_y) { static const char* const kTestDigestsChromaV8bpp[12] = { "5c2179f3d93be0a0da75d2bb90347c2f", "79b883847d7eaa7890e1d633b8e34353", "90ade818e55808e8cf58c11debb5ddd1", "1d0f2a14bc4df2b2a1abaf8137029f92", "ac753a57ade140dccb50c14f941ae1fc", "d24ab497558f6896f08dc17bcc3c50c1", "3d74436c63920022a95c85b234db4e33", "061c2d53ed84c830f454e395c362cb16", "05d24869d7fb952e332457a114c8b9b7", "fcee31b87a2ada8028c2a975e094856a", "c019e2c475737abcf9c2b2a52845c646", "9cd994baa7021f8bdf1d1c468c1c8e9c", }; static const char* const kTestDigestsChromaV10bpp[12] = { "bc9e44454a05cac8571c15af5b720e79", "f0374436698d94e879c03331b1f30df4", "4580dd009abd6eeed59485057c55f63e", "7d1f7aecd45302bb461f4467f2770f72", "1f0d003fce6c5fedc147c6112813f43b", "4771a45c2c1a04c375400619d5536035", "df9cf619a78907c0f6e58bc13d7d5546", "dd3715ce65d905f30070a36977c818e0", "32de5800f76e34c128a1d89146b4010b", "db9d7c70c3f69feb68fae04398efc773", "d3d0912e3fdb956fef416a010bd7b4c2", "a2fca8abd9fd38d2eef3c4495d9eff78", }; static const char* const kTestDigestsChromaV12bpp[12] = { "0d1890335f4464167de22353678ca9c6", "9e6830aba73139407196f1c811f910bc", "6018f2fb76bd648bef0262471cfeba5c", "78e1ae1b790d709cdb8997621cf0fde3", "5b44ae281d7f9db2f17aa3c24b4741dd", "f931d16991669cb16721de87da9b8067", "5580f2aed349d9cabdafb9fc25a57b1c", "86918cd78bf95e6d4405dd050f5890b8", "13c8b314eeebe35fa60b703d94e1b2c1", "13c6fb75cab3f42e0d4ca31e4d068b0e", "bb9ca0bd6f8cd67e44c8ac2803abf5a5", "0da4ea711ffe557bb66577392b6f148b", }; assert(!(subsampling_x == 0 && subsampling_y == 1)); const int base_index = 3 * coeff_lag + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigestsChromaV8bpp[base_index]; case 10: return kTestDigestsChromaV10bpp[base_index]; case 12: return kTestDigestsChromaV12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetGrainGenerationTestDigestLuma(int bitdepth, int param_index) { static const char* const kTestDigestsLuma8bpp[kNumFilmGrainTestParams] = { "c48babd99e5cfcbaa13d8b6e0c12e644", "da4b971d2de19b709e2bc98d2e50caf3", "96c72faac19a79c138afeea8b8ae8c7a", "90a2b9c8304a44d14e83ca51bfd2fe8a", "72bd3aa85c17850acb430afb4183bf1a", "a0acf76349b9efbc9181fc31153d9ef6", "6da74dd631a4ec8b9372c0bbec22e246", "6e11fa230f0e5fbb13084255c22cabf9", "be1d257b762f9880d81680e9325932a2", "37e302075af8130b371de4430e8a22cf", }; static const char* const kTestDigestsLuma10bpp[kNumFilmGrainTestParams] = { "0a40fd2f261095a6154584a531328142", "9d0c8173a94a0514c769e94b6f254030", "7894e959fdd5545895412e1512c9352d", "6802cad2748cf6db7f66f53807ee46ab", "ea24e962b98351c3d929a8ae41e320e2", "b333dc944274a3a094073889ca6e11d6", "7211d7ac0ff7d11b5ef1538c0d98f43d", "ef9f9cbc101a07da7bfa62637130e331", "85a122e32648fde84b883a1f98947c60", "dee656e3791138285bc5b71e3491a177", }; static const char* const kTestDigestsLuma12bpp[kNumFilmGrainTestParams] = { "ae359794b5340d073d597117046886ac", "4d4ad3908b4fb0f248a0086537dd6b1e", "672a97e15180cbeeaf76d763992c9f23", "739124d10d16e00a158e833ea92107bc", "4c38c738ff7ffc50adaa4474584d3aae", "ca05ba7e51000a7d10e5cbb2101bbd86", "e207022b916bf03a76ac8742af29853d", "7454bf1859149237ff74f1161156c857", "10fc2a16e663bbc305255b0883cfcd45", "4228abff6899bb33839b579288ab29fe", }; switch (bitdepth) { case 8: return kTestDigestsLuma8bpp[param_index]; case 10: return kTestDigestsLuma10bpp[param_index]; case 12: return kTestDigestsLuma12bpp[param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetConstructStripesTestDigest(int bitdepth, int overlap_flag, int subsampling_x, int subsampling_y) { static const char* const kTestDigests8bpp[6] = { "cd14aaa6fc1728290fa75772730a2155", "13ad4551feadccc3a3a9bd5e25878d2a", "ed6ad9532c96ef0d79ff3228c89a429f", "82f307a7f5fc3308c3ebe268b5169e70", "aed793d525b85349a8c2eb6d40e93969", "311c3deb727621a7d4f18e8defb65de7", }; static const char* const kTestDigests10bpp[6] = { "4fe2fa1e428737de3595be3a097d0203", "80568c3c3b53bdbbd03b820179092dcd", "bc7b73099961a0739c36e027d6d09ea1", "e5331364e5146a6327fd94e1467f59a3", "125bf18b7787e8f0792ea12f9210de0d", "21cf98cbce17eca77dc150cc9be0e0a0", }; static const char* const kTestDigests12bpp[6] = { "57f8e17078b6e8935252e918a2562636", "556a7b294a99bf1163b7166b4f68357e", "249bee5572cd7d1cc07182c97adc4ba7", "9bf43ae1998c2a5b2e5f4d8236b58747", "477c08fa26499936e5bb03bde097633e", "fe64b7166ff87ea0711ae4f519cadd59", }; const int base_index = 3 * overlap_flag + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigests8bpp[base_index]; case 10: return kTestDigests10bpp[base_index]; case 12: return kTestDigests12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetConstructImageTestDigest(int bitdepth, int overlap_flag, int subsampling_x, int subsampling_y) { static const char* const kTestDigests8bpp[6] = { "17030fc692e685557a3717f9334af7e8", "d16ea46147183cd7bc36bcfc2f936a5b", "68152958540dbec885f71e3bcd7aa088", "bb43b420f05a122eb4780aca06055ab1", "87567b04fbdf64f391258c0742de266b", "ce87d556048b3de32570faf6729f4010", }; static const char* const kTestDigests10bpp[6] = { "5b31b29a5e22126a9bf8cd6a01645777", "2bb94a25164117f2ab18dae18e2c6577", "27e57a4ed6f0c9fe0a763a03f44805e8", "481642ab0b07437b76b169aa4eb82123", "656a9ef056b04565bec9ca7e0873c408", "a70fff81ab28d02d99dd4f142699ba39", }; static const char* const kTestDigests12bpp[6] = { "146f7ceadaf77e7a3c41e191a58c1d3c", "de18526db39630936733e687cdca189e", "165c96ff63bf3136505ab1d239f7ceae", "a102636662547f84e5f6fb6c3e4ef959", "4cb073fcc783c158a95c0b1ce0d27e9f", "3a734c71d4325a7da53e2a6e00f81647", }; const int base_index = 3 * overlap_flag + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigests8bpp[base_index]; case 10: return kTestDigests10bpp[base_index]; case 12: return kTestDigests12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetScalingInitTestDigest(int param_index, int bitdepth) { static const char* const kTestDigests8bpp[kNumFilmGrainTestParams] = { "315202ca3bf9c46eac8605e89baffd2a", "640f6408702b07ab7e832e7326cce56f", "f75ee83e3912a3f25949e852d67326cf", "211223f5d6a4b42a8e3c662f921b71c0", "f75ee83e3912a3f25949e852d67326cf", "e7a1de8c5a2cac2145c586ecf1f9051c", "e7a1de8c5a2cac2145c586ecf1f9051c", "276fe5e3b30b2db2a9ff798eb6cb8e00", "ac67f1c3aff2f50ed4b1975bde67ffe3", "8db6145a60d506cc94f07cef8b27c681", }; static const char* const kTestDigests10bpp[kNumFilmGrainTestParams] = { "c50be59c62b634ff45ddfbe5b978adfc", "7626286109a2a1eaf0a26f6b2bbab9aa", "f2302988140c47a0724fc55ff523b6ec", "5318e33d8a59a526347ffa6a72ba6ebd", "f2302988140c47a0724fc55ff523b6ec", "f435b5fe98e9d8b6c61fa6f457601c2c", "f435b5fe98e9d8b6c61fa6f457601c2c", "ff07a2944dbe094d01e199098764941c", "11b3e256c74cee2b5679f7457793869a", "89fab5c1db09e242d0494d1c696a774a", }; static const char* const kTestDigests12bpp[kNumFilmGrainTestParams] = { "1554df49a863a851d146213e09d311a4", "84808c3ed3b5495a62c9d2dd9a08cb26", "bb31f083a3bd9ef26587478b8752f280", "34fdfe61d6871e4882e38062a0725c5c", "bb31f083a3bd9ef26587478b8752f280", "e7b8c3e4508ceabe89b78f10a9e160b8", "e7b8c3e4508ceabe89b78f10a9e160b8", "a0ccc9e3d0f0c9d1f08f1249264d92f5", "7992a96883c8a9a35d6ca8961bc4515b", "de906ce2c0fceed6f168215447b21b16", }; switch (bitdepth) { case 8: return kTestDigests8bpp[param_index]; case 10: return kTestDigests10bpp[param_index]; case 12: return kTestDigests12bpp[param_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetBlendLumaTestDigest(int bitdepth) { static const char* const kTestDigests[] = { "de35b16c702690b1d311cdd0973835d7", "60e9f24dcaaa0207a8db5ab5f3c66608", "8e7d44b620bb7768459074be6bfbca7b", }; assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return kTestDigests[(bitdepth - 8) / 2]; } const char* GetBlendChromaUTestDigest(int bitdepth, int chroma_scaling_from_luma, int subsampling_x, int subsampling_y) { static const char* const kTestDigests8bpp[6] = { "36ca194734d45e75079baba1f3ec9e9e", "182b388061f59fd3e24ef4581c536e67", "2e7843b4c624f03316c3cbe1cc835859", "39e6d9606915da6a41168fbb006b55e4", "3f44a4e252d4823544ac66a900dc7983", "1860f0831841f262d66b23f6a6b5833b", }; static const char* const kTestDigests10bpp[6] = { "2054665564f55750c9588b505eb01ac0", "4d8b0e248f8a6bfc72516aa164e76b0b", "7e549800a4f9fff6833bb7738e272baf", "8de6f30dcda99a37b359fd815e62d2f7", "9b7958a2278a16bce2b7bc31fdd811f5", "c5c3c8cccf6a2b4e40b4a412a5bf4f08", }; static const char* const kTestDigests12bpp[6] = { "8fad0cc641da35e0d2d8f178c7ce8394", "793eb9d2e6b4ea2e3bb08e7068236155", "9156bd85ab9493d8867a174f920bb1e6", "6834319b4c88e3e0c96b6f8d7efd08dd", "c40e492790d3803a734efbc6feca46e2", "d884c3b1e2c21d98844ca7639e0599a5", }; const int base_index = 3 * chroma_scaling_from_luma + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigests8bpp[base_index]; case 10: return kTestDigests10bpp[base_index]; case 12: return kTestDigests12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } const char* GetBlendChromaVTestDigest(int bitdepth, int chroma_scaling_from_luma, int subsampling_x, int subsampling_y) { static const char* const kTestDigests8bpp[6] = { "9a353e4f86d7ebaa980f7f6cfc0995ad", "17589b4039ed49ba16f32db9fae724b7", "76ae8bed48a173b548993b6e1824ff67", "c1458ac9bdfbf0b4d6a175343b17b27b", "fa76d1c8e48957537f26af6a5b54ec14", "313fe3c34568b7f9c5ecb09d419d4ba4", }; static const char* const kTestDigests10bpp[6] = { "8ab5a8e03f07547260033d6a0b689e3c", "275ede58d311e2f5fd76f222f45a64fc", "ce13916e0f7b02087fd0356534d32770", "165bfc8cda0266936a67fa4ec9b215cb", "ed4382caa936acf1158ff8049d18ffac", "942bdd1344c9182dd7572099fb9372db", }; static const char* const kTestDigests12bpp[6] = { "70704a1e171a3a70d40b7d0037a75fbc", "62549e2afbf36a1ed405a6574d39c542", "e93889927ab77c6e0767ff071d980c02", "a0c1f6ed78874137710fee7418d80959", "f6283e36a25cb867e30bdf0bfdb2124b", "741c2d48898835b9d9e3bd0b6ac6269a", }; const int base_index = 3 * chroma_scaling_from_luma + subsampling_x + subsampling_y; switch (bitdepth) { case 8: return kTestDigests8bpp[base_index]; case 10: return kTestDigests10bpp[base_index]; case 12: return kTestDigests12bpp[base_index]; default: assert(bitdepth == 8 || bitdepth == 10 || bitdepth == 12); return nullptr; } } // GetFilmGrainRandomNumber() is only invoked with |bits| equal to 11 or 8. Test // both values of |bits|. TEST(FilmGrainTest, GetFilmGrainRandomNumber) { uint16_t seed = 51968; const struct { int rand; uint16_t seed; } kExpected11[5] = { {812, 25984}, {406, 12992}, {1227, 39264}, {1637, 52400}, {818, 26200}, }; for (int i = 0; i < 5; ++i) { int rand = GetFilmGrainRandomNumber(11, &seed); EXPECT_EQ(rand, kExpected11[i].rand) << "i = " << i; EXPECT_EQ(seed, kExpected11[i].seed) << "i = " << i; } const struct { int rand; uint16_t seed; } kExpected8[5] = { {179, 45868}, {89, 22934}, {44, 11467}, {150, 38501}, {75, 19250}, }; for (int i = 0; i < 5; ++i) { int rand = GetFilmGrainRandomNumber(8, &seed); EXPECT_EQ(rand, kExpected8[i].rand) << "i = " << i; EXPECT_EQ(seed, kExpected8[i].seed) << "i = " << i; } } // In FilmGrainParams, if num_u_points and num_v_points are both 0 and // chroma_scaling_from_luma is false, GenerateChromaGrains() should set both // the u_grain and v_grain arrays to all zeros. TEST(FilmGrainTest, GenerateZeroChromaGrains) { FilmGrainParams film_grain_params = {}; film_grain_params.apply_grain = true; film_grain_params.update_grain = true; film_grain_params.chroma_scaling = 8; film_grain_params.auto_regression_shift = 6; film_grain_params.grain_seed = 51968; int8_t u_grain[73 * 82]; int8_t v_grain[73 * 82]; const int chroma_width = 44; const int chroma_height = 38; // Initialize u_grain and v_grain with arbitrary nonzero values. memset(u_grain, 1, sizeof(u_grain)); memset(v_grain, 2, sizeof(v_grain)); for (int y = 0; y < chroma_height; ++y) { for (int x = 0; x < chroma_width; ++x) { EXPECT_NE(u_grain[y * chroma_width + x], 0); EXPECT_NE(v_grain[y * chroma_width + x], 0); } } FilmGrain<8>::GenerateChromaGrains(film_grain_params, chroma_width, chroma_height, u_grain, v_grain); for (int y = 0; y < chroma_height; ++y) { for (int x = 0; x < chroma_width; ++x) { EXPECT_EQ(u_grain[y * chroma_width + x], 0); EXPECT_EQ(v_grain[y * chroma_width + x], 0); } } } // First parameter is coefficient lag. Second parameter is the index into // |kFilmGrainParams|. template class AutoRegressionTestLuma : public testing::TestWithParam> { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; AutoRegressionTestLuma() { FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); const int index = std::get<0>(GetParam()) - 1; base_luma_auto_regression_func_ = dsp->film_grain.luma_auto_regression[index]; const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "C/")) { base_luma_auto_regression_func_ = nullptr; } else if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } luma_auto_regression_func_ = dsp->film_grain.luma_auto_regression[index]; } protected: // |compare| determines whether to compare the output blocks from the SIMD // implementation, if used, and the C implementation. // |saturate| determines whether to set the inputs to maximum values. This is // intended primarily as a way to simplify differences in output when // debugging. void TestAutoRegressiveFilterLuma(int coeff_lag, int param_index, int num_runs, bool saturate, bool compare); LumaAutoRegressionFunc luma_auto_regression_func_; LumaAutoRegressionFunc base_luma_auto_regression_func_; GrainType luma_block_buffer_[kLumaBlockSize]; GrainType base_luma_block_buffer_[kLumaBlockSize]; }; // First parameter is coefficient lag. Second parameter is the index into // |kFilmGrainParams|. template void AutoRegressionTestLuma::TestAutoRegressiveFilterLuma( int coeff_lag, int param_index, int num_runs, bool saturate, bool compare) { if (luma_auto_regression_func_ == nullptr) return; // Compare is only needed for NEON tests to compare with C output. if (base_luma_auto_regression_func_ == nullptr && compare) return; FilmGrainParams params = kFilmGrainParams[param_index]; params.auto_regression_coeff_lag = coeff_lag; const int grain_max = GetGrainMax(); for (int y = 0; y < kLumaHeight; ++y) { for (int x = 0; x < kLumaWidth; ++x) { if (saturate) { luma_block_buffer_[y * kLumaWidth + x] = grain_max; } else { luma_block_buffer_[y * kLumaWidth + x] = std::min(x - (kLumaWidth >> 1), y - (kLumaHeight >> 1)) * (1 << (bitdepth - 8)); } } } if (saturate) { memset(params.auto_regression_coeff_y, 127, sizeof(params.auto_regression_coeff_y)); } if (compare) { memcpy(base_luma_block_buffer_, luma_block_buffer_, sizeof(luma_block_buffer_)); } const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { luma_auto_regression_func_(params, luma_block_buffer_); } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs > 1) { printf("AutoRegressionLuma lag=%d, param_index=%d: %d us\n", coeff_lag, param_index, static_cast(absl::ToInt64Microseconds(elapsed_time))); return; } if (compare) { base_luma_auto_regression_func_(params, base_luma_block_buffer_); EXPECT_TRUE(test_utils::CompareBlocks( luma_block_buffer_, base_luma_block_buffer_, kLumaWidth, kLumaHeight, kLumaWidth, kLumaWidth, false)); } else { test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("AutoRegressionLuma lag=%d, param_index=%d", coeff_lag, param_index) .c_str(), GetARTestDigestLuma(bitdepth, coeff_lag, param_index), luma_block_buffer_, sizeof(luma_block_buffer_), elapsed_time); } } using AutoRegressionTestLuma8bpp = AutoRegressionTestLuma<8>; TEST_P(AutoRegressionTestLuma8bpp, AutoRegressiveFilterLuma) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestLuma8bpp, AutoRegressiveFilterLumaSaturated) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestLuma8bpp, DISABLED_Speed) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1e5, /*saturate=*/false, /*compare=*/false); } #if LIBGAV1_MAX_BITDEPTH >= 10 using AutoRegressionTestLuma10bpp = AutoRegressionTestLuma<10>; TEST_P(AutoRegressionTestLuma10bpp, AutoRegressiveFilterLuma) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestLuma10bpp, AutoRegressiveFilterLumaSaturated) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestLuma10bpp, DISABLED_Speed) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1e5, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using AutoRegressionTestLuma12bpp = AutoRegressionTestLuma<12>; TEST_P(AutoRegressionTestLuma12bpp, AutoRegressiveFilterLuma) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestLuma12bpp, AutoRegressiveFilterLumaSaturated) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestLuma12bpp, DISABLED_Speed) { TestAutoRegressiveFilterLuma(std::get<0>(GetParam()), std::get<1>(GetParam()), 1e5, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P( C, AutoRegressionTestLuma8bpp, testing::Combine(testing::Range(1, 4) /* coeff_lag */, testing::Range(0, 10) /* param_index */)); #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P( NEON, AutoRegressionTestLuma8bpp, testing::Combine(testing::Range(1, 4) /* coeff_lag */, testing::Range(0, 10) /* param_index */)); #endif #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P( C, AutoRegressionTestLuma10bpp, testing::Combine(testing::Range(1, 4) /* coeff_lag */, testing::Range(0, 10) /* param_index */)); #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P( NEON, AutoRegressionTestLuma10bpp, testing::Combine(testing::Range(1, 4) /* coeff_lag */, testing::Range(0, 10) /* param_index */)); #endif #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P( C, AutoRegressionTestLuma12bpp, testing::Combine(testing::Range(1, 4) /* coeff_lag */, testing::Range(0, 10) /* param_index */)); #endif // LIBGAV1_MAX_BITDEPTH == 12 struct AutoRegressionChromaTestParam { explicit AutoRegressionChromaTestParam(const std::tuple& in) : coeff_lag(std::get<0>(in)) { switch (std::get<1>(in)) { case 0: subsampling_x = 0; subsampling_y = 0; break; case 1: subsampling_x = 1; subsampling_y = 0; break; default: assert(std::get<1>(in) == 2); subsampling_x = 1; subsampling_y = 1; } } const int coeff_lag; int subsampling_x; int subsampling_y; }; template class AutoRegressionTestChroma : public testing::TestWithParam> { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; AutoRegressionTestChroma() { AutoRegressionChromaTestParam test_param(GetParam()); FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); // This test suite does not cover num_y_points == 0. This should be covered // in the test of the full synthesis process. base_chroma_auto_regression_func_ = dsp->film_grain.chroma_auto_regression[1][test_param.coeff_lag]; const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "C/")) { base_chroma_auto_regression_func_ = nullptr; } else if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } chroma_auto_regression_func_ = dsp->film_grain.chroma_auto_regression[1][test_param.coeff_lag]; } ~AutoRegressionTestChroma() override = default; protected: // |compare| determines whether to compare the output blocks from the SIMD // implementation, if used, and the C implementation. // |saturate| determines whether to set the inputs to maximum values. This is // intended primarily as a way to simplify differences in output when // debugging. void TestAutoRegressiveFilterChroma(int coeff_lag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare); ChromaAutoRegressionFunc chroma_auto_regression_func_; ChromaAutoRegressionFunc base_chroma_auto_regression_func_; GrainType luma_block_buffer_[kLumaBlockSize]; GrainType u_block_buffer_[kChromaBlockSize]; GrainType v_block_buffer_[kChromaBlockSize]; GrainType base_u_block_buffer_[kChromaBlockSize]; GrainType base_v_block_buffer_[kChromaBlockSize]; }; template void AutoRegressionTestChroma::TestAutoRegressiveFilterChroma( int coeff_lag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare) { if (chroma_auto_regression_func_ == nullptr) return; // Compare is only needed for NEON tests to compare with C output. if (base_chroma_auto_regression_func_ == nullptr && compare) return; // This function relies on the first set of sampled params for basics. The // test param generators are used for coverage. FilmGrainParams params = kFilmGrainParams[0]; params.auto_regression_coeff_lag = coeff_lag; const int grain_max = GetGrainMax(); const int grain_min = GetGrainMin(); const int chroma_width = (subsampling_x != 0) ? kMinChromaWidth : kMaxChromaWidth; const int chroma_height = (subsampling_y != 0) ? kMinChromaHeight : kMaxChromaHeight; if (saturate) { memset(params.auto_regression_coeff_u, 127, sizeof(params.auto_regression_coeff_u)); memset(params.auto_regression_coeff_v, 127, sizeof(params.auto_regression_coeff_v)); for (int y = 0; y < kLumaHeight; ++y) { for (int x = 0; x < kLumaWidth; ++x) { // This loop relies on the fact that kMaxChromaWidth == kLumaWidth. luma_block_buffer_[y * kLumaWidth + x] = grain_max; u_block_buffer_[y * kLumaWidth + x] = grain_max; v_block_buffer_[y * kLumaWidth + x] = grain_max; } } } else { libvpx_test::ACMRandom rnd(libvpx_test::ACMRandom::DeterministicSeed()); // Allow any valid grain values. const int random_range = grain_max - grain_min + 1; for (int y = 0; y < kLumaHeight; ++y) { for (int x = 0; x < kLumaWidth; ++x) { // This loop relies on the fact that kMaxChromaWidth == kLumaWidth. const int random_y = rnd(random_range); luma_block_buffer_[y * kLumaWidth + x] = random_y + grain_min; const int random_u = rnd(random_range); u_block_buffer_[y * kLumaWidth + x] = random_u + grain_min; const int random_v = rnd(random_range); v_block_buffer_[y * kLumaWidth + x] = random_v + grain_min; } } } if (compare) { memcpy(base_u_block_buffer_, u_block_buffer_, sizeof(u_block_buffer_)); memcpy(base_v_block_buffer_, v_block_buffer_, sizeof(v_block_buffer_)); } const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { chroma_auto_regression_func_(params, luma_block_buffer_, subsampling_x, subsampling_y, u_block_buffer_, v_block_buffer_); } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs > 1) { printf("AutoRegressionChroma lag=%d, sub_x=%d, sub_y=%d: %d us\n", coeff_lag, subsampling_x, subsampling_y, static_cast(absl::ToInt64Microseconds(elapsed_time))); return; } if (compare) { base_chroma_auto_regression_func_(params, luma_block_buffer_, subsampling_x, subsampling_y, base_u_block_buffer_, base_v_block_buffer_); EXPECT_TRUE(test_utils::CompareBlocks(u_block_buffer_, base_u_block_buffer_, chroma_width, chroma_height, chroma_width, chroma_width, false)); EXPECT_TRUE(test_utils::CompareBlocks(v_block_buffer_, base_v_block_buffer_, chroma_width, chroma_height, chroma_width, chroma_width, false)); } else { test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("AutoRegressionChromaU lag=%d, sub_x=%d, sub_y=%d", coeff_lag, subsampling_x, subsampling_y) .c_str(), GetARTestDigestChromaU(bitdepth, coeff_lag, subsampling_x, subsampling_y), u_block_buffer_, sizeof(u_block_buffer_), elapsed_time); test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("AutoRegressionChromaV lag=%d, sub_x=%d, sub_y=%d", coeff_lag, subsampling_x, subsampling_y) .c_str(), GetARTestDigestChromaV(bitdepth, coeff_lag, subsampling_x, subsampling_y), v_block_buffer_, sizeof(v_block_buffer_), elapsed_time); } } using AutoRegressionTestChroma8bpp = AutoRegressionTestChroma<8>; TEST_P(AutoRegressionTestChroma8bpp, AutoRegressiveFilterChroma) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestChroma8bpp, AutoRegressiveFilterChromaSaturated) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestChroma8bpp, DISABLED_Speed) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma( test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, // Subsampling cuts each dimension of the chroma blocks in half, so run // twice as many times to compensate. 1e5 * (1 << (test_param.subsampling_y + test_param.subsampling_x)), /*saturate=*/false, /*compare=*/false); } #if LIBGAV1_MAX_BITDEPTH >= 10 using AutoRegressionTestChroma10bpp = AutoRegressionTestChroma<10>; TEST_P(AutoRegressionTestChroma10bpp, AutoRegressiveFilterChroma) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestChroma10bpp, AutoRegressiveFilterChromaSaturated) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestChroma10bpp, DISABLED_Speed) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma( test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, // Subsampling cuts each dimension of the chroma blocks in half, so run // twice as many times to compensate. 1e5 * (1 << (test_param.subsampling_y + test_param.subsampling_x)), /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using AutoRegressionTestChroma12bpp = AutoRegressionTestChroma<12>; TEST_P(AutoRegressionTestChroma12bpp, AutoRegressiveFilterChroma) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/false, /*compare=*/false); } TEST_P(AutoRegressionTestChroma12bpp, AutoRegressiveFilterChromaSaturated) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma(test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, 1, /*saturate=*/true, /*compare=*/true); } TEST_P(AutoRegressionTestChroma12bpp, DISABLED_Speed) { AutoRegressionChromaTestParam test_param(GetParam()); TestAutoRegressiveFilterChroma( test_param.coeff_lag, test_param.subsampling_x, test_param.subsampling_y, // Subsampling cuts each dimension of the chroma blocks in half, so run // twice as many times to compensate. 1e5 * (1 << (test_param.subsampling_y + test_param.subsampling_x)), /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, AutoRegressionTestChroma8bpp, testing::Combine(testing::Range(0, 4) /* coeff_lag */, testing::Range(0, 3) /* subsampling */)); #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(C, AutoRegressionTestChroma10bpp, testing::Combine(testing::Range(0, 4) /* coeff_lag */, testing::Range(0, 3) /* subsampling */)); #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, AutoRegressionTestChroma12bpp, testing::Combine(testing::Range(0, 4) /* coeff_lag */, testing::Range(0, 3) /* subsampling */)); #endif // LIBGAV1_MAX_BITDEPTH == 12 #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, AutoRegressionTestChroma8bpp, testing::Combine(testing::Range(0, 4) /* coeff_lag */, testing::Range(0, 3) /* subsampling */)); #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(NEON, AutoRegressionTestChroma10bpp, testing::Combine(testing::Range(0, 4) /* coeff_lag */, testing::Range(0, 3) /* subsampling */)); #endif // LIBGAV1_MAX_BITDEPTH >= 10 #endif // LIBGAV1_ENABLE_NEON template class GrainGenerationTest : public testing::TestWithParam { protected: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; void TestGenerateGrainLuma(int param_index, int num_runs); GrainType luma_block_buffer_[kLumaBlockSize]; }; template void GrainGenerationTest::TestGenerateGrainLuma(int param_index, int num_runs) { FilmGrainParams params = kFilmGrainParams[param_index]; const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { FilmGrain::GenerateLumaGrain(params, luma_block_buffer_); } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs == 1) { test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("GenerateGrainLuma param_index=%d", param_index) .c_str(), GetGrainGenerationTestDigestLuma(bitdepth, param_index), luma_block_buffer_, sizeof(luma_block_buffer_), elapsed_time); } else { printf("GenerateGrainLuma param_index=%d: %d us\n", param_index, static_cast(absl::ToInt64Microseconds(elapsed_time))); } } using GrainGenerationTest8bpp = GrainGenerationTest<8>; TEST_P(GrainGenerationTest8bpp, GenerateGrainLuma) { TestGenerateGrainLuma(GetParam(), 1); } TEST_P(GrainGenerationTest8bpp, DISABLED_LumaSpeed) { TestGenerateGrainLuma(GetParam(), 1e5); } #if LIBGAV1_MAX_BITDEPTH >= 10 using GrainGenerationTest10bpp = GrainGenerationTest<10>; TEST_P(GrainGenerationTest10bpp, GenerateGrainLuma) { TestGenerateGrainLuma(GetParam(), 1); } TEST_P(GrainGenerationTest10bpp, DISABLED_LumaSpeed) { TestGenerateGrainLuma(GetParam(), 1e5); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using GrainGenerationTest12bpp = GrainGenerationTest<12>; TEST_P(GrainGenerationTest12bpp, GenerateGrainLuma) { TestGenerateGrainLuma(GetParam(), 1); } TEST_P(GrainGenerationTest12bpp, DISABLED_LumaSpeed) { TestGenerateGrainLuma(GetParam(), 1e5); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, GrainGenerationTest8bpp, testing::Range(0, 10) /* param_index */); #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(C, GrainGenerationTest10bpp, testing::Range(0, 10) /* param_index */); #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, GrainGenerationTest12bpp, testing::Range(0, 10) /* param_index */); #endif // LIBGAV1_MAX_BITDEPTH == 12 // This param type is used for both ConstructStripesTest and // ConstructImageTest. struct ConstructNoiseTestParam { explicit ConstructNoiseTestParam(const std::tuple& in) : overlap_flag(std::get<0>(in)) { switch (std::get<1>(in)) { case 0: subsampling_x = 0; subsampling_y = 0; break; case 1: subsampling_x = 1; subsampling_y = 0; break; default: assert(std::get<1>(in) == 2); subsampling_x = 1; subsampling_y = 1; } } const int overlap_flag; int subsampling_x; int subsampling_y; }; template class ConstructStripesTest : public testing::TestWithParam> { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; ConstructStripesTest() { FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); base_construct_noise_stripes_func_ = dsp->film_grain.construct_noise_stripes[std::get<0>(GetParam())]; const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "C/")) { base_construct_noise_stripes_func_ = nullptr; } else if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } construct_noise_stripes_func_ = dsp->film_grain.construct_noise_stripes[std::get<0>(GetParam())]; } ~ConstructStripesTest() override = default; protected: // |compare| determines whether to compare the output blocks from the SIMD // implementation, if used, and the C implementation. // |saturate| determines whether to set the inputs to maximum values. This is // intended primarily as a way to simplify differences in output when // debugging. void TestConstructNoiseStripes(int overlap_flag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare); ConstructNoiseStripesFunc construct_noise_stripes_func_; ConstructNoiseStripesFunc base_construct_noise_stripes_func_; GrainType grain_buffer_[kLumaBlockSize]; Array2DView noise_stripes_; // Owns the memory that noise_stripes_ points to. std::unique_ptr stripe_buffer_; Array2DView base_noise_stripes_; // Owns the memory that base_stripe_buffer_ points to. std::unique_ptr base_stripe_buffer_; }; template void ConstructStripesTest::TestConstructNoiseStripes( int overlap_flag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare) { if (construct_noise_stripes_func_ == nullptr) return; // Compare is only needed for NEON tests to compare with C output. if (base_construct_noise_stripes_func_ == nullptr && compare) return; const int stripe_width = ((kFrameWidth + subsampling_x) >> subsampling_x); const int stripe_height = kNoiseStripeHeight; const int stripe_size = stripe_height * stripe_width; const int stripe_buffer_size = stripe_size * kNumTestStripes; if (compare) { base_stripe_buffer_.reset(new ( std::nothrow) GrainType[stripe_buffer_size + kNoiseStripePadding]()); ASSERT_NE(base_stripe_buffer_, nullptr); base_noise_stripes_.Reset(kNumTestStripes, stripe_size, base_stripe_buffer_.get()); } stripe_buffer_.reset( new (std::nothrow) GrainType[stripe_buffer_size + kNoiseStripePadding]()); ASSERT_NE(stripe_buffer_, nullptr); noise_stripes_.Reset(kNumTestStripes, stripe_size, stripe_buffer_.get()); const int grain_max = GetGrainMax(); const int grain_min = GetGrainMin(); if (saturate) { for (int y = 0; y < kLumaHeight; ++y) { for (int x = 0; x < kLumaWidth; ++x) { grain_buffer_[y * kLumaWidth + x] = grain_max; } } } else { libvpx_test::ACMRandom rnd(libvpx_test::ACMRandom::DeterministicSeed()); // Allow any valid grain values. const int random_range = grain_max - grain_min + 1; for (int y = 0; y < kLumaHeight; ++y) { for (int x = 0; x < kLumaWidth; ++x) { grain_buffer_[y * kLumaWidth + x] = grain_min + rnd(random_range); } } } const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { construct_noise_stripes_func_(grain_buffer_, 68, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, &noise_stripes_); } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs > 1) { printf( "ConstructNoiseStripes Speed Test for overlap=%d, sub_x=%d, " "sub_y=%d: %d us\n", overlap_flag, subsampling_x, subsampling_y, static_cast(absl::ToInt64Microseconds(elapsed_time))); return; } if (compare) { base_construct_noise_stripes_func_(grain_buffer_, 68, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, &base_noise_stripes_); constexpr int kCompareWidth = 64; for (int stripe = 0; stripe < kNumTestStripes;) { EXPECT_TRUE(test_utils::CompareBlocks( noise_stripes_[stripe], base_noise_stripes_[stripe], kCompareWidth, stripe_height, stripe_width, stripe_width, /*check_padding=*/false, /*print_diff=*/false)); } } else { test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("ConstructNoiseStripes overlap=%d, sub_x=%d, sub_y=%d", overlap_flag, subsampling_x, subsampling_y) .c_str(), GetConstructStripesTestDigest(bitdepth, overlap_flag, subsampling_x, subsampling_y), noise_stripes_[0], stripe_buffer_size, elapsed_time); } } using ConstructStripesTest8bpp = ConstructStripesTest<8>; TEST_P(ConstructStripesTest8bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructStripesTest8bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructStripesTest8bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #if LIBGAV1_MAX_BITDEPTH >= 10 using ConstructStripesTest10bpp = ConstructStripesTest<10>; TEST_P(ConstructStripesTest10bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructStripesTest10bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructStripesTest10bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using ConstructStripesTest12bpp = ConstructStripesTest<12>; TEST_P(ConstructStripesTest12bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructStripesTest12bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructStripesTest12bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseStripes(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ConstructStripesTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(C, ConstructStripesTest10bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ConstructStripesTest12bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_MAX_BITDEPTH == 12 template class ConstructImageTest : public testing::TestWithParam> { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; ConstructImageTest() { FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); base_construct_noise_image_overlap_func_ = dsp->film_grain.construct_noise_image_overlap; const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "C/")) { base_construct_noise_image_overlap_func_ = nullptr; } else if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } construct_noise_image_overlap_func_ = dsp->film_grain.construct_noise_image_overlap; } ~ConstructImageTest() override = default; protected: // |compare| determines whether to compare the output blocks from the SIMD // implementation, if used, and the C implementation. // |saturate| determines whether to set the inputs to maximum values. This is // intended primarily as a way to simplify differences in output when // debugging. void TestConstructNoiseImage(int overlap_flag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare); ConstructNoiseImageOverlapFunc construct_noise_image_overlap_func_; ConstructNoiseImageOverlapFunc base_construct_noise_image_overlap_func_; Array2DView noise_stripes_; // Owns the memory that noise_stripes_ points to. std::unique_ptr stripe_buffer_; Array2D noise_image_; Array2D base_noise_image_; }; template void ConstructImageTest::TestConstructNoiseImage( int overlap_flag, int subsampling_x, int subsampling_y, int num_runs, bool saturate, bool compare) { if (construct_noise_image_overlap_func_ == nullptr) return; // Compare is only needed for NEON tests to compare with C output. if (base_construct_noise_image_overlap_func_ == nullptr && compare) return; const int image_width = ((kFrameWidth + subsampling_x) >> subsampling_x); const int image_height = ((kFrameHeight + subsampling_y) >> subsampling_y); const int stripe_height = ((kNoiseStripeHeight + subsampling_y) >> subsampling_y); const int image_stride = image_width + kNoiseImagePadding; const int stripe_size = stripe_height * image_width; if (compare) { ASSERT_TRUE(base_noise_image_.Reset(image_height, image_stride, /*zero_initialize=*/false)); } ASSERT_TRUE(noise_image_.Reset(image_height, image_stride, /*zero_initialize=*/false)); // Stride between stripe rows is |image_width|. Padding is only at the // end of the final row of the final stripe to protect from overreads. stripe_buffer_.reset( new (std::nothrow) GrainType[kNumTestStripes * stripe_size + kNoiseStripePadding]); ASSERT_NE(stripe_buffer_, nullptr); noise_stripes_.Reset(kNumTestStripes, stripe_size, stripe_buffer_.get()); const int grain_max = GetGrainMax(); const int grain_min = GetGrainMin(); if (saturate) { for (int i = 0; i < stripe_size; ++i) { noise_stripes_[0][i] = grain_max; } for (int stripe = 1; stripe < kNumTestStripes; ++stripe) { memcpy(noise_stripes_[stripe], noise_stripes_[0], stripe_size * sizeof(noise_stripes_[0][0])); } } else { libvpx_test::ACMRandom rnd(libvpx_test::ACMRandom::DeterministicSeed()); // Allow any valid grain values. const int random_range = grain_max - grain_min + 1; for (int stripe = 0; stripe < kNumTestStripes; ++stripe) { // Assign all allocated memory for this stripe. for (int i = 0; i < stripe_height; ++i) { for (int x = 0; x < image_width; ++x) { noise_stripes_[stripe][i * image_width + x] = grain_min + rnd(random_range); } } } } const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { FilmGrain::ConstructNoiseImage( &noise_stripes_, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, overlap_flag << (1 - subsampling_y), &noise_image_); if (overlap_flag == 1) { construct_noise_image_overlap_func_(&noise_stripes_, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, &noise_image_); } } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs > 1) { printf( "ConstructNoiseImage Speed Test for overlap=%d, sub_x=%d, " "sub_y=%d: %d us\n", overlap_flag, subsampling_x, subsampling_y, static_cast(absl::ToInt64Microseconds(elapsed_time))); return; } if (compare) { FilmGrain::ConstructNoiseImage( &noise_stripes_, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, overlap_flag << (1 - subsampling_y), &base_noise_image_); if (overlap_flag == 1) { base_construct_noise_image_overlap_func_( &noise_stripes_, kFrameWidth, kFrameHeight, subsampling_x, subsampling_y, &base_noise_image_); } constexpr int kCompareWidth = 72; constexpr int kCompareHeight = 72; EXPECT_TRUE(test_utils::CompareBlocks( noise_image_[0], base_noise_image_[0], kCompareWidth, kCompareHeight, image_stride, image_stride, /*check_padding=*/false, /*print_diff=*/false)); } else { printf("BD%d \"%s\",\n", bitdepth, test_utils::GetMd5Sum(noise_image_[0], image_width, image_height, image_stride) .c_str()); test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("ConstructNoiseImage overlap=%d, sub_x=%d, sub_y=%d", overlap_flag, subsampling_x, subsampling_y) .c_str(), GetConstructImageTestDigest(bitdepth, overlap_flag, subsampling_x, subsampling_y), noise_image_[0], image_width, image_height, image_stride, elapsed_time); } } using ConstructImageTest8bpp = ConstructImageTest<8>; TEST_P(ConstructImageTest8bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructImageTest8bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructImageTest8bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #if LIBGAV1_MAX_BITDEPTH >= 10 using ConstructImageTest10bpp = ConstructImageTest<10>; TEST_P(ConstructImageTest10bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructImageTest10bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructImageTest10bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using ConstructImageTest12bpp = ConstructImageTest<12>; TEST_P(ConstructImageTest12bpp, RandomValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/false, /*compare=*/false); } TEST_P(ConstructImageTest12bpp, SaturatedValues) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/1, /*saturate=*/true, /*compare=*/true); } TEST_P(ConstructImageTest12bpp, DISABLED_Speed) { ConstructNoiseTestParam test_params(GetParam()); TestConstructNoiseImage(test_params.overlap_flag, test_params.subsampling_x, test_params.subsampling_y, /*num_runs=*/500, /*saturate=*/false, /*compare=*/false); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ConstructImageTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, ConstructImageTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_ENABLE_NEON #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(C, ConstructImageTest10bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ConstructImageTest12bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_MAX_BITDEPTH == 12 template class ScalingLookupTableTest : public testing::TestWithParam { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); ScalingLookupTableTest() { test_utils::ResetDspTable(bitdepth); FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } initialize_func_ = dsp->film_grain.initialize_scaling_lut; } ~ScalingLookupTableTest() override = default; protected: void TestSpeed(int num_runs); void ZeroPoints(); private: static constexpr int kScalingLutBufferLength = (kScalingLookupTableSize + kScalingLookupTablePadding) << (bitdepth - 8); dsp::InitializeScalingLutFunc initialize_func_; int16_t scaling_lut_[kScalingLutBufferLength]; }; template void ScalingLookupTableTest::TestSpeed(int num_runs) { if (initialize_func_ == nullptr) return; const int param_index = GetParam(); const FilmGrainParams& params = kFilmGrainParams[param_index]; const absl::Time start = absl::Now(); Memset(scaling_lut_, 0, kScalingLutBufferLength); for (int i = 0; i < num_runs; ++i) { initialize_func_(params.num_y_points, params.point_y_value, params.point_y_scaling, scaling_lut_, kScalingLutBufferLength); } const absl::Duration elapsed_time = absl::Now() - start; if (num_runs > 1) { printf("InitializeScalingLut: %d us\n", static_cast(absl::ToInt64Microseconds(elapsed_time))); return; } test_utils::CheckMd5Digest( "FilmGrain", absl::StrFormat("InitializeScalingLut for param set: %d", param_index) .c_str(), GetScalingInitTestDigest(param_index, bitdepth), scaling_lut_, (sizeof(scaling_lut_[0]) * kScalingLookupTableSize) << (bitdepth - 8), elapsed_time); } template void ScalingLookupTableTest::ZeroPoints() { if (initialize_func_ == nullptr) return; const int param_index = GetParam(); const FilmGrainParams& params = kFilmGrainParams[param_index]; initialize_func_(0, params.point_y_value, params.point_y_scaling, scaling_lut_, kScalingLookupTableSize); for (int i = 0; i < kScalingLookupTableSize; ++i) { ASSERT_EQ(scaling_lut_[i], 0); } } using ScalingLookupTableTest8bpp = ScalingLookupTableTest<8>; TEST_P(ScalingLookupTableTest8bpp, ZeroPoints) { ZeroPoints(); } TEST_P(ScalingLookupTableTest8bpp, Correctness) { TestSpeed(/*num_runs=*/1); } TEST_P(ScalingLookupTableTest8bpp, DISABLED_Speed) { TestSpeed(/*num_runs=*/1e5); } #if LIBGAV1_MAX_BITDEPTH >= 10 using ScalingLookupTableTest10bpp = ScalingLookupTableTest<10>; TEST_P(ScalingLookupTableTest10bpp, ZeroPoints) { ZeroPoints(); } TEST_P(ScalingLookupTableTest10bpp, Correctness) { TestSpeed(/*num_runs=*/1); } TEST_P(ScalingLookupTableTest10bpp, DISABLED_Speed) { TestSpeed(/*num_runs=*/1e5); } #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using ScalingLookupTableTest12bpp = ScalingLookupTableTest<12>; TEST_P(ScalingLookupTableTest12bpp, ZeroPoints) { ZeroPoints(); } TEST_P(ScalingLookupTableTest12bpp, Correctness) { TestSpeed(/*num_runs=*/1); } TEST_P(ScalingLookupTableTest12bpp, DISABLED_Speed) { TestSpeed(/*num_runs=*/1e5); } #endif // LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ScalingLookupTableTest8bpp, testing::Range(0, kNumFilmGrainTestParams)); #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, ScalingLookupTableTest8bpp, testing::Range(0, kNumFilmGrainTestParams)); #endif #if LIBGAV1_MAX_BITDEPTH >= 10 INSTANTIATE_TEST_SUITE_P(C, ScalingLookupTableTest10bpp, testing::Range(0, kNumFilmGrainTestParams)); #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, ScalingLookupTableTest10bpp, testing::Range(0, kNumFilmGrainTestParams)); #endif #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 INSTANTIATE_TEST_SUITE_P(C, ScalingLookupTableTest12bpp, testing::Range(0, kNumFilmGrainTestParams)); #endif // LIBGAV1_MAX_BITDEPTH == 12 struct BlendNoiseTestParam { explicit BlendNoiseTestParam(const std::tuple& in) : chroma_scaling_from_luma(std::get<0>(in)) { switch (std::get<1>(in)) { case 0: subsampling_x = 0; subsampling_y = 0; break; case 1: subsampling_x = 1; subsampling_y = 0; break; default: assert(std::get<1>(in) == 2); subsampling_x = 1; subsampling_y = 1; } } const int chroma_scaling_from_luma; int subsampling_x; int subsampling_y; }; template class BlendNoiseTest : public testing::TestWithParam> { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); using GrainType = typename std::conditional::type; ~BlendNoiseTest() override = default; protected: void SetUp() override { test_utils::ResetDspTable(bitdepth); FilmGrainInit_C(); const dsp::Dsp* const dsp = dsp::GetDspTable(bitdepth); const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } else if (absl::StartsWith(test_case, "SSE41/")) { if ((GetCpuInfo() & kSSE4_1) == 0) GTEST_SKIP() << "No SSE4.1 support!"; FilmGrainInit_SSE4_1(); } const BlendNoiseTestParam test_param(GetParam()); chroma_scaling_from_luma_ = test_param.chroma_scaling_from_luma; blend_luma_func_ = dsp->film_grain.blend_noise_luma; blend_chroma_func_ = dsp->film_grain.blend_noise_chroma[chroma_scaling_from_luma_]; subsampling_x_ = test_param.subsampling_x; subsampling_y_ = test_param.subsampling_y; uv_width_ = (width_ + subsampling_x_) >> subsampling_x_; uv_height_ = (height_ + subsampling_y_) >> subsampling_y_; uv_stride_ = uv_width_ * sizeof(Pixel); y_stride_ = width_ * sizeof(Pixel); const size_t buffer_size = sizeof(Pixel) * (width_ * height_ + 2 * uv_width_ * uv_height_ + 3 * kBorderPixelsFilmGrain); source_buffer_.reset(new (std::nothrow) uint8_t[buffer_size]); memset(source_buffer_.get(), 0, sizeof(source_buffer_[0]) * buffer_size); dest_buffer_.reset(new (std::nothrow) uint8_t[buffer_size]); memset(dest_buffer_.get(), 0, sizeof(dest_buffer_[0]) * buffer_size); source_plane_y_ = source_buffer_.get(); source_plane_u_ = source_plane_y_ + y_stride_ * height_ + kBorderPixelsFilmGrain; source_plane_v_ = source_plane_u_ + uv_stride_ * uv_height_ + kBorderPixelsFilmGrain; dest_plane_y_ = dest_buffer_.get(); dest_plane_u_ = dest_plane_y_ + y_stride_ * height_ + kBorderPixelsFilmGrain; dest_plane_v_ = dest_plane_u_ + uv_stride_ * uv_height_ + kBorderPixelsFilmGrain; } void TestSpeed(int num_runs); private: static constexpr int kScalingLutBufferLength = (kScalingLookupTableSize + kScalingLookupTablePadding) << 2; void ConvertScalingLut10bpp(int16_t* scaling_lut_10bpp, const int16_t* src_scaling_lut); dsp::BlendNoiseWithImageLumaFunc blend_luma_func_; dsp::BlendNoiseWithImageChromaFunc blend_chroma_func_; const int width_ = 1921; const int height_ = 1081; int chroma_scaling_from_luma_ = 0; int subsampling_x_ = 0; int subsampling_y_ = 0; int uv_width_ = 0; int uv_height_ = 0; int uv_stride_ = 0; int y_stride_ = 0; // This holds the data that |source_plane_y_|, |source_plane_u_|, and // |source_plane_v_| point to. std::unique_ptr source_buffer_; // This holds the data that |dest_plane_y_|, |dest_plane_u_|, and // |dest_plane_v_| point to. std::unique_ptr dest_buffer_; uint8_t* source_plane_y_ = nullptr; uint8_t* source_plane_u_ = nullptr; uint8_t* source_plane_v_ = nullptr; uint8_t* dest_plane_y_ = nullptr; uint8_t* dest_plane_u_ = nullptr; uint8_t* dest_plane_v_ = nullptr; Array2D noise_image_[kMaxPlanes]; int16_t scaling_lut_10bpp_y_[kScalingLutBufferLength]; int16_t scaling_lut_10bpp_u_[kScalingLutBufferLength]; int16_t scaling_lut_10bpp_v_[kScalingLutBufferLength]; }; template void BlendNoiseTest::ConvertScalingLut10bpp( int16_t* scaling_lut_10bpp, const int16_t* src_scaling_lut) { for (int i = 0; i < kScalingLookupTableSize - 1; ++i) { const int x_base = i << 2; const int start = src_scaling_lut[i]; const int end_index = std::min(i + 1, kScalingLookupTableSize - 1); const int end = src_scaling_lut[end_index]; const int delta = end - start; scaling_lut_10bpp[x_base] = start; scaling_lut_10bpp[x_base + 1] = start + RightShiftWithRounding(delta, 2); scaling_lut_10bpp[x_base + 2] = start + RightShiftWithRounding(2 * delta, 2); scaling_lut_10bpp[x_base + 3] = start + RightShiftWithRounding(3 * delta, 2); } } template void BlendNoiseTest::TestSpeed(const int num_runs) { if (blend_chroma_func_ == nullptr || blend_luma_func_ == nullptr) return; // Allow optimized code to read into the border without generating MSan // warnings. This matches the behavior in FilmGrain::AllocateNoiseImage(). constexpr bool zero_initialize = LIBGAV1_MSAN == 1; ASSERT_TRUE(noise_image_[kPlaneY].Reset(height_, width_ + kNoiseImagePadding, zero_initialize)); ASSERT_TRUE(noise_image_[kPlaneU].Reset( uv_height_, uv_width_ + kNoiseImagePadding, zero_initialize)); ASSERT_TRUE(noise_image_[kPlaneV].Reset( uv_height_, uv_width_ + kNoiseImagePadding, zero_initialize)); libvpx_test::ACMRandom rnd(libvpx_test::ACMRandom::DeterministicSeed()); // Allow any valid grain values. const int grain_max = GetGrainMax(); const int grain_min = GetGrainMin(); const int random_range = grain_max - grain_min + 1; auto* src_y = reinterpret_cast(source_plane_y_); auto* src_u = reinterpret_cast(source_plane_u_); auto* src_v = reinterpret_cast(source_plane_v_); for (int y = 0; y < height_; ++y) { for (int x = 0; x < width_; ++x) { const int random_source_y = rnd(random_range); // Populating the luma source ensures the lookup table is tested. Chroma // planes are given identical values. Giving them different values would // artificially differentiate the outputs. It's important that the test // expect that different outputs are caused by the different scaling // lookup tables, rather than by different inputs. const int uv_y_pos = y >> subsampling_y_; const int uv_x_pos = x >> subsampling_x_; src_y[y * width_ + x] = random_source_y; src_u[uv_y_pos * uv_width_ + uv_x_pos] = random_source_y; src_v[uv_y_pos * uv_width_ + uv_x_pos] = random_source_y; const int random_y = rnd(random_range); noise_image_[kPlaneY][y][x] = random_y + grain_min; const int random_u = rnd(random_range); noise_image_[kPlaneU][uv_y_pos][uv_x_pos] = random_u + grain_min; const int random_v = rnd(random_range); noise_image_[kPlaneV][uv_y_pos][uv_x_pos] = random_v + grain_min; } } static constexpr int16_t kTestScalingLutY[kScalingLookupTableSize] = { 72, 72, 72, 72, 72, 72, 72, 72, 72, 72, 72, 72, 72, 72, 73, 75, 76, 77, 79, 80, 81, 83, 84, 86, 87, 88, 90, 91, 92, 92, 93, 93, 94, 95, 95, 96, 97, 97, 98, 98, 99, 99, 99, 99, 98, 98, 98, 98, 98, 98, 98, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, 102, }; static constexpr int16_t kTestScalingLutU[kScalingLookupTableSize] = { 30, 42, 53, 65, 74, 74, 74, 74, 74, 74, 74, 74, 74, 74, 74, 75, 76, 78, 79, 81, 82, 83, 85, 86, 88, 89, 91, 92, 93, 93, 94, 94, 95, 95, 96, 96, 97, 97, 98, 98, 99, 99, 99, 99, 99, 99, 99, 99, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 110, 98, 98, 98, 98, 98, 98, 98, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 96, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, 95, }; static constexpr int16_t kTestScalingLutV[kScalingLookupTableSize] = { 73, 73, 73, 73, 73, 73, 73, 73, 73, 73, 73, 73, 74, 74, 74, 75, 75, 78, 79, 81, 82, 83, 85, 86, 88, 89, 91, 92, 93, 93, 94, 94, 95, 95, 96, 96, 97, 97, 98, 98, 99, 99, 99, 99, 98, 98, 98, 98, 98, 98, 98, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 97, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 98, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 99, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 101, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 150, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 180, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 255, 255, }; if (bitdepth == 10) { for (int i = 0; i < kScalingLutBufferLength; ++i) { ConvertScalingLut10bpp(scaling_lut_10bpp_y_, kTestScalingLutY); ConvertScalingLut10bpp(scaling_lut_10bpp_u_, kTestScalingLutU); ConvertScalingLut10bpp(scaling_lut_10bpp_v_, kTestScalingLutV); } } const FilmGrainParams& params = kFilmGrainParams[0]; const int min_value = 16 << (bitdepth - 8); const int max_value = 235 << (bitdepth - 8); const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { if (chroma_scaling_from_luma_) { blend_chroma_func_( kPlaneU, params, noise_image_, min_value, max_value, width_, height_, /*start_height=*/0, subsampling_x_, subsampling_y_, (bitdepth == 10) ? scaling_lut_10bpp_y_ : kTestScalingLutY, source_plane_y_, y_stride_, source_plane_u_, uv_stride_, dest_plane_u_, uv_stride_); blend_chroma_func_( kPlaneV, params, noise_image_, min_value, max_value, width_, height_, /*start_height=*/0, subsampling_x_, subsampling_y_, (bitdepth == 10) ? scaling_lut_10bpp_y_ : kTestScalingLutY, source_plane_y_, y_stride_, source_plane_v_, uv_stride_, dest_plane_v_, uv_stride_); } else { blend_chroma_func_( kPlaneU, params, noise_image_, min_value, max_value, width_, height_, /*start_height=*/0, subsampling_x_, subsampling_y_, (bitdepth == 10) ? scaling_lut_10bpp_u_ : kTestScalingLutU, source_plane_y_, y_stride_, source_plane_u_, uv_stride_, dest_plane_u_, uv_stride_); blend_chroma_func_( kPlaneV, params, noise_image_, min_value, max_value, width_, height_, /*start_height=*/0, subsampling_x_, subsampling_y_, (bitdepth == 10) ? scaling_lut_10bpp_v_ : kTestScalingLutV, source_plane_y_, y_stride_, source_plane_v_, uv_stride_, dest_plane_v_, uv_stride_); } blend_luma_func_(noise_image_, min_value, max_value, params.chroma_scaling, width_, height_, /*start_height=*/0, (bitdepth == 10) ? scaling_lut_10bpp_y_ : kTestScalingLutY, source_plane_y_, y_stride_, dest_plane_y_, y_stride_); } const absl::Duration elapsed_time = absl::Now() - start; const char* digest_luma = GetBlendLumaTestDigest(bitdepth); printf("YBD%d \"%s\",\n", bitdepth, test_utils::GetMd5Sum(dest_plane_y_, y_stride_ * height_).c_str()); printf("UBD%d \"%s\",\n", bitdepth, test_utils::GetMd5Sum(dest_plane_u_, uv_stride_ * uv_height_).c_str()); printf("VBD%d \"%s\",\n", bitdepth, test_utils::GetMd5Sum(dest_plane_v_, uv_stride_ * uv_height_).c_str()); test_utils::CheckMd5Digest( "BlendNoiseWithImage", absl::StrFormat("Luma cfl=%d, sub_x=%d, sub_y=%d", chroma_scaling_from_luma_, subsampling_x_, subsampling_y_) .c_str(), digest_luma, dest_plane_y_, y_stride_ * height_, elapsed_time); const char* digest_chroma_u = GetBlendChromaUTestDigest( bitdepth, chroma_scaling_from_luma_, subsampling_x_, subsampling_y_); test_utils::CheckMd5Digest( "BlendNoiseWithImage", absl::StrFormat("ChromaU cfl=%d, sub_x=%d, sub_y=%d", chroma_scaling_from_luma_, subsampling_x_, subsampling_y_) .c_str(), digest_chroma_u, dest_plane_u_, uv_stride_ * uv_height_, elapsed_time); const char* digest_chroma_v = GetBlendChromaVTestDigest( bitdepth, chroma_scaling_from_luma_, subsampling_x_, subsampling_y_); test_utils::CheckMd5Digest( "BlendNoiseWithImage", absl::StrFormat("ChromaV cfl=%d, sub_x=%d, sub_y=%d", chroma_scaling_from_luma_, subsampling_x_, subsampling_y_) .c_str(), digest_chroma_v, dest_plane_v_, uv_stride_ * uv_height_, elapsed_time); } using BlendNoiseTest8bpp = BlendNoiseTest<8, uint8_t>; TEST_P(BlendNoiseTest8bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(BlendNoiseTest8bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, BlendNoiseTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #if LIBGAV1_ENABLE_SSE4_1 INSTANTIATE_TEST_SUITE_P(SSE41, BlendNoiseTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, BlendNoiseTest8bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif #if LIBGAV1_MAX_BITDEPTH >= 10 using BlendNoiseTest10bpp = BlendNoiseTest<10, uint16_t>; TEST_P(BlendNoiseTest10bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(BlendNoiseTest10bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, BlendNoiseTest10bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #if LIBGAV1_ENABLE_SSE4_1 INSTANTIATE_TEST_SUITE_P(SSE41, BlendNoiseTest10bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, BlendNoiseTest10bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using BlendNoiseTest12bpp = BlendNoiseTest<12, uint16_t>; TEST_P(BlendNoiseTest12bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(BlendNoiseTest12bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, BlendNoiseTest12bpp, testing::Combine(testing::Range(0, 2), testing::Range(0, 3))); #endif // LIBGAV1_MAX_BITDEPTH == 12 template class FilmGrainSpeedTest : public testing::TestWithParam { public: static_assert(bitdepth >= kBitdepth8 && bitdepth <= LIBGAV1_MAX_BITDEPTH, ""); ~FilmGrainSpeedTest() override = default; protected: void SetUp() override { test_utils::ResetDspTable(bitdepth); FilmGrainInit_C(); const testing::TestInfo* const test_info = testing::UnitTest::GetInstance()->current_test_info(); const char* const test_case = test_info->test_suite_name(); if (absl::StartsWith(test_case, "NEON/")) { #if LIBGAV1_ENABLE_NEON FilmGrainInit_NEON(); #endif } else if (absl::StartsWith(test_case, "SSE41/")) { if ((GetCpuInfo() & kSSE4_1) == 0) GTEST_SKIP() << "No SSE4.1 support!"; FilmGrainInit_SSE4_1(); } uv_width_ = (width_ + subsampling_x_) >> subsampling_x_; uv_height_ = (height_ + subsampling_y_) >> subsampling_y_; uv_stride_ = uv_width_ * sizeof(Pixel); y_stride_ = width_ * sizeof(Pixel); const size_t buffer_size = sizeof(Pixel) * (width_ * height_ + 2 * uv_width_ * uv_height_); source_buffer_.reset(new (std::nothrow) uint8_t[buffer_size]); memset(source_buffer_.get(), 0, sizeof(source_buffer_[0]) * buffer_size); dest_buffer_.reset(new (std::nothrow) uint8_t[buffer_size]); memset(dest_buffer_.get(), 0, sizeof(dest_buffer_[0]) * buffer_size); source_plane_y_ = source_buffer_.get(); source_plane_u_ = source_plane_y_ + y_stride_ * height_; source_plane_v_ = source_plane_u_ + uv_stride_ * uv_height_; dest_plane_y_ = dest_buffer_.get(); dest_plane_u_ = dest_plane_y_ + y_stride_ * height_; dest_plane_v_ = dest_plane_u_ + uv_stride_ * uv_height_; const int num_threads = GetParam(); thread_pool_ = ThreadPool::Create(num_threads); } void TestSpeed(int num_runs); private: const int width_ = 1920; const int height_ = 1080; const int subsampling_x_ = 1; const int subsampling_y_ = 1; int uv_width_ = 0; int uv_height_ = 0; int uv_stride_ = 0; int y_stride_ = 0; std::unique_ptr source_buffer_; std::unique_ptr dest_buffer_; const uint8_t* source_plane_y_ = nullptr; const uint8_t* source_plane_u_ = nullptr; const uint8_t* source_plane_v_ = nullptr; uint8_t* dest_plane_y_ = nullptr; uint8_t* dest_plane_u_ = nullptr; uint8_t* dest_plane_v_ = nullptr; std::unique_ptr thread_pool_; }; // Each run of the speed test adds film grain noise to 10 dummy frames. The // film grain parameters for the 10 frames were generated with aomenc. template void FilmGrainSpeedTest::TestSpeed(const int num_runs) { const dsp::Dsp* dsp = GetDspTable(bitdepth); if (dsp->film_grain.blend_noise_chroma[0] == nullptr || dsp->film_grain.blend_noise_luma == nullptr) { return; } for (int k = 0; k < kNumFilmGrainTestParams; ++k) { const FilmGrainParams& params = kFilmGrainParams[k]; const absl::Time start = absl::Now(); for (int i = 0; i < num_runs; ++i) { FilmGrain film_grain(params, /*is_monochrome=*/false, /*color_matrix_is_identity=*/false, subsampling_x_, subsampling_y_, width_, height_, thread_pool_.get()); EXPECT_TRUE(film_grain.AddNoise( source_plane_y_, y_stride_, source_plane_u_, source_plane_v_, uv_stride_, dest_plane_y_, y_stride_, dest_plane_u_, dest_plane_v_, uv_stride_)); } const absl::Duration elapsed_time = absl::Now() - start; const char* digest_luma = GetTestDigestLuma(bitdepth, k); test_utils::CheckMd5Digest( "FilmGrainSynthesisLuma", absl::StrFormat("kFilmGrainParams[%d]", k).c_str(), digest_luma, dest_plane_y_, y_stride_ * height_, elapsed_time); const char* digest_chroma_u = GetTestDigestChromaU(bitdepth, k); test_utils::CheckMd5Digest( "FilmGrainSynthesisChromaU", absl::StrFormat("kFilmGrainParams[%d]", k).c_str(), digest_chroma_u, dest_plane_u_, uv_stride_ * uv_height_, elapsed_time); const char* digest_chroma_v = GetTestDigestChromaV(bitdepth, k); test_utils::CheckMd5Digest( "FilmGrainSynthesisChromaV", absl::StrFormat("kFilmGrainParams[%d]", k).c_str(), digest_chroma_v, dest_plane_v_, uv_stride_ * uv_height_, elapsed_time); } } using FilmGrainSpeedTest8bpp = FilmGrainSpeedTest<8, uint8_t>; TEST_P(FilmGrainSpeedTest8bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(FilmGrainSpeedTest8bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, FilmGrainSpeedTest8bpp, testing::Values(0, 3, 8)); #if LIBGAV1_ENABLE_SSE4_1 INSTANTIATE_TEST_SUITE_P(SSE41, FilmGrainSpeedTest8bpp, testing::Values(0, 3, 8)); #endif #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, FilmGrainSpeedTest8bpp, testing::Values(0, 3, 8)); #endif #if LIBGAV1_MAX_BITDEPTH >= 10 using FilmGrainSpeedTest10bpp = FilmGrainSpeedTest<10, uint16_t>; TEST_P(FilmGrainSpeedTest10bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(FilmGrainSpeedTest10bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, FilmGrainSpeedTest10bpp, testing::Values(0, 3, 8)); #if LIBGAV1_ENABLE_SSE4_1 INSTANTIATE_TEST_SUITE_P(SSE41, FilmGrainSpeedTest10bpp, testing::Values(0, 3, 8)); #endif #if LIBGAV1_ENABLE_NEON INSTANTIATE_TEST_SUITE_P(NEON, FilmGrainSpeedTest10bpp, testing::Values(0, 3, 8)); #endif #endif // LIBGAV1_MAX_BITDEPTH >= 10 #if LIBGAV1_MAX_BITDEPTH == 12 using FilmGrainSpeedTest12bpp = FilmGrainSpeedTest<12, uint16_t>; TEST_P(FilmGrainSpeedTest12bpp, MatchesOriginalOutput) { TestSpeed(1); } TEST_P(FilmGrainSpeedTest12bpp, DISABLED_Speed) { TestSpeed(kNumSpeedTests); } INSTANTIATE_TEST_SUITE_P(C, FilmGrainSpeedTest12bpp, testing::Values(0, 3, 8)); #endif // LIBGAV1_MAX_BITDEPTH == 12 } // namespace } // namespace film_grain } // namespace dsp } // namespace libgav1