X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=resample_effect_test.cpp;h=84f61e78e16381bd70174c4fc470dfcc29591ccf;hb=910df1ba510ad8dfda93e175d1d66d33e9519b19;hp=7955c5ba99f480a94f048385f1697ffa0fb09091;hpb=e09662ec1b11f72746c7691fef56e14241d32d1c;p=movit diff --git a/resample_effect_test.cpp b/resample_effect_test.cpp index 7955c5b..84f61e7 100644 --- a/resample_effect_test.cpp +++ b/resample_effect_test.cpp @@ -8,7 +8,9 @@ #include "effect_chain.h" #include "flat_input.h" +#include "fp16.h" #include "image_format.h" +#include "init.h" #include "resample_effect.h" #include "test_util.h" @@ -430,6 +432,8 @@ TEST(ResampleEffectTest, Precision) { } #ifdef HAVE_BENCHMARK +template<> inline uint8_t from_fp32(float x) { return x; } + template void BM_ResampleEffect(benchmark::State &state, GammaCurve gamma_curve, GLenum output_format, const std::string &shader_type) { @@ -443,7 +447,7 @@ void BM_ResampleEffect(benchmark::State &state, GammaCurve gamma_curve, GLenum o unique_ptr out_data(new T[out_width * out_height * 4]); for (unsigned i = 0; i < in_width * in_height * 4; ++i) { - data[i] = rand(); + data[i] = from_fp32(float(rand())); } EffectChainTester tester(nullptr, out_width, out_height, FORMAT_BGRA_POSTMULTIPLIED_ALPHA, COLORSPACE_sRGB, gamma_curve, output_format); @@ -456,9 +460,9 @@ void BM_ResampleEffect(benchmark::State &state, GammaCurve gamma_curve, GLenum o tester.benchmark(state, out_data.get(), GL_BGRA, COLORSPACE_sRGB, gamma_curve, OUTPUT_ALPHA_FORMAT_PREMULTIPLIED); } -void BM_ResampleEffectFloat(benchmark::State &state, GammaCurve gamma_curve, const std::string &shader_type) +void BM_ResampleEffectHalf(benchmark::State &state, GammaCurve gamma_curve, const std::string &shader_type) { - BM_ResampleEffect(state, gamma_curve, GL_RGBA16F, shader_type); + BM_ResampleEffect(state, gamma_curve, GL_RGBA16F, shader_type); } void BM_ResampleEffectInt8(benchmark::State &state, GammaCurve gamma_curve, const std::string &shader_type) @@ -467,9 +471,27 @@ void BM_ResampleEffectInt8(benchmark::State &state, GammaCurve gamma_curve, cons } BENCHMARK_CAPTURE(BM_ResampleEffectInt8, Int8Upscale, GAMMA_REC_709, "fragment")->Args({640, 360, 1280, 720})->Args({320, 180, 1280, 720})->Args({321, 181, 1280, 720})->UseRealTime()->Unit(benchmark::kMicrosecond); -BENCHMARK_CAPTURE(BM_ResampleEffectFloat, Float32Upscale, GAMMA_LINEAR, "fragment")->Args({640, 360, 1280, 720})->Args({320, 180, 1280, 720})->Args({321, 181, 1280, 720})->UseRealTime()->Unit(benchmark::kMicrosecond); +BENCHMARK_CAPTURE(BM_ResampleEffectHalf, Float16Upscale, GAMMA_LINEAR, "fragment")->Args({640, 360, 1280, 720})->Args({320, 180, 1280, 720})->Args({321, 181, 1280, 720})->UseRealTime()->Unit(benchmark::kMicrosecond); BENCHMARK_CAPTURE(BM_ResampleEffectInt8, Int8Downscale, GAMMA_REC_709, "fragment")->Args({1280, 720, 640, 360})->Args({1280, 720, 320, 180})->Args({1280, 720, 321, 181})->UseRealTime()->Unit(benchmark::kMicrosecond); -BENCHMARK_CAPTURE(BM_ResampleEffectFloat, Float32Downscale, GAMMA_LINEAR, "fragment")->Args({1280, 720, 640, 360})->Args({1280, 720, 320, 180})->Args({1280, 720, 321, 181})->UseRealTime()->Unit(benchmark::kMicrosecond); +BENCHMARK_CAPTURE(BM_ResampleEffectHalf, Float16Downscale, GAMMA_LINEAR, "fragment")->Args({1280, 720, 640, 360})->Args({1280, 720, 320, 180})->Args({1280, 720, 321, 181})->UseRealTime()->Unit(benchmark::kMicrosecond); + +void BM_ComputeScalingWeights(benchmark::State &state) +{ + constexpr unsigned src_size = 1280; + constexpr unsigned dst_size = 35; + int old_precision = movit_texel_subpixel_precision; + movit_texel_subpixel_precision = 64; // To get consistent results across GPUs; this is a CPU test. + + // One iteration warmup to make sure the Lanczos table is computed. + calculate_scaling_weights(src_size, dst_size, 0.999f, 0.0f); + + for (auto _ : state) { + ScalingWeights weights = calculate_scaling_weights(src_size, dst_size, 0.999f, 0.0f); + } + + movit_texel_subpixel_precision = old_precision; +} +BENCHMARK(BM_ComputeScalingWeights)->Unit(benchmark::kMicrosecond); #endif