123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527 |
- // The MIT License(MIT)
- //
- // Copyright(c) 2021 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- //
- // Permission is hereby granted, free of charge, to any person obtaining a copy of
- // this software and associated documentation files(the "Software"), to deal in
- // the Software without restriction, including without limitation the rights to
- // use, copy, modify, merge, publish, distribute, sublicense, and / or sell copies of
- // the Software, and to permit persons to whom the Software is furnished to do so,
- // subject to the following conditions :
- //
- // The above copyright notice and this permission notice shall be included in all
- // copies or substantial portions of the Software.
- //
- // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
- // FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.IN NO EVENT SHALL THE AUTHORS OR
- // COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
- // IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
- // CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
- #pragma once
- #include <algorithm>
- #include <cmath>
- #include <cstdint>
// NIS_ALIGNED(x) expands to the compiler-specific spelling of "align this type to x bytes".
// A definition of NIS_ALIGNED supplied before this point takes precedence.
#ifndef NIS_ALIGNED
#if defined(_MSC_VER)
#define NIS_ALIGNED(x) __declspec(align(x))
#elif defined(__GNUC__)
#define NIS_ALIGNED(x) __attribute__ ((aligned(x)))
#else
// Neither MSVC nor a GNU-compatible compiler: fall back to the standard C++11
// specifier so that `struct NIS_ALIGNED(256) NISConfig` still compiles.
#define NIS_ALIGNED(x) alignas(x)
#endif
#endif
- struct NIS_ALIGNED(256) NISConfig
- {
- float kDetectRatio;
- float kDetectThres;
- float kMinContrastRatio;
- float kRatioNorm;
- float kContrastBoost;
- float kEps;
- float kSharpStartY;
- float kSharpScaleY;
- float kSharpStrengthMin;
- float kSharpStrengthScale;
- float kSharpLimitMin;
- float kSharpLimitScale;
- float kScaleX;
- float kScaleY;
- float kDstNormX;
- float kDstNormY;
- float kSrcNormX;
- float kSrcNormY;
- uint32_t kInputViewportOriginX;
- uint32_t kInputViewportOriginY;
- uint32_t kInputViewportWidth;
- uint32_t kInputViewportHeight;
- uint32_t kOutputViewportOriginX;
- uint32_t kOutputViewportOriginY;
- uint32_t kOutputViewportWidth;
- uint32_t kOutputViewportHeight;
- float reserved0;
- float reserved1;
- };
// Selects which parameter set NVScalerUpdateConfig / NVSharpenUpdateConfig compute.
enum class NISHDRMode : uint32_t
{
    None = 0,    // SDR parameter set
    Linear = 1,  // HDR parameter set
    PQ = 2       // HDR parameter set with its own sharpen start/end luma range
                 // (presumably PQ-encoded HDR input -- confirm)
};
// GPU family used by NISOptimizer to pick block and thread-group sizes.
enum class NISGPUArchitecture : uint32_t
{
    NVIDIA_Generic = 0,
    AMD_Generic = 1,
    Intel_Generic = 2
};
- struct NISOptimizer
- {
- bool isUpscaling;
- NISGPUArchitecture gpuArch;
- constexpr NISOptimizer(bool isUpscaling = true, NISGPUArchitecture gpuArch = NISGPUArchitecture::NVIDIA_Generic)
- : isUpscaling(isUpscaling)
- , gpuArch(gpuArch)
- {}
- constexpr uint32_t GetOptimalBlockWidth()
- {
- switch (gpuArch) {
- case NISGPUArchitecture::NVIDIA_Generic:
- return 32;
- case NISGPUArchitecture::AMD_Generic:
- return 32;
- case NISGPUArchitecture::Intel_Generic:
- return 32;
- }
- return 32;
- }
- constexpr uint32_t GetOptimalBlockHeight()
- {
- switch (gpuArch) {
- case NISGPUArchitecture::NVIDIA_Generic:
- return isUpscaling ? 24 : 32;
- case NISGPUArchitecture::AMD_Generic:
- return isUpscaling ? 24 : 32;
- case NISGPUArchitecture::Intel_Generic:
- return isUpscaling ? 24 : 32;
- }
- return isUpscaling ? 24 : 32;
- }
- constexpr uint32_t GetOptimalThreadGroupSize()
- {
- switch (gpuArch) {
- case NISGPUArchitecture::NVIDIA_Generic:
- return 128;
- case NISGPUArchitecture::AMD_Generic:
- return 256;
- case NISGPUArchitecture::Intel_Generic:
- return 256;
- }
- return 256;
- }
- };
- inline bool NVScalerUpdateConfig(NISConfig& config, float sharpness,
- uint32_t inputViewportOriginX, uint32_t inputViewportOriginY,
- uint32_t inputViewportWidth, uint32_t inputViewportHeight,
- uint32_t inputTextureWidth, uint32_t inputTextureHeight,
- uint32_t outputViewportOriginX, uint32_t outputViewportOriginY,
- uint32_t outputViewportWidth, uint32_t outputViewportHeight,
- uint32_t outputTextureWidth, uint32_t outputTextureHeight,
- NISHDRMode hdrMode = NISHDRMode::None)
- {
- // adjust params based on value from sharpness slider
- sharpness = std::max<float>(std::min<float>(1.f, sharpness), 0.f);
- float sharpen_slider = sharpness - 0.5f; // Map 0 to 1 to -0.5 to +0.5
- // Different range for 0 to 50% vs 50% to 100%
- // The idea is to make sure sharpness of 0% map to no-sharpening,
- // while also ensuring that sharpness of 100% doesn't cause too much over-sharpening.
- const float MaxScale = (sharpen_slider >= 0.0f) ? 1.25f : 1.75f;
- const float MinScale = (sharpen_slider >= 0.0f) ? 1.25f : 1.0f;
- const float LimitScale = (sharpen_slider >= 0.0f) ? 1.25f : 1.0f;
- float kDetectRatio = 1127.f / 1024.f;
- // Params for SDR
- float kDetectThres = 64.0f / 1024.0f;
- float kMinContrastRatio = 2.0f;
- float kMaxContrastRatio = 10.0f;
- float kSharpStartY = 0.45f;
- float kSharpEndY = 0.9f;
- float kSharpStrengthMin = std::max<float>(0.0f, 0.4f + sharpen_slider * MinScale * 1.2f);
- float kSharpStrengthMax = 1.6f + sharpen_slider * 1.8f;
- float kSharpLimitMin = std::max<float>(0.1f, 0.14f + sharpen_slider * LimitScale * 0.32f);
- float kSharpLimitMax = 0.5f + sharpen_slider * LimitScale * 0.6f;
- if (hdrMode == NISHDRMode::Linear || hdrMode == NISHDRMode::PQ)
- {
- kDetectThres = 32.0f / 1024.0f;
- kMinContrastRatio = 1.5f;
- kMaxContrastRatio = 5.0f;
- kSharpStrengthMin = std::max<float>(0.0f, 0.4f + sharpen_slider * MinScale * 1.1f);
- kSharpStrengthMax = 2.2f + sharpen_slider * MaxScale * 1.8f;
- kSharpLimitMin = std::max<float>(0.06f, 0.10f + sharpen_slider * LimitScale * 0.28f);
- kSharpLimitMax = 0.6f + sharpen_slider * LimitScale * 0.6f;
- if (hdrMode == NISHDRMode::PQ)
- {
- kSharpStartY = 0.35f;
- kSharpEndY = 0.55f;
- }
- else
- {
- kSharpStartY = 0.3f;
- kSharpEndY = 0.5f;
- }
- }
- float kRatioNorm = 1.0f / (kMaxContrastRatio - kMinContrastRatio);
- float kSharpScaleY = 1.0f / (kSharpEndY - kSharpStartY);
- float kSharpStrengthScale = kSharpStrengthMax - kSharpStrengthMin;
- float kSharpLimitScale = kSharpLimitMax - kSharpLimitMin;
- config.kInputViewportWidth = inputViewportWidth == 0 ? inputTextureWidth : inputViewportWidth;
- config.kInputViewportHeight = inputViewportHeight == 0 ? inputTextureHeight : inputViewportHeight;
- config.kOutputViewportWidth = outputViewportWidth == 0 ? outputTextureWidth : outputViewportWidth;
- config.kOutputViewportHeight = outputViewportHeight == 0 ? outputTextureHeight : outputViewportHeight;
- if (config.kInputViewportWidth == 0 || config.kInputViewportHeight == 0 ||
- config.kOutputViewportWidth == 0 || config.kOutputViewportHeight == 0)
- return false;
- config.kInputViewportOriginX = inputViewportOriginX;
- config.kInputViewportOriginY = inputViewportOriginY;
- config.kOutputViewportOriginX = outputViewportOriginX;
- config.kOutputViewportOriginY = outputViewportOriginY;
- config.kSrcNormX = 1.f / inputTextureWidth;
- config.kSrcNormY = 1.f / inputTextureHeight;
- config.kDstNormX = 1.f / outputTextureWidth;
- config.kDstNormY = 1.f / outputTextureHeight;
- config.kScaleX = config.kInputViewportWidth / float(config.kOutputViewportWidth);
- config.kScaleY = config.kInputViewportHeight / float(config.kOutputViewportHeight);
- if (config.kScaleX < 0.5f || config.kScaleX > 1.f || config.kScaleY < 0.5f || config.kScaleY > 1.f)
- return false;
- config.kDetectRatio = kDetectRatio;
- config.kDetectThres = kDetectThres;
- config.kMinContrastRatio = kMinContrastRatio;
- config.kRatioNorm = kRatioNorm;
- config.kContrastBoost = 1.0f;
- config.kEps = 1.0f;
- config.kSharpStartY = kSharpStartY;
- config.kSharpScaleY = kSharpScaleY;
- config.kSharpStrengthMin = kSharpStrengthMin;
- config.kSharpStrengthScale = kSharpStrengthScale;
- config.kSharpLimitMin = kSharpLimitMin;
- config.kSharpLimitScale = kSharpLimitScale;
- return true;
- }
- inline bool NVSharpenUpdateConfig(NISConfig& config, float sharpness,
- uint32_t inputViewportOriginX, uint32_t inputViewportOriginY,
- uint32_t inputViewportWidth, uint32_t inputViewportHeight,
- uint32_t inputTextureWidth, uint32_t inputTextureHeight,
- uint32_t outputViewportOriginX, uint32_t outputViewportOriginY,
- NISHDRMode hdrMode = NISHDRMode::None)
- {
- return NVScalerUpdateConfig(config, sharpness,
- inputViewportOriginX, inputViewportOriginY, inputViewportWidth, inputViewportHeight, inputTextureWidth, inputTextureHeight,
- outputViewportOriginX, outputViewportOriginY, inputViewportWidth, inputViewportHeight, inputTextureWidth, inputTextureHeight,
- hdrMode);
- }
// Filter coefficient tables. They live in an unnamed namespace, so every
// translation unit that includes this file gets its own copy.
- namespace {
// Number of rows in each coefficient table below.
- constexpr size_t kPhaseCount = 64;
// Number of entries per row in each coefficient table below.
- constexpr size_t kFilterSize = 8;
// Scaler coefficients as floats: kPhaseCount rows of kFilterSize entries.
// Row 0 is a single 1.0 at index 2; the last two entries of every row are 0.
// NOTE(review): presumably one row per sub-pixel phase of the scaling filter,
// consumed by the scaler shader -- confirm against the shader source.
- constexpr float coef_scale[kPhaseCount][kFilterSize] = {
- {0.0, 0.0, 1.0000, 0.0, 0.0, 0.0, 0.0, 0.0},
- {0.0029, -0.0127, 1.0000, 0.0132, -0.0034, 0.0, 0.0, 0.0},
- {0.0063, -0.0249, 0.9985, 0.0269, -0.0068, 0.0, 0.0, 0.0},
- {0.0088, -0.0361, 0.9956, 0.0415, -0.0103, 0.0005, 0.0, 0.0},
- {0.0117, -0.0474, 0.9932, 0.0562, -0.0142, 0.0005, 0.0, 0.0},
- {0.0142, -0.0576, 0.9897, 0.0713, -0.0181, 0.0005, 0.0, 0.0},
- {0.0166, -0.0674, 0.9844, 0.0874, -0.0220, 0.0010, 0.0, 0.0},
- {0.0186, -0.0762, 0.9785, 0.1040, -0.0264, 0.0015, 0.0, 0.0},
- {0.0205, -0.0850, 0.9727, 0.1206, -0.0308, 0.0020, 0.0, 0.0},
- {0.0225, -0.0928, 0.9648, 0.1382, -0.0352, 0.0024, 0.0, 0.0},
- {0.0239, -0.1006, 0.9575, 0.1558, -0.0396, 0.0029, 0.0, 0.0},
- {0.0254, -0.1074, 0.9487, 0.1738, -0.0439, 0.0034, 0.0, 0.0},
- {0.0264, -0.1138, 0.9390, 0.1929, -0.0488, 0.0044, 0.0, 0.0},
- {0.0278, -0.1191, 0.9282, 0.2119, -0.0537, 0.0049, 0.0, 0.0},
- {0.0288, -0.1245, 0.9170, 0.2310, -0.0581, 0.0059, 0.0, 0.0},
- {0.0293, -0.1294, 0.9058, 0.2510, -0.0630, 0.0063, 0.0, 0.0},
- {0.0303, -0.1333, 0.8926, 0.2710, -0.0679, 0.0073, 0.0, 0.0},
- {0.0308, -0.1367, 0.8789, 0.2915, -0.0728, 0.0083, 0.0, 0.0},
- {0.0308, -0.1401, 0.8657, 0.3120, -0.0776, 0.0093, 0.0, 0.0},
- {0.0313, -0.1426, 0.8506, 0.3330, -0.0825, 0.0103, 0.0, 0.0},
- {0.0313, -0.1445, 0.8354, 0.3540, -0.0874, 0.0112, 0.0, 0.0},
- {0.0313, -0.1460, 0.8193, 0.3755, -0.0923, 0.0122, 0.0, 0.0},
- {0.0313, -0.1470, 0.8022, 0.3965, -0.0967, 0.0137, 0.0, 0.0},
- {0.0308, -0.1479, 0.7856, 0.4185, -0.1016, 0.0146, 0.0, 0.0},
- {0.0303, -0.1479, 0.7681, 0.4399, -0.1060, 0.0156, 0.0, 0.0},
- {0.0298, -0.1479, 0.7505, 0.4614, -0.1104, 0.0166, 0.0, 0.0},
- {0.0293, -0.1470, 0.7314, 0.4829, -0.1147, 0.0181, 0.0, 0.0},
- {0.0288, -0.1460, 0.7119, 0.5049, -0.1187, 0.0190, 0.0, 0.0},
- {0.0278, -0.1445, 0.6929, 0.5264, -0.1226, 0.0200, 0.0, 0.0},
- {0.0273, -0.1431, 0.6724, 0.5479, -0.1260, 0.0215, 0.0, 0.0},
- {0.0264, -0.1411, 0.6528, 0.5693, -0.1299, 0.0225, 0.0, 0.0},
- {0.0254, -0.1387, 0.6323, 0.5903, -0.1328, 0.0234, 0.0, 0.0},
- {0.0244, -0.1357, 0.6113, 0.6113, -0.1357, 0.0244, 0.0, 0.0},
- {0.0234, -0.1328, 0.5903, 0.6323, -0.1387, 0.0254, 0.0, 0.0},
- {0.0225, -0.1299, 0.5693, 0.6528, -0.1411, 0.0264, 0.0, 0.0},
- {0.0215, -0.1260, 0.5479, 0.6724, -0.1431, 0.0273, 0.0, 0.0},
- {0.0200, -0.1226, 0.5264, 0.6929, -0.1445, 0.0278, 0.0, 0.0},
- {0.0190, -0.1187, 0.5049, 0.7119, -0.1460, 0.0288, 0.0, 0.0},
- {0.0181, -0.1147, 0.4829, 0.7314, -0.1470, 0.0293, 0.0, 0.0},
- {0.0166, -0.1104, 0.4614, 0.7505, -0.1479, 0.0298, 0.0, 0.0},
- {0.0156, -0.1060, 0.4399, 0.7681, -0.1479, 0.0303, 0.0, 0.0},
- {0.0146, -0.1016, 0.4185, 0.7856, -0.1479, 0.0308, 0.0, 0.0},
- {0.0137, -0.0967, 0.3965, 0.8022, -0.1470, 0.0313, 0.0, 0.0},
- {0.0122, -0.0923, 0.3755, 0.8193, -0.1460, 0.0313, 0.0, 0.0},
- {0.0112, -0.0874, 0.3540, 0.8354, -0.1445, 0.0313, 0.0, 0.0},
- {0.0103, -0.0825, 0.3330, 0.8506, -0.1426, 0.0313, 0.0, 0.0},
- {0.0093, -0.0776, 0.3120, 0.8657, -0.1401, 0.0308, 0.0, 0.0},
- {0.0083, -0.0728, 0.2915, 0.8789, -0.1367, 0.0308, 0.0, 0.0},
- {0.0073, -0.0679, 0.2710, 0.8926, -0.1333, 0.0303, 0.0, 0.0},
- {0.0063, -0.0630, 0.2510, 0.9058, -0.1294, 0.0293, 0.0, 0.0},
- {0.0059, -0.0581, 0.2310, 0.9170, -0.1245, 0.0288, 0.0, 0.0},
- {0.0049, -0.0537, 0.2119, 0.9282, -0.1191, 0.0278, 0.0, 0.0},
- {0.0044, -0.0488, 0.1929, 0.9390, -0.1138, 0.0264, 0.0, 0.0},
- {0.0034, -0.0439, 0.1738, 0.9487, -0.1074, 0.0254, 0.0, 0.0},
- {0.0029, -0.0396, 0.1558, 0.9575, -0.1006, 0.0239, 0.0, 0.0},
- {0.0024, -0.0352, 0.1382, 0.9648, -0.0928, 0.0225, 0.0, 0.0},
- {0.0020, -0.0308, 0.1206, 0.9727, -0.0850, 0.0205, 0.0, 0.0},
- {0.0015, -0.0264, 0.1040, 0.9785, -0.0762, 0.0186, 0.0, 0.0},
- {0.0010, -0.0220, 0.0874, 0.9844, -0.0674, 0.0166, 0.0, 0.0},
- {0.0005, -0.0181, 0.0713, 0.9897, -0.0576, 0.0142, 0.0, 0.0},
- {0.0005, -0.0142, 0.0562, 0.9932, -0.0474, 0.0117, 0.0, 0.0},
- {0.0005, -0.0103, 0.0415, 0.9956, -0.0361, 0.0088, 0.0, 0.0},
- {0.0, -0.0068, 0.0269, 0.9985, -0.0249, 0.0063, 0.0, 0.0},
- {0.0, -0.0034, 0.0132, 1.0000, -0.0127, 0.0029, 0.0, 0.0}
- };
// Second float table with the same shape as coef_scale. Row 0 is
// {0, -0.6001, 1.2002, -0.6001, 0, ...}; the last two entries of every row are 0.
// NOTE(review): the name suggests unsharp-mask (USM) coefficients -- confirm.
- constexpr float coef_usm[kPhaseCount][kFilterSize] = {
- {0, -0.6001, 1.2002, -0.6001, 0, 0, 0, 0},
- {0.0029, -0.6084, 1.1987, -0.5903, -0.0029, 0, 0, 0},
- {0.0049, -0.6147, 1.1958, -0.5791, -0.0068, 0.0005, 0, 0},
- {0.0073, -0.6196, 1.1890, -0.5659, -0.0103, 0, 0, 0},
- {0.0093, -0.6235, 1.1802, -0.5513, -0.0151, 0, 0, 0},
- {0.0112, -0.6265, 1.1699, -0.5352, -0.0195, 0.0005, 0, 0},
- {0.0122, -0.6270, 1.1582, -0.5181, -0.0259, 0.0005, 0, 0},
- {0.0142, -0.6284, 1.1455, -0.5005, -0.0317, 0.0005, 0, 0},
- {0.0156, -0.6265, 1.1274, -0.4790, -0.0386, 0.0005, 0, 0},
- {0.0166, -0.6235, 1.1089, -0.4570, -0.0454, 0.0010, 0, 0},
- {0.0176, -0.6187, 1.0879, -0.4346, -0.0532, 0.0010, 0, 0},
- {0.0181, -0.6138, 1.0659, -0.4102, -0.0615, 0.0015, 0, 0},
- {0.0190, -0.6069, 1.0405, -0.3843, -0.0698, 0.0015, 0, 0},
- {0.0195, -0.6006, 1.0161, -0.3574, -0.0796, 0.0020, 0, 0},
- {0.0200, -0.5928, 0.9893, -0.3286, -0.0898, 0.0024, 0, 0},
- {0.0200, -0.5820, 0.9580, -0.2988, -0.1001, 0.0029, 0, 0},
- {0.0200, -0.5728, 0.9292, -0.2690, -0.1104, 0.0034, 0, 0},
- {0.0200, -0.5620, 0.8975, -0.2368, -0.1226, 0.0039, 0, 0},
- {0.0205, -0.5498, 0.8643, -0.2046, -0.1343, 0.0044, 0, 0},
- {0.0200, -0.5371, 0.8301, -0.1709, -0.1465, 0.0049, 0, 0},
- {0.0195, -0.5239, 0.7944, -0.1367, -0.1587, 0.0054, 0, 0},
- {0.0195, -0.5107, 0.7598, -0.1021, -0.1724, 0.0059, 0, 0},
- {0.0190, -0.4966, 0.7231, -0.0649, -0.1865, 0.0063, 0, 0},
- {0.0186, -0.4819, 0.6846, -0.0288, -0.1997, 0.0068, 0, 0},
- {0.0186, -0.4668, 0.6460, 0.0093, -0.2144, 0.0073, 0, 0},
- {0.0176, -0.4507, 0.6055, 0.0479, -0.2290, 0.0083, 0, 0},
- {0.0171, -0.4370, 0.5693, 0.0859, -0.2446, 0.0088, 0, 0},
- {0.0161, -0.4199, 0.5283, 0.1255, -0.2598, 0.0098, 0, 0},
- {0.0161, -0.4048, 0.4883, 0.1655, -0.2754, 0.0103, 0, 0},
- {0.0151, -0.3887, 0.4497, 0.2041, -0.2910, 0.0107, 0, 0},
- {0.0142, -0.3711, 0.4072, 0.2446, -0.3066, 0.0117, 0, 0},
- {0.0137, -0.3555, 0.3672, 0.2852, -0.3228, 0.0122, 0, 0},
- {0.0132, -0.3394, 0.3262, 0.3262, -0.3394, 0.0132, 0, 0},
- {0.0122, -0.3228, 0.2852, 0.3672, -0.3555, 0.0137, 0, 0},
- {0.0117, -0.3066, 0.2446, 0.4072, -0.3711, 0.0142, 0, 0},
- {0.0107, -0.2910, 0.2041, 0.4497, -0.3887, 0.0151, 0, 0},
- {0.0103, -0.2754, 0.1655, 0.4883, -0.4048, 0.0161, 0, 0},
- {0.0098, -0.2598, 0.1255, 0.5283, -0.4199, 0.0161, 0, 0},
- {0.0088, -0.2446, 0.0859, 0.5693, -0.4370, 0.0171, 0, 0},
- {0.0083, -0.2290, 0.0479, 0.6055, -0.4507, 0.0176, 0, 0},
- {0.0073, -0.2144, 0.0093, 0.6460, -0.4668, 0.0186, 0, 0},
- {0.0068, -0.1997, -0.0288, 0.6846, -0.4819, 0.0186, 0, 0},
- {0.0063, -0.1865, -0.0649, 0.7231, -0.4966, 0.0190, 0, 0},
- {0.0059, -0.1724, -0.1021, 0.7598, -0.5107, 0.0195, 0, 0},
- {0.0054, -0.1587, -0.1367, 0.7944, -0.5239, 0.0195, 0, 0},
- {0.0049, -0.1465, -0.1709, 0.8301, -0.5371, 0.0200, 0, 0},
- {0.0044, -0.1343, -0.2046, 0.8643, -0.5498, 0.0205, 0, 0},
- {0.0039, -0.1226, -0.2368, 0.8975, -0.5620, 0.0200, 0, 0},
- {0.0034, -0.1104, -0.2690, 0.9292, -0.5728, 0.0200, 0, 0},
- {0.0029, -0.1001, -0.2988, 0.9580, -0.5820, 0.0200, 0, 0},
- {0.0024, -0.0898, -0.3286, 0.9893, -0.5928, 0.0200, 0, 0},
- {0.0020, -0.0796, -0.3574, 1.0161, -0.6006, 0.0195, 0, 0},
- {0.0015, -0.0698, -0.3843, 1.0405, -0.6069, 0.0190, 0, 0},
- {0.0015, -0.0615, -0.4102, 1.0659, -0.6138, 0.0181, 0, 0},
- {0.0010, -0.0532, -0.4346, 1.0879, -0.6187, 0.0176, 0, 0},
- {0.0010, -0.0454, -0.4570, 1.1089, -0.6235, 0.0166, 0, 0},
- {0.0005, -0.0386, -0.4790, 1.1274, -0.6265, 0.0156, 0, 0},
- {0.0005, -0.0317, -0.5005, 1.1455, -0.6284, 0.0142, 0, 0},
- {0.0005, -0.0259, -0.5181, 1.1582, -0.6270, 0.0122, 0, 0},
- {0.0005, -0.0195, -0.5352, 1.1699, -0.6265, 0.0112, 0, 0},
- {0, -0.0151, -0.5513, 1.1802, -0.6235, 0.0093, 0, 0},
- {0, -0.0103, -0.5659, 1.1890, -0.6196, 0.0073, 0, 0},
- {0.0005, -0.0068, -0.5791, 1.1958, -0.6147, 0.0049, 0, 0},
- {0, -0.0029, -0.5903, 1.1987, -0.6084, 0.0029, 0, 0}
- };
// Same shape as coef_scale, stored as uint16_t.
// NOTE(review): the values appear to be the IEEE 754 binary16 (half-float) bit
// patterns of the matching coef_scale entries (e.g. 15360 == 0x3C00 == 1.0) --
// confirm before regenerating either table.
- constexpr uint16_t coef_scale_fp16[kPhaseCount][kFilterSize] = {
- { 0, 0, 15360, 0, 0, 0, 0, 0 },
- { 6640, 41601, 15360, 8898, 39671, 0, 0, 0 },
- { 7796, 42592, 15357, 9955, 40695, 0, 0, 0 },
- { 8321, 43167, 15351, 10576, 41286, 4121, 0, 0 },
- { 8702, 43537, 15346, 11058, 41797, 4121, 0, 0 },
- { 9029, 43871, 15339, 11408, 42146, 4121, 0, 0 },
- { 9280, 44112, 15328, 11672, 42402, 5145, 0, 0 },
- { 9411, 44256, 15316, 11944, 42690, 5669, 0, 0 },
- { 9535, 44401, 15304, 12216, 42979, 6169, 0, 0 },
- { 9667, 44528, 15288, 12396, 43137, 6378, 0, 0 },
- { 9758, 44656, 15273, 12540, 43282, 6640, 0, 0 },
- { 9857, 44768, 15255, 12688, 43423, 6903, 0, 0 },
- { 9922, 44872, 15235, 12844, 43583, 7297, 0, 0 },
- { 10014, 44959, 15213, 13000, 43744, 7429, 0, 0 },
- { 10079, 45048, 15190, 13156, 43888, 7691, 0, 0 },
- { 10112, 45092, 15167, 13316, 44040, 7796, 0, 0 },
- { 10178, 45124, 15140, 13398, 44120, 8058, 0, 0 },
- { 10211, 45152, 15112, 13482, 44201, 8256, 0, 0 },
- { 10211, 45180, 15085, 13566, 44279, 8387, 0, 0 },
- { 10242, 45200, 15054, 13652, 44360, 8518, 0, 0 },
- { 10242, 45216, 15023, 13738, 44440, 8636, 0, 0 },
- { 10242, 45228, 14990, 13826, 44520, 8767, 0, 0 },
- { 10242, 45236, 14955, 13912, 44592, 8964, 0, 0 },
- { 10211, 45244, 14921, 14002, 44673, 9082, 0, 0 },
- { 10178, 45244, 14885, 14090, 44745, 9213, 0, 0 },
- { 10145, 45244, 14849, 14178, 44817, 9280, 0, 0 },
- { 10112, 45236, 14810, 14266, 44887, 9378, 0, 0 },
- { 10079, 45228, 14770, 14346, 44953, 9437, 0, 0 },
- { 10014, 45216, 14731, 14390, 45017, 9503, 0, 0 },
- { 9981, 45204, 14689, 14434, 45064, 9601, 0, 0 },
- { 9922, 45188, 14649, 14478, 45096, 9667, 0, 0 },
- { 9857, 45168, 14607, 14521, 45120, 9726, 0, 0 },
- { 9791, 45144, 14564, 14564, 45144, 9791, 0, 0 },
- { 9726, 45120, 14521, 14607, 45168, 9857, 0, 0 },
- { 9667, 45096, 14478, 14649, 45188, 9922, 0, 0 },
- { 9601, 45064, 14434, 14689, 45204, 9981, 0, 0 },
- { 9503, 45017, 14390, 14731, 45216, 10014, 0, 0 },
- { 9437, 44953, 14346, 14770, 45228, 10079, 0, 0 },
- { 9378, 44887, 14266, 14810, 45236, 10112, 0, 0 },
- { 9280, 44817, 14178, 14849, 45244, 10145, 0, 0 },
- { 9213, 44745, 14090, 14885, 45244, 10178, 0, 0 },
- { 9082, 44673, 14002, 14921, 45244, 10211, 0, 0 },
- { 8964, 44592, 13912, 14955, 45236, 10242, 0, 0 },
- { 8767, 44520, 13826, 14990, 45228, 10242, 0, 0 },
- { 8636, 44440, 13738, 15023, 45216, 10242, 0, 0 },
- { 8518, 44360, 13652, 15054, 45200, 10242, 0, 0 },
- { 8387, 44279, 13566, 15085, 45180, 10211, 0, 0 },
- { 8256, 44201, 13482, 15112, 45152, 10211, 0, 0 },
- { 8058, 44120, 13398, 15140, 45124, 10178, 0, 0 },
- { 7796, 44040, 13316, 15167, 45092, 10112, 0, 0 },
- { 7691, 43888, 13156, 15190, 45048, 10079, 0, 0 },
- { 7429, 43744, 13000, 15213, 44959, 10014, 0, 0 },
- { 7297, 43583, 12844, 15235, 44872, 9922, 0, 0 },
- { 6903, 43423, 12688, 15255, 44768, 9857, 0, 0 },
- { 6640, 43282, 12540, 15273, 44656, 9758, 0, 0 },
- { 6378, 43137, 12396, 15288, 44528, 9667, 0, 0 },
- { 6169, 42979, 12216, 15304, 44401, 9535, 0, 0 },
- { 5669, 42690, 11944, 15316, 44256, 9411, 0, 0 },
- { 5145, 42402, 11672, 15328, 44112, 9280, 0, 0 },
- { 4121, 42146, 11408, 15339, 43871, 9029, 0, 0 },
- { 4121, 41797, 11058, 15346, 43537, 8702, 0, 0 },
- { 4121, 41286, 10576, 15351, 43167, 8321, 0, 0 },
- { 0, 40695, 9955, 15357, 42592, 7796, 0, 0 },
- { 0, 39671, 8898, 15360, 41601, 6640, 0, 0 },
- };
// Same shape as coef_usm, stored as uint16_t.
// NOTE(review): the values appear to be the IEEE 754 binary16 (half-float) bit
// patterns of the matching coef_usm entries (e.g. 47309 == 0xB8CD ~= -0.6001) --
// confirm before regenerating either table.
- constexpr uint16_t coef_usm_fp16[kPhaseCount][kFilterSize] = {
- { 0, 47309, 15565, 47309, 0, 0, 0, 0 },
- { 6640, 47326, 15563, 47289, 39408, 0, 0, 0 },
- { 7429, 47339, 15560, 47266, 40695, 4121, 0, 0 },
- { 8058, 47349, 15554, 47239, 41286, 0, 0, 0 },
- { 8387, 47357, 15545, 47209, 41915, 0, 0, 0 },
- { 8636, 47363, 15534, 47176, 42238, 4121, 0, 0 },
- { 8767, 47364, 15522, 47141, 42657, 4121, 0, 0 },
- { 9029, 47367, 15509, 47105, 43023, 4121, 0, 0 },
- { 9213, 47363, 15490, 47018, 43249, 4121, 0, 0 },
- { 9280, 47357, 15472, 46928, 43472, 5145, 0, 0 },
- { 9345, 47347, 15450, 46836, 43727, 5145, 0, 0 },
- { 9378, 47337, 15427, 46736, 43999, 5669, 0, 0 },
- { 9437, 47323, 15401, 46630, 44152, 5669, 0, 0 },
- { 9470, 47310, 15376, 46520, 44312, 6169, 0, 0 },
- { 9503, 47294, 15338, 46402, 44479, 6378, 0, 0 },
- { 9503, 47272, 15274, 46280, 44648, 6640, 0, 0 },
- { 9503, 47253, 15215, 46158, 44817, 6903, 0, 0 },
- { 9503, 47231, 15150, 45972, 45017, 7165, 0, 0 },
- { 9535, 47206, 15082, 45708, 45132, 7297, 0, 0 },
- { 9503, 47180, 15012, 45432, 45232, 7429, 0, 0 },
- { 9470, 47153, 14939, 45152, 45332, 7560, 0, 0 },
- { 9470, 47126, 14868, 44681, 45444, 7691, 0, 0 },
- { 9437, 47090, 14793, 44071, 45560, 7796, 0, 0 },
- { 9411, 47030, 14714, 42847, 45668, 7927, 0, 0 },
- { 9411, 46968, 14635, 8387, 45788, 8058, 0, 0 },
- { 9345, 46902, 14552, 10786, 45908, 8256, 0, 0 },
- { 9313, 46846, 14478, 11647, 46036, 8321, 0, 0 },
- { 9247, 46776, 14394, 12292, 46120, 8453, 0, 0 },
- { 9247, 46714, 14288, 12620, 46184, 8518, 0, 0 },
- { 9147, 46648, 14130, 12936, 46248, 8570, 0, 0 },
- { 9029, 46576, 13956, 13268, 46312, 8702, 0, 0 },
- { 8964, 46512, 13792, 13456, 46378, 8767, 0, 0 },
- { 8898, 46446, 13624, 13624, 46446, 8898, 0, 0 },
- { 8767, 46378, 13456, 13792, 46512, 8964, 0, 0 },
- { 8702, 46312, 13268, 13956, 46576, 9029, 0, 0 },
- { 8570, 46248, 12936, 14130, 46648, 9147, 0, 0 },
- { 8518, 46184, 12620, 14288, 46714, 9247, 0, 0 },
- { 8453, 46120, 12292, 14394, 46776, 9247, 0, 0 },
- { 8321, 46036, 11647, 14478, 46846, 9313, 0, 0 },
- { 8256, 45908, 10786, 14552, 46902, 9345, 0, 0 },
- { 8058, 45788, 8387, 14635, 46968, 9411, 0, 0 },
- { 7927, 45668, 42847, 14714, 47030, 9411, 0, 0 },
- { 7796, 45560, 44071, 14793, 47090, 9437, 0, 0 },
- { 7691, 45444, 44681, 14868, 47126, 9470, 0, 0 },
- { 7560, 45332, 45152, 14939, 47153, 9470, 0, 0 },
- { 7429, 45232, 45432, 15012, 47180, 9503, 0, 0 },
- { 7297, 45132, 45708, 15082, 47206, 9535, 0, 0 },
- { 7165, 45017, 45972, 15150, 47231, 9503, 0, 0 },
- { 6903, 44817, 46158, 15215, 47253, 9503, 0, 0 },
- { 6640, 44648, 46280, 15274, 47272, 9503, 0, 0 },
- { 6378, 44479, 46402, 15338, 47294, 9503, 0, 0 },
- { 6169, 44312, 46520, 15376, 47310, 9470, 0, 0 },
- { 5669, 44152, 46630, 15401, 47323, 9437, 0, 0 },
- { 5669, 43999, 46736, 15427, 47337, 9378, 0, 0 },
- { 5145, 43727, 46836, 15450, 47347, 9345, 0, 0 },
- { 5145, 43472, 46928, 15472, 47357, 9280, 0, 0 },
- { 4121, 43249, 47018, 15490, 47363, 9213, 0, 0 },
- { 4121, 43023, 47105, 15509, 47367, 9029, 0, 0 },
- { 4121, 42657, 47141, 15522, 47364, 8767, 0, 0 },
- { 4121, 42238, 47176, 15534, 47363, 8636, 0, 0 },
- { 0, 41915, 47209, 15545, 47357, 8387, 0, 0 },
- { 0, 41286, 47239, 15554, 47349, 8058, 0, 0 },
- { 4121, 40695, 47266, 15560, 47339, 7429, 0, 0 },
- { 0, 39408, 47289, 15563, 47326, 6640, 0, 0 },
- };
- }
|