/*
 * Copyright 2012-17 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: AMD
 *
 */

#include "reg_helper.h"
#include "fixed31_32.h"
#include "resource.h"
#include "dwb.h"
#include "dcn20_dwb.h"

#define NUM_PHASES 16
#define HORZ_MAX_TAPS 12
#define VERT_MAX_TAPS 12

#define REG(reg)\
	dwbc20->dwbc_regs->reg

#define CTX \
	dwbc20->base.ctx

#undef FN
#define FN(reg_name, field_name) \
	dwbc20->dwbc_shift->field_name, dwbc20->dwbc_mask->field_name

#define TO_DCN20_DWBC(dwbc_base) \
	container_of(dwbc_base, struct dcn20_dwbc, base)

/*
 * Scaler coefficient tables.
 *
 * One table exists per tap count (3..12) and per ratio bucket (upscale,
 * 117, 150, 183; see wbscl_select_filter_by_ratio() for the thresholds).
 * Each table holds (NUM_PHASES / 2 + 1) = 9 rows of <taps> coefficients and
 * is read by wbscl_set_scaler_filter() as filter[phase * taps + tap]; the
 * rows below are laid out one phase per line.
 *
 * NOTE(review): values close to 16384 presumably encode negative
 * coefficients in a 14-bit two's complement format - confirm against the
 * register specification.
 */
static const uint16_t filter_3tap_16p_upscale[27] = {
	2048, 2048, 0,
	1708, 2424, 16348,
	1372, 2796, 16308,
	1056, 3148, 16272,
	768, 3464, 16244,
	512, 3728, 16236,
	296, 3928, 16252,
	124, 4052, 16296,
	0, 4096, 0
};

static const uint16_t filter_3tap_16p_117[27] = {
	2048, 2048, 0,
	1824, 2276, 16376,
	1600, 2496, 16380,
	1376, 2700, 16,
	1156, 2880, 52,
	948, 3032, 108,
	756, 3144, 192,
	580, 3212, 296,
	428, 3236, 428
};

static const uint16_t filter_3tap_16p_150[27] = {
	2048, 2048, 0,
	1872, 2184, 36,
	1692, 2308, 88,
	1516, 2420, 156,
	1340, 2516, 236,
	1168, 2592, 328,
	1004, 2648, 440,
	844, 2684, 560,
	696, 2696, 696
};

static const uint16_t filter_3tap_16p_183[27] = {
	2048, 2048, 0,
	1892, 2104, 92,
	1744, 2152, 196,
	1592, 2196, 300,
	1448, 2232, 412,
	1304, 2256, 528,
	1168, 2276, 648,
	1032, 2288, 772,
	900, 2292, 900
};

static const uint16_t filter_4tap_16p_upscale[36] = {
	0, 4096, 0, 0,
	16240, 4056, 180, 16380,
	16136, 3952, 404, 16364,
	16072, 3780, 664, 16344,
	16040, 3556, 952, 16312,
	16036, 3284, 1268, 16272,
	16052, 2980, 1604, 16224,
	16084, 2648, 1952, 16176,
	16128, 2304, 2304, 16128
};

static const uint16_t filter_4tap_16p_117[36] = {
	428, 3236, 428, 0,
	276, 3232, 604, 16364,
	148, 3184, 800, 16340,
	44, 3104, 1016, 16312,
	16344, 2984, 1244, 16284,
	16284, 2832, 1488, 16256,
	16244, 2648, 1732, 16236,
	16220, 2440, 1976, 16220,
	16212, 2216, 2216, 16212
};

static const uint16_t filter_4tap_16p_150[36] = {
	696, 2700, 696, 0,
	560, 2700, 848, 16364,
	436, 2676, 1008, 16348,
	328, 2628, 1180, 16336,
	232, 2556, 1356, 16328,
	152, 2460, 1536, 16328,
	84, 2344, 1716, 16332,
	28, 2208, 1888, 16348,
	16376, 2052, 2052, 16376
};

static const uint16_t filter_4tap_16p_183[36] = {
	940, 2208, 940, 0,
	832, 2200, 1052, 4,
	728, 2180, 1164, 16,
	628, 2148, 1280, 36,
	536, 2100, 1392, 60,
	448, 2044, 1504, 92,
	368, 1976, 1612, 132,
	296, 1900, 1716, 176,
	232, 1812, 1812, 232
};

static const uint16_t filter_5tap_16p_upscale[45] = {
	15936, 2496, 2496, 15936, 0,
	15992, 2128, 2832, 15896, 12,
	16056, 1760, 3140, 15876, 24,
	16120, 1404, 3420, 15876, 36,
	16188, 1060, 3652, 15908, 44,
	16248, 744, 3844, 15972, 44,
	16304, 460, 3980, 16072, 40,
	16348, 212, 4064, 16208, 24,
	0, 0, 4096, 0, 0,
};

static const uint16_t filter_5tap_16p_117[45] = {
	16056, 2372, 2372, 16056, 0,
	16052, 2124, 2600, 16076, 0,
	16060, 1868, 2808, 16120, 0,
	16080, 1612, 2992, 16180, 16376,
	16112, 1356, 3144, 16268, 16364,
	16144, 1108, 3268, 16376, 16344,
	16184, 872, 3356, 124, 16320,
	16220, 656, 3412, 276, 16292,
	16256, 456, 3428, 456, 16256,
};

static const uint16_t filter_5tap_16p_150[45] = {
	16368, 2064, 2064, 16368, 0,
	16316, 1924, 2204, 44, 16372,
	16280, 1772, 2328, 116, 16356,
	16256, 1616, 2440, 204, 16340,
	16240, 1456, 2536, 304, 16320,
	16232, 1296, 2612, 416, 16300,
	16232, 1132, 2664, 544, 16284,
	16240, 976, 2700, 680, 16264,
	16248, 824, 2708, 824, 16248,
};

static const uint16_t filter_5tap_16p_183[45] = {
	228, 1816, 1816, 228, 0,
	168, 1728, 1904, 300, 16372,
	116, 1632, 1988, 376, 16360,
	72, 1528, 2060, 460, 16348,
	36, 1424, 2120, 552, 16340,
	4, 1312, 2168, 652, 16336,
	16368, 1200, 2204, 752, 16332,
	16352, 1084, 2224, 860, 16332,
	16340, 972, 2232, 972, 16340,
};

static const uint16_t filter_6tap_16p_upscale[54] = {
	0, 0, 4092, 0, 0, 0,
	44, 16188, 4064, 228, 16324, 0,
	80, 16036, 3980, 492, 16256, 4,
	108, 15916, 3844, 788, 16184, 16,
	120, 15836, 3656, 1108, 16104, 28,
	128, 15792, 3420, 1448, 16024, 44,
	124, 15776, 3144, 1800, 15948, 64,
	112, 15792, 2836, 2152, 15880, 80,
	100, 15828, 2504, 2504, 15828, 100,
};

static const uint16_t filter_6tap_16p_117[54] = {
	16168, 476, 3568, 476, 16168, 0,
	16216, 280, 3540, 692, 16116, 8,
	16264, 104, 3472, 924, 16068, 16,
	16304, 16340, 3372, 1168, 16024, 28,
	16344, 16212, 3236, 1424, 15988, 36,
	16372, 16112, 3072, 1680, 15956, 44,
	12, 16036, 2880, 1936, 15940, 48,
	28, 15984, 2668, 2192, 15936, 48,
	40, 15952, 2436, 2436, 15952, 40,
};

static const uint16_t filter_6tap_16p_150[54] = {
	16148, 920, 2724, 920, 16148, 0,
	16156, 768, 2712, 1072, 16144, 0,
	16172, 628, 2684, 1232, 16148, 16380,
	16192, 492, 2632, 1388, 16160, 16372,
	16212, 368, 2564, 1548, 16180, 16364,
	16232, 256, 2480, 1704, 16212, 16352,
	16256, 156, 2380, 1856, 16256, 16336,
	16276, 64, 2268, 2004, 16308, 16320,
	16300, 16372, 2140, 2140, 16372, 16300,
};

static const uint16_t filter_6tap_16p_183[54] = {
	16296, 1032, 2196, 1032, 16296, 0,
	16284, 924, 2196, 1144, 16320, 16376,
	16272, 820, 2180, 1256, 16348, 16364,
	16268, 716, 2156, 1364, 16380, 16352,
	16264, 620, 2116, 1472, 36, 16340,
	16268, 524, 2068, 1576, 88, 16328,
	16272, 436, 2008, 1680, 144, 16316,
	16280, 352, 1940, 1772, 204, 16304,
	16292, 276, 1860, 1860, 276, 16292,
};

static const uint16_t filter_7tap_16p_upscale[63] = {
	176, 15760, 2488, 2488, 15760, 176, 0,
	160, 15812, 2152, 2816, 15728, 192, 16376,
	136, 15884, 1812, 3124, 15720, 196, 16368,
	108, 15964, 1468, 3400, 15740, 196, 16364,
	84, 16048, 1132, 3640, 15792, 180, 16360,
	56, 16140, 812, 3832, 15884, 152, 16360,
	32, 16228, 512, 3976, 16012, 116, 16364,
	12, 16308, 240, 4064, 16180, 60, 16372,
	0, 0, 0, 4096, 0, 0, 0,
};

static const uint16_t filter_7tap_16p_117[63] = {
	92, 15868, 2464, 2464, 15868, 92, 0,
	108, 15852, 2216, 2700, 15904, 72, 0,
	112, 15856, 1960, 2916, 15964, 44, 0,
	116, 15876, 1696, 3108, 16048, 8, 8,
	112, 15908, 1428, 3268, 16156, 16348, 12,
	104, 15952, 1168, 3400, 16288, 16300, 24,
	92, 16004, 916, 3496, 64, 16244, 36,
	80, 16064, 676, 3556, 248, 16184, 48,
	64, 16124, 452, 3576, 452, 16124, 64,
};

static const uint16_t filter_7tap_16p_150[63] = {
	16224, 16380, 2208, 2208, 16380, 16224, 0,
	16252, 16304, 2072, 2324, 84, 16196, 4,
	16276, 16240, 1924, 2432, 184, 16172, 8,
	16300, 16184, 1772, 2524, 296, 16144, 12,
	16324, 16144, 1616, 2600, 416, 16124, 12,
	16344, 16112, 1456, 2660, 548, 16104, 12,
	16360, 16092, 1296, 2704, 688, 16088, 12,
	16372, 16080, 1140, 2732, 832, 16080, 8,
	0, 16076, 984, 2740, 984, 16076, 0,
};

static const uint16_t filter_7tap_16p_183[63] = {
	16216, 324, 1884, 1884, 324, 16216, 0,
	16228, 248, 1804, 1960, 408, 16212, 16380,
	16240, 176, 1716, 2028, 496, 16208, 16376,
	16252, 112, 1624, 2084, 588, 16208, 16372,
	16264, 56, 1524, 2132, 684, 16212, 16364,
	16280, 4, 1424, 2168, 788, 16220, 16356,
	16292, 16344, 1320, 2196, 892, 16232, 16344,
	16308, 16308, 1212, 2212, 996, 16252, 16332,
	16320, 16276, 1104, 2216, 1104, 16276, 16320,
};

static const uint16_t filter_8tap_16p_upscale[72] = {
	0, 0, 0, 4096, 0, 0, 0, 0,
	16360, 76, 16172, 4064, 244, 16296, 24, 16380,
	16340, 136, 15996, 3980, 524, 16204, 56, 16380,
	16328, 188, 15860, 3844, 828, 16104, 92, 16372,
	16320, 224, 15760, 3656, 1156, 16008, 128, 16368,
	16320, 248, 15696, 3428, 1496, 15912, 160, 16360,
	16320, 256, 15668, 3156, 1844, 15828, 192, 16348,
	16324, 256, 15672, 2856, 2192, 15756, 220, 16340,
	16332, 244, 15704, 2532, 2532, 15704, 244, 16332,
};

static const uint16_t filter_8tap_16p_117[72] = {
	116, 16100, 428, 3564, 428, 16100, 116, 0,
	96, 16168, 220, 3548, 656, 16032, 136, 16376,
	76, 16236, 32, 3496, 904, 15968, 152, 16372,
	56, 16300, 16252, 3408, 1164, 15908, 164, 16368,
	36, 16360, 16116, 3284, 1428, 15856, 172, 16364,
	20, 28, 16000, 3124, 1700, 15820, 176, 16364,
	4, 76, 15912, 2940, 1972, 15800, 172, 16364,
	16380, 112, 15848, 2724, 2236, 15792, 160, 16364,
	16372, 140, 15812, 2488, 2488, 15812, 140, 16372,
};

static const uint16_t filter_8tap_16p_150[72] = {
	16380, 16020, 1032, 2756, 1032, 16020, 16380, 0,
	12, 16020, 876, 2744, 1184, 16032, 16364, 4,
	24, 16028, 728, 2716, 1344, 16052, 16340, 8,
	36, 16040, 584, 2668, 1500, 16080, 16316, 16,
	40, 16060, 448, 2608, 1652, 16120, 16288, 20,
	44, 16080, 320, 2528, 1804, 16168, 16260, 28,
	48, 16108, 204, 2436, 1948, 16232, 16228, 32,
	44, 16136, 100, 2328, 2084, 16304, 16200, 40,
	44, 16168, 4, 2212, 2212, 4, 16168, 44,
};

static const uint16_t filter_8tap_16p_183[72] = {
	16264, 16264, 1164, 2244, 1164, 16264, 16264, 0,
	16280, 16232, 1056, 2236, 1268, 16300, 16248, 0,
	16296, 16204, 948, 2220, 1372, 16348, 16232, 0,
	16312, 16184, 844, 2192, 1472, 12, 16216, 4,
	16328, 16172, 740, 2156, 1572, 72, 16200, 0,
	16340, 16160, 640, 2108, 1668, 136, 16188, 0,
	16352, 16156, 544, 2052, 1756, 204, 16176, 16380,
	16360, 16156, 452, 1988, 1840, 280, 16164, 16376,
	16368, 16160, 364, 1920, 1920, 364, 16160, 16368,
};

static const uint16_t filter_9tap_16p_upscale[81] = {
	16284, 296, 15660, 2572, 2572, 15660, 296, 16284, 0,
	16296, 272, 15712, 2228, 2896, 15632, 304, 16276, 4,
	16308, 240, 15788, 1876, 3192, 15632, 304, 16276, 4,
	16320, 204, 15876, 1520, 3452, 15664, 288, 16280, 8,
	16336, 164, 15976, 1176, 3676, 15732, 260, 16288, 12,
	16348, 120, 16080, 844, 3856, 15840, 216, 16300, 12,
	16364, 76, 16188, 532, 3988, 15984, 156, 16324, 8,
	16376, 36, 16288, 252, 4068, 16164, 84, 16352, 4,
	0, 0, 0, 0, 4096, 0, 0, 0, 0,
};

static const uint16_t filter_9tap_16p_117[81] = {
	16356, 172, 15776, 2504, 2504, 15776, 172, 16356, 0,
	16344, 200, 15756, 2252, 2740, 15816, 136, 16372, 16380,
	16336, 216, 15756, 1988, 2956, 15884, 92, 8, 16380,
	16332, 224, 15780, 1720, 3144, 15976, 40, 28, 16376,
	16328, 224, 15816, 1448, 3304, 16096, 16364, 52, 16372,
	16328, 216, 15868, 1180, 3432, 16240, 16296, 80, 16364,
	16332, 200, 15928, 916, 3524, 24, 16224, 108, 16356,
	16336, 184, 15996, 668, 3580, 220, 16148, 132, 16352,
	16344, 160, 16072, 436, 3600, 436, 16072, 160, 16344,
};

static const uint16_t filter_9tap_16p_150[81] = {
	84, 16128, 0, 2216, 2216, 0, 16128, 84, 0,
	80, 16160, 16296, 2088, 2332, 100, 16092, 84, 0,
	76, 16196, 16220, 1956, 2432, 208, 16064, 80, 0,
	72, 16232, 16152, 1812, 2524, 328, 16036, 76, 4,
	64, 16264, 16096, 1664, 2600, 460, 16012, 64, 8,
	56, 16300, 16052, 1508, 2656, 596, 15996, 52, 12,
	48, 16328, 16020, 1356, 2700, 740, 15984, 36, 20,
	40, 16356, 15996, 1196, 2728, 888, 15980, 20, 24,
	32, 0, 15984, 1044, 2736, 1044, 15984, 0, 32,
};

static const uint16_t filter_9tap_16p_183[81] = {
	16356, 16112, 388, 1952, 1952, 388, 16112, 16356, 0,
	16368, 16116, 304, 1876, 2020, 480, 16112, 16344, 4,
	16376, 16124, 224, 1792, 2080, 576, 16116, 16328, 8,
	0, 16136, 148, 1700, 2132, 672, 16124, 16312, 8,
	8, 16148, 80, 1604, 2176, 772, 16140, 16296, 12,
	12, 16164, 16, 1504, 2208, 876, 16156, 16276, 16,
	16, 16180, 16344, 1404, 2232, 980, 16184, 16256, 20,
	20, 16200, 16296, 1300, 2244, 1088, 16212, 16240, 20,
	20, 16220, 16252, 1196, 2252, 1196, 16252, 16220, 20,
};

static const uint16_t filter_10tap_16p_upscale[90] = {
	0, 0, 0, 0, 4096, 0, 0, 0, 0, 0,
	12, 16344, 88, 16160, 4068, 252, 16280, 44, 16368, 0,
	24, 16308, 168, 15976, 3988, 540, 16176, 92, 16348, 0,
	32, 16280, 236, 15828, 3852, 852, 16064, 140, 16328, 4,
	36, 16260, 284, 15720, 3672, 1184, 15956, 188, 16308, 8,
	36, 16244, 320, 15648, 3448, 1528, 15852, 236, 16288, 12,
	36, 16240, 336, 15612, 3184, 1880, 15764, 276, 16272, 20,
	32, 16240, 340, 15608, 2888, 2228, 15688, 308, 16256, 24,
	28, 16244, 332, 15636, 2568, 2568, 15636, 332, 16244, 28,
};

static const uint16_t filter_10tap_16p_117[90] = {
	16308, 196, 16048, 440, 3636, 440, 16048, 196, 16308, 0,
	16316, 164, 16132, 220, 3612, 676, 15972, 220, 16300, 0,
	16324, 132, 16212, 20, 3552, 932, 15900, 240, 16296, 4,
	16336, 100, 16292, 16232, 3456, 1192, 15836, 256, 16296, 4,
	16348, 68, 16364, 16084, 3324, 1464, 15784, 264, 16296, 8,
	16356, 36, 48, 15960, 3164, 1736, 15748, 260, 16304, 4,
	16364, 8, 108, 15864, 2972, 2008, 15728, 252, 16312, 4,
	16372, 16368, 160, 15792, 2756, 2268, 15724, 228, 16328, 0,
	16380, 16344, 200, 15748, 2520, 2520, 15748, 200, 16344, 16380,
};

static const uint16_t filter_10tap_16p_150[90] = {
	64, 0, 15956, 1048, 2716, 1048, 15956, 0, 64, 0,
	52, 24, 15952, 896, 2708, 1204, 15972, 16356, 72, 16380,
	44, 48, 15952, 748, 2684, 1360, 16000, 16320, 84, 16380,
	32, 68, 15964, 604, 2644, 1516, 16032, 16288, 92, 16376,
	24, 88, 15980, 464, 2588, 1668, 16080, 16248, 100, 16376,
	16, 100, 16004, 332, 2516, 1816, 16140, 16212, 108, 16376,
	8, 108, 16032, 212, 2428, 1956, 16208, 16172, 112, 16376,
	4, 116, 16060, 100, 2328, 2092, 16288, 16132, 116, 16380,
	0, 116, 16096, 16380, 2216, 2216, 16380, 16096, 116, 0,
};

static const uint16_t filter_10tap_16p_183[90] = {
	40, 16180, 16240, 1216, 2256, 1216, 16240, 16180, 40, 0,
	44, 16204, 16200, 1112, 2252, 1320, 16288, 16160, 36, 0,
	44, 16224, 16168, 1004, 2236, 1424, 16344, 16144, 28, 4,
	44, 16248, 16136, 900, 2208, 1524, 16, 16124, 24, 8,
	44, 16268, 16116, 796, 2176, 1620, 84, 16108, 12, 12,
	40, 16288, 16100, 692, 2132, 1712, 156, 16096, 4, 16,
	36, 16308, 16088, 592, 2080, 1796, 232, 16088, 16376, 20,
	32, 16328, 16080, 496, 2020, 1876, 316, 16080, 16360, 24,
	28, 16344, 16080, 404, 1952, 1952, 404, 16080, 16344, 28,
};

static const uint16_t filter_11tap_16p_upscale[99] = {
	60, 16216, 356, 15620, 2556, 2556, 15620, 356, 16216, 60, 0,
	52, 16224, 336, 15672, 2224, 2876, 15592, 368, 16208, 64, 16380,
	44, 16244, 304, 15744, 1876, 3176, 15596, 364, 16212, 64, 16376,
	36, 16264, 260, 15836, 1532, 3440, 15636, 340, 16220, 60, 16376,
	28, 16288, 212, 15940, 1188, 3668, 15708, 304, 16236, 56, 16376,
	20, 16312, 160, 16052, 856, 3848, 15820, 248, 16264, 48, 16376,
	12, 16336, 104, 16164, 544, 3984, 15968, 180, 16296, 36, 16376,
	4, 16360, 48, 16276, 256, 4068, 16160, 96, 16336, 16, 16380,
	0, 0, 0, 0, 0, 4096, 0, 0, 0, 0, 0,
};

static const uint16_t filter_11tap_16p_117[99] = {
	16380, 16332, 220, 15728, 2536, 2536, 15728, 220, 16332, 16380, 0,
	4, 16308, 256, 15704, 2280, 2768, 15772, 176, 16360, 16368, 0,
	12, 16292, 280, 15704, 2016, 2984, 15848, 120, 8, 16356, 0,
	20, 16276, 292, 15724, 1744, 3172, 15948, 56, 40, 16340, 4,
	24, 16268, 292, 15760, 1468, 3328, 16072, 16368, 80, 16324, 8,
	24, 16264, 288, 15816, 1196, 3456, 16224, 16288, 116, 16312, 12,
	24, 16264, 272, 15880, 932, 3548, 16, 16208, 152, 16296, 16,
	24, 16268, 248, 15956, 676, 3604, 216, 16120, 188, 16284, 20,
	24, 16276, 220, 16036, 436, 3624, 436, 16036, 220, 16276, 24,
};

static const uint16_t filter_11tap_16p_150[99] = {
	0, 144, 16072, 0, 2212, 2212, 0, 16072, 144, 0, 0,
	16376, 144, 16112, 16288, 2092, 2324, 104, 16036, 140, 8, 16380,
	16368, 144, 16152, 16204, 1960, 2424, 216, 16004, 132, 16, 16376,
	16364, 140, 16192, 16132, 1820, 2512, 340, 15976, 116, 28, 16376,
	16364, 132, 16232, 16072, 1676, 2584, 476, 15952, 100, 40, 16372,
	16360, 124, 16272, 16020, 1528, 2644, 612, 15936, 80, 52, 16368,
	16360, 116, 16312, 15980, 1372, 2684, 760, 15928, 56, 64, 16364,
	16360, 104, 16348, 15952, 1216, 2712, 908, 15928, 28, 76, 16364,
	16360, 92, 0, 15936, 1064, 2720, 1064, 15936, 0, 92, 16360,
};

static const uint16_t filter_11tap_16p_183[99] = {
	60, 16336, 16052, 412, 1948, 1948, 412, 16052, 16336, 60, 0,
	56, 16356, 16052, 324, 1876, 2016, 504, 16056, 16316, 64, 0,
	48, 16372, 16060, 240, 1796, 2072, 604, 16064, 16292, 64, 0,
	44, 4, 16068, 160, 1712, 2124, 700, 16080, 16272, 68, 0,
	40, 20, 16080, 84, 1620, 2164, 804, 16096, 16248, 68, 4,
	32, 32, 16096, 16, 1524, 2200, 908, 16124, 16224, 68, 4,
	28, 40, 16112, 16340, 1428, 2220, 1012, 16152, 16200, 64, 8,
	24, 52, 16132, 16284, 1328, 2236, 1120, 16192, 16176, 64, 12,
	16, 56, 16156, 16236, 1224, 2240, 1224, 16236, 16156, 56, 16,
};

static const uint16_t filter_12tap_16p_upscale[108] = {
	0, 0, 0, 0, 0, 4096, 0, 0, 0, 0, 0, 0,
	16376, 24, 16332, 100, 16156, 4068, 260, 16272, 56, 16356, 8, 0,
	16368, 44, 16284, 188, 15964, 3988, 548, 16156, 112, 16328, 20, 16380,
	16360, 64, 16248, 260, 15812, 3856, 864, 16040, 172, 16296, 32, 16380,
	16360, 76, 16216, 320, 15696, 3672, 1196, 15928, 228, 16268, 44, 16376,
	16356, 84, 16196, 360, 15620, 3448, 1540, 15820, 280, 16240, 56, 16372,
	16356, 88, 16184, 384, 15580, 3188, 1888, 15728, 324, 16216, 68, 16368,
	16360, 88, 16180, 392, 15576, 2892, 2236, 15652, 360, 16200, 80, 16364,
	16360, 84, 16188, 384, 15600, 2576, 2576, 15600, 384, 16188, 84, 16360,
};

static const uint16_t filter_12tap_16p_117[108] = {
	48, 16248, 240, 16028, 436, 3612, 436, 16028, 240, 16248, 48, 0,
	44, 16260, 208, 16116, 212, 3596, 676, 15944, 272, 16240, 48, 16380,
	40, 16276, 168, 16204, 12, 3540, 932, 15868, 296, 16240, 48, 16380,
	36, 16292, 128, 16288, 16220, 3452, 1196, 15800, 312, 16240, 44, 16380,
	28, 16308, 84, 16372, 16064, 3324, 1472, 15748, 316, 16244, 40, 16380,
	24, 16328, 44, 64, 15936, 3168, 1744, 15708, 312, 16256, 32, 16380,
	16, 16344, 8, 132, 15836, 2980, 2016, 15688, 300, 16272, 20, 0,
	12, 16364, 16356, 188, 15760, 2768, 2280, 15688, 272, 16296, 8, 4,
	8, 16380, 16324, 236, 15712, 2532, 2532, 15712, 236, 16324, 16380, 8,
};

static const uint16_t filter_12tap_16p_150[108] = {
	16340, 116, 0, 15916, 1076, 2724, 1076, 15916, 0, 116, 16340, 0,
	16340, 100, 32, 15908, 920, 2716, 1232, 15936, 16344, 128, 16340, 0,
	16344, 84, 64, 15908, 772, 2692, 1388, 15968, 16304, 140, 16344, 16380,
	16344, 68, 92, 15912, 624, 2652, 1540, 16008, 16264, 152, 16344, 16380,
	16348, 52, 112, 15928, 484, 2592, 1688, 16060, 16220, 160, 16348, 16380,
	16352, 40, 132, 15952, 348, 2520, 1836, 16124, 16176, 168, 16356, 16376,
	16356, 24, 148, 15980, 224, 2436, 1976, 16200, 16132, 172, 16364, 16372,
	16360, 12, 160, 16012, 108, 2336, 2104, 16288, 16088, 172, 16372, 16368,
	16364, 0, 168, 16048, 0, 2228, 2228, 0, 16048, 168, 0, 16364,
};

static const uint16_t filter_12tap_16p_183[108] = {
	36, 72, 16132, 16228, 1224, 2224, 1224, 16228, 16132, 72, 36, 0,
	28, 80, 16156, 16184, 1120, 2224, 1328, 16280, 16112, 64, 40, 16380,
	24, 84, 16180, 16144, 1016, 2208, 1428, 16340, 16092, 52, 48, 16380,
	16, 88, 16208, 16112, 912, 2188, 1524, 16, 16072, 36, 56, 16380,
	12, 92, 16232, 16084, 812, 2156, 1620, 88, 16056, 24, 64, 16380,
	8, 92, 16256, 16064, 708, 2116, 1708, 164, 16044, 4, 68, 16380,
	4, 88, 16280, 16048, 608, 2068, 1792, 244, 16036, 16372, 76, 16380,
	0, 88, 16308, 16036, 512, 2008, 1872, 328, 16032, 16352, 80, 16380,
	0, 84, 16328, 16032, 416, 1944, 1944, 416, 16032, 16328, 84, 0,
};

/*
 * Pick one of four coefficient sets for a given scaling ratio:
 * ratio < 1 -> upscale, ratio < 4/3 -> 117, ratio < 5/3 -> 150, else 183.
 */
static const uint16_t *wbscl_select_filter_by_ratio(
		struct fixed31_32 ratio,
		const uint16_t *upscale,
		const uint16_t *ratio_117,
		const uint16_t *ratio_150,
		const uint16_t *ratio_183)
{
	if (ratio.value < dc_fixpt_one.value)
		return upscale;
	if (ratio.value < dc_fixpt_from_fraction(4, 3).value)
		return ratio_117;
	if (ratio.value < dc_fixpt_from_fraction(5, 3).value)
		return ratio_150;
	return ratio_183;
}

/* Return the 3-tap coefficient table matching @ratio. */
const uint16_t *wbscl_get_filter_3tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_3tap_16p_upscale, filter_3tap_16p_117,
			filter_3tap_16p_150, filter_3tap_16p_183);
}

/* Return the 4-tap coefficient table matching @ratio. */
const uint16_t *wbscl_get_filter_4tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_4tap_16p_upscale, filter_4tap_16p_117,
			filter_4tap_16p_150, filter_4tap_16p_183);
}

/* Return the 5-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_5tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_5tap_16p_upscale, filter_5tap_16p_117,
			filter_5tap_16p_150, filter_5tap_16p_183);
}

/* Return the 6-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_6tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_6tap_16p_upscale, filter_6tap_16p_117,
			filter_6tap_16p_150, filter_6tap_16p_183);
}

/* Return the 7-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_7tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_7tap_16p_upscale, filter_7tap_16p_117,
			filter_7tap_16p_150, filter_7tap_16p_183);
}

/* Return the 8-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_8tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_8tap_16p_upscale, filter_8tap_16p_117,
			filter_8tap_16p_150, filter_8tap_16p_183);
}

/* Return the 9-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_9tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_9tap_16p_upscale, filter_9tap_16p_117,
			filter_9tap_16p_150, filter_9tap_16p_183);
}

/* Return the 10-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_10tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_10tap_16p_upscale, filter_10tap_16p_117,
			filter_10tap_16p_150, filter_10tap_16p_183);
}

/* Return the 11-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_11tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_11tap_16p_upscale, filter_11tap_16p_117,
			filter_11tap_16p_150, filter_11tap_16p_183);
}

/* Return the 12-tap coefficient table matching @ratio. */
static const uint16_t *wbscl_get_filter_12tap_16p(struct fixed31_32 ratio)
{
	return wbscl_select_filter_by_ratio(ratio,
			filter_12tap_16p_upscale, filter_12tap_16p_117,
			filter_12tap_16p_150, filter_12tap_16p_183);
}

/*
 * Look up the coefficient table for a tap count and scaling ratio.
 *
 * Returns NULL for 1 tap (no table exists for it) and, after hitting
 * BREAK_TO_DEBUGGER(), for any tap count outside 1..12. Callers must be
 * prepared for a NULL result.
 */
static const uint16_t *wbscl_get_filter_coeffs_16p(int taps, struct fixed31_32 ratio)
{
	switch (taps) {
	case 12:
		return wbscl_get_filter_12tap_16p(ratio);
	case 11:
		return wbscl_get_filter_11tap_16p(ratio);
	case 10:
		return wbscl_get_filter_10tap_16p(ratio);
	case 9:
		return wbscl_get_filter_9tap_16p(ratio);
	case 8:
		return wbscl_get_filter_8tap_16p(ratio);
	case 7:
		return wbscl_get_filter_7tap_16p(ratio);
	case 6:
		return wbscl_get_filter_6tap_16p(ratio);
	case 5:
		return wbscl_get_filter_5tap_16p(ratio);
	case 4:
		return wbscl_get_filter_4tap_16p(ratio);
	case 3:
		return wbscl_get_filter_3tap_16p(ratio);
	case 2:
		return get_filter_2tap_16p();
	case 1:
		return NULL;
	default:
		/* should never happen, bug */
		BREAK_TO_DEBUGGER();
		return NULL;
	}
}

/*
 * Write one coefficient table into the scaler coefficient RAM.
 *
 * @dwbc20:      write-back controller whose registers are programmed
 * @taps:        number of taps per phase in @filter
 * @filter_type: which coefficient RAM bank (luma/chroma, horz/vert) to fill
 * @filter:      table laid out as filter[phase * taps + tap]; may be NULL
 *
 * Coefficients are written two at a time (even/odd tap pair) for phases
 * 0..NUM_PHASES / 2. For an odd tap count the last pair's odd slot is
 * written as 0.
 */
static void wbscl_set_scaler_filter(
	struct dcn20_dwbc *dwbc20,
	uint32_t taps,
	enum wbscl_coef_filter_type_sel filter_type,
	const uint16_t *filter)
{
	const int tap_pairs = (taps + 1) / 2;
	int phase;
	int pair;
	uint16_t odd_coef, even_coef;

	/*
	 * wbscl_get_filter_coeffs_16p() returns NULL for 1 tap and for
	 * unsupported tap counts; there is no table to program in that case
	 * and indexing it would dereference a NULL pointer.
	 */
	if (!filter)
		return;

	for (phase = 0; phase < (NUM_PHASES / 2 + 1); phase++) {
		for (pair = 0; pair < tap_pairs; pair++) {
			even_coef = filter[phase * taps + 2 * pair];
			if ((pair * 2 + 1) < taps)
				odd_coef = filter[phase * taps + 2 * pair + 1];
			else
				odd_coef = 0;

			/* Select the RAM slot before writing its data */
			REG_SET_3(WBSCL_COEF_RAM_SELECT, 0,
				WBSCL_COEF_RAM_TAP_PAIR_IDX, pair,
				WBSCL_COEF_RAM_PHASE, phase,
				WBSCL_COEF_RAM_FILTER_TYPE, filter_type);

			REG_SET_4(WBSCL_COEF_RAM_TAP_DATA, 0,
				/* Even tap coefficient (bits 1:0 fixed to 0) */
				WBSCL_COEF_RAM_EVEN_TAP_COEF, even_coef,
				/* Write/read control for even coefficient */
				WBSCL_COEF_RAM_EVEN_TAP_COEF_EN, 1,
				/* Odd tap coefficient (bits 1:0 fixed to 0) */
				WBSCL_COEF_RAM_ODD_TAP_COEF, odd_coef,
				/* Write/read control for odd coefficient */
				WBSCL_COEF_RAM_ODD_TAP_COEF_EN, 1);
		}
	}
}

/* Initial filter phase shared by all planes: (ratio + taps + 1) / 2 - taps. */
static struct fixed31_32 wbscl_calc_init_phase(struct fixed31_32 ratio,
		uint32_t taps)
{
	struct fixed31_32 phase = dc_fixpt_add_int(ratio, taps + 1);

	phase = dc_fixpt_div_int(phase, 2);
	return dc_fixpt_sub_int(phase, taps);
}

/*
 * Program the horizontal write-back scaler: scale ratio, tap counts,
 * initial luma/chroma phases and the coefficient RAM.
 *
 * @dwbc20:     write-back controller to program
 * @src_width:  source width
 * @dest_width: destination width; must be non-zero
 * @num_taps:   tap configuration (h_taps and h_taps_c are used)
 *
 * Returns false without touching hardware when @dest_width is 0 (the ratio
 * would divide by zero), true otherwise.
 */
bool dwb_program_horz_scalar(struct dcn20_dwbc *dwbc20,
	uint32_t src_width,
	uint32_t dest_width,
	struct scaling_taps num_taps)
{
	uint32_t h_ratio_luma;
	uint32_t h_ratio_chroma;
	uint32_t h_taps_luma = num_taps.h_taps;
	uint32_t h_taps_chroma = num_taps.h_taps_c;
	int32_t h_init_phase_luma;
	int32_t h_init_phase_chroma;
	uint32_t h_init_phase_luma_int;
	uint32_t h_init_phase_luma_frac;
	uint32_t h_init_phase_chroma_int;
	uint32_t h_init_phase_chroma_frac;
	const uint16_t *filter_h;
	const uint16_t *filter_h_c;
	struct fixed31_32 tmp_h_init_phase_luma;
	struct fixed31_32 tmp_h_init_phase_chroma;
	struct fixed31_32 tmp_h_ratio_luma;

	if (dest_width == 0)
		return false;

	/*Calculate ratio*/
	tmp_h_ratio_luma = dc_fixpt_from_fraction(src_width, dest_width);

	/*
	 * An integer part of 8 is programmed as all ones; presumably because
	 * it does not fit the u3.19 encoding used otherwise.
	 */
	if (dc_fixpt_floor(tmp_h_ratio_luma) == 8)
		h_ratio_luma = -1;
	else
		h_ratio_luma = dc_fixpt_u3d19(tmp_h_ratio_luma) << 5;
	h_ratio_chroma = h_ratio_luma * 2;

	/*Program ratio*/
	REG_UPDATE(WBSCL_HORZ_FILTER_SCALE_RATIO, WBSCL_H_SCALE_RATIO, h_ratio_luma);

	/* Program taps*/
	REG_UPDATE(WBSCL_TAP_CONTROL, WBSCL_H_NUM_OF_TAPS_Y_RGB, h_taps_luma - 1);
	REG_UPDATE(WBSCL_TAP_CONTROL, WBSCL_H_NUM_OF_TAPS_CBCR, h_taps_chroma - 1);

	/* Calculate phase*/
	tmp_h_init_phase_luma = wbscl_calc_init_phase(tmp_h_ratio_luma, h_taps_luma);
	h_init_phase_luma = dc_fixpt_s4d19(tmp_h_init_phase_luma);
	h_init_phase_luma_int = (h_init_phase_luma >> 19) & 0x1f;
	h_init_phase_luma_frac = (h_init_phase_luma & 0x7ffff) << 5;

	/* Chroma uses twice the luma ratio plus a fixed 1/4 offset */
	tmp_h_init_phase_chroma = wbscl_calc_init_phase(
		dc_fixpt_mul_int(tmp_h_ratio_luma, 2), h_taps_chroma);
	tmp_h_init_phase_chroma = dc_fixpt_add(tmp_h_init_phase_chroma,
		dc_fixpt_from_fraction(1, 4));
	h_init_phase_chroma = dc_fixpt_s4d19(tmp_h_init_phase_chroma);
	h_init_phase_chroma_int = (h_init_phase_chroma >> 19) & 0x1f;
	h_init_phase_chroma_frac = (h_init_phase_chroma & 0x7ffff) << 5;

	/* Program phase*/
	REG_UPDATE(WBSCL_HORZ_FILTER_INIT_Y_RGB, WBSCL_H_INIT_INT_Y_RGB, h_init_phase_luma_int);
	REG_UPDATE(WBSCL_HORZ_FILTER_INIT_Y_RGB, WBSCL_H_INIT_FRAC_Y_RGB, h_init_phase_luma_frac);
	REG_UPDATE(WBSCL_HORZ_FILTER_INIT_CBCR, WBSCL_H_INIT_INT_CBCR, h_init_phase_chroma_int);
	REG_UPDATE(WBSCL_HORZ_FILTER_INIT_CBCR, WBSCL_H_INIT_FRAC_CBCR, h_init_phase_chroma_frac);

	/* Program LUT coefficients*/
	filter_h = wbscl_get_filter_coeffs_16p(
		h_taps_luma, tmp_h_ratio_luma);
	/*
	 * NOTE(review): the chroma lookup converts the register-encoded ratio
	 * with dc_fixpt_from_int() instead of using the fixed-point ratio
	 * (tmp_h_ratio_luma * 2). Behavior is kept as-is; confirm whether
	 * this is intended.
	 */
	filter_h_c = wbscl_get_filter_coeffs_16p(
		h_taps_chroma, dc_fixpt_from_int(h_ratio_chroma));

	wbscl_set_scaler_filter(dwbc20, h_taps_luma,
		WBSCL_COEF_LUMA_HORZ_FILTER, filter_h);

	wbscl_set_scaler_filter(dwbc20, h_taps_chroma,
		WBSCL_COEF_CHROMA_HORZ_FILTER, filter_h_c);

	return true;
}

/*
 * Program the vertical write-back scaler: scale ratio, tap counts,
 * initial luma/chroma phases and the coefficient RAM.
 *
 * @dwbc20:             write-back controller to program
 * @src_height:         source height
 * @dest_height:        destination height; must be non-zero
 * @num_taps:           tap configuration (v_taps and v_taps_c are used)
 * @subsample_position: when DWB_COSITED_SUBSAMPLING, 1/4 is added to the
 *                      initial chroma phase
 *
 * Returns false without touching hardware when @dest_height is 0 (the ratio
 * would divide by zero), true otherwise.
 */
bool dwb_program_vert_scalar(struct dcn20_dwbc *dwbc20,
	uint32_t src_height,
	uint32_t dest_height,
	struct scaling_taps num_taps,
	enum dwb_subsample_position subsample_position)
{
	uint32_t v_ratio_luma;
	uint32_t v_ratio_chroma;
	uint32_t v_taps_luma = num_taps.v_taps;
	uint32_t v_taps_chroma = num_taps.v_taps_c;
	int32_t v_init_phase_luma;
	int32_t v_init_phase_chroma;
	uint32_t v_init_phase_luma_int;
	uint32_t v_init_phase_luma_frac;
	uint32_t v_init_phase_chroma_int;
	uint32_t v_init_phase_chroma_frac;
	const uint16_t *filter_v;
	const uint16_t *filter_v_c;
	struct fixed31_32 tmp_v_init_phase_luma;
	struct fixed31_32 tmp_v_init_phase_chroma;
	struct fixed31_32 tmp_v_ratio_luma;

	if (dest_height == 0)
		return false;

	/*Calculate ratio*/
	tmp_v_ratio_luma = dc_fixpt_from_fraction(src_height, dest_height);

	/*
	 * An integer part of 8 is programmed as all ones; presumably because
	 * it does not fit the u3.19 encoding used otherwise.
	 */
	if (dc_fixpt_floor(tmp_v_ratio_luma) == 8)
		v_ratio_luma = -1;
	else
		v_ratio_luma = dc_fixpt_u3d19(tmp_v_ratio_luma) << 5;
	v_ratio_chroma = v_ratio_luma * 2;

	/*Program ratio*/
	REG_UPDATE(WBSCL_VERT_FILTER_SCALE_RATIO, WBSCL_V_SCALE_RATIO, v_ratio_luma);

	/* Program taps*/
	REG_UPDATE(WBSCL_TAP_CONTROL, WBSCL_V_NUM_OF_TAPS_Y_RGB, v_taps_luma - 1);
	REG_UPDATE(WBSCL_TAP_CONTROL, WBSCL_V_NUM_OF_TAPS_CBCR, v_taps_chroma - 1);

	/* Calculate phase*/
	tmp_v_init_phase_luma = wbscl_calc_init_phase(tmp_v_ratio_luma, v_taps_luma);
	v_init_phase_luma = dc_fixpt_s4d19(tmp_v_init_phase_luma);
	v_init_phase_luma_int = (v_init_phase_luma >> 19) & 0x1f;
	v_init_phase_luma_frac = (v_init_phase_luma & 0x7ffff) << 5;

	/* Chroma uses twice the luma ratio; cosited sampling adds 1/4 */
	tmp_v_init_phase_chroma = wbscl_calc_init_phase(
		dc_fixpt_mul_int(tmp_v_ratio_luma, 2), v_taps_chroma);
	if (subsample_position == DWB_COSITED_SUBSAMPLING)
		tmp_v_init_phase_chroma = dc_fixpt_add(tmp_v_init_phase_chroma,
			dc_fixpt_from_fraction(1, 4));
	v_init_phase_chroma = dc_fixpt_s4d19(tmp_v_init_phase_chroma);
	v_init_phase_chroma_int = (v_init_phase_chroma >> 19) & 0x1f;
	v_init_phase_chroma_frac = (v_init_phase_chroma & 0x7ffff) << 5;

	/* Program phase*/
	REG_UPDATE(WBSCL_VERT_FILTER_INIT_Y_RGB, WBSCL_V_INIT_INT_Y_RGB, v_init_phase_luma_int);
	REG_UPDATE(WBSCL_VERT_FILTER_INIT_Y_RGB, WBSCL_V_INIT_FRAC_Y_RGB, v_init_phase_luma_frac);
	REG_UPDATE(WBSCL_VERT_FILTER_INIT_CBCR, WBSCL_V_INIT_INT_CBCR, v_init_phase_chroma_int);
	REG_UPDATE(WBSCL_VERT_FILTER_INIT_CBCR, WBSCL_V_INIT_FRAC_CBCR, v_init_phase_chroma_frac);

	/* Program LUT coefficients*/
	filter_v = wbscl_get_filter_coeffs_16p(
		v_taps_luma, tmp_v_ratio_luma);
	/*
	 * NOTE(review): the chroma lookup converts the register-encoded ratio
	 * with dc_fixpt_from_int() instead of using the fixed-point ratio
	 * (tmp_v_ratio_luma * 2). Behavior is kept as-is; confirm whether
	 * this is intended.
	 */
	filter_v_c = wbscl_get_filter_coeffs_16p(
		v_taps_chroma, dc_fixpt_from_int(v_ratio_chroma));

	wbscl_set_scaler_filter(dwbc20, v_taps_luma,
		WBSCL_COEF_LUMA_VERT_FILTER, filter_v);

	wbscl_set_scaler_filter(dwbc20, v_taps_chroma,
		WBSCL_COEF_CHROMA_VERT_FILTER, filter_v_c);

	return true;
}