diff --git a/input.conf b/input.conf index d85103a..41da0e7 100644 --- a/input.conf +++ b/input.conf @@ -194,7 +194,8 @@ CTRL+2 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/NVScaler.glsl" CTRL+3 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/CAS-scaled.glsl"; show-text "CAS" CTRL+4 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/FSRCNNX.glsl"; show-text "FSRCNNX" CTRL+5 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/ArtCNN_C4F32.glsl"; show-text "ArtCNN" -CTRL+6 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/ArtCNN_C4F32.glsl:~/.config/mpv/shaders/FSRCNNX.glsl:~/.config/mpv/shaders/CAS-scaled.glsl:~/.config/mpv/shaders/NVScaler.glsl"; show-text "ALL" +CTRL+6 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/ArtCNN_C4F16_DS.glsl"; show-text "ArtCNN C4F16 DS" +CTRL+7 no-osd change-list glsl-shaders set "~/.config/mpv/shaders/ArtCNN_C4F16.glsl"; show-text "ArtCNN C4F16" CTRL+0 no-osd change-list glsl-shaders clr ""; show-text "GLSL shaders cleared" diff --git a/mpv.conf b/mpv.conf index 9a6ebcd..d9ef75c 100644 --- a/mpv.conf +++ b/mpv.conf @@ -14,7 +14,8 @@ volume=75 audio-spdif=ac3,eac3,dts-hd,truehd # glsl-shaders="~~/shaders/Anime4K_Clamp_Highlights.glsl:~~/shaders/Anime4K_Restore_CNN_VL.glsl:~~/shaders/Anime4K_Upscale_CNN_x2_VL.glsl:~~/shaders/Anime4K_AutoDownscalePre_x2.glsl:~~/shaders/Anime4K_AutoDownscalePre_x4.glsl:~~/shaders/Anime4K_Upscale_CNN_x2_M.glsl" # glsl-shaders="~~/shaders/FSRCNNX.glsl:~~/shaders/FSR.glsl:~~/shaders/NVScaler.glsl:~~/shaders/CAS-scaled.glsl" -glsl-shaders="~~/shaders/ArtCNN_C4F32.glsl:~~/shaders/FSRCNNX.glsl:~~/shaders/CAS-scaled.glsl" +# glsl-shaders="~~/shaders/ArtCNN_C4F32_DS.glsl" +glsl-shaders="~~/shaders/ArtCNN_C4F32.glsl" # Can fix stuttering in some cases, in other cases probably causes it. Try it if you experience stuttering. 
opengl-early-flush=no @@ -31,19 +32,34 @@ sub-auto=fuzzy slang=en,eng # profile=svp -profile=gpu-hq +profile=high-quality blend-subtitles=video # GPU OPTIONS vo=gpu-next hwdec=nvdec-copy gpu-api=vulkan -scale=bicubic -dscale=bicubic +# scale=bicubic +# scale=ewa_lanczos +# scale-blur=0.981251 +# dscale=bicubic +dscale=catmull_rom cscale=bicubic tscale=oversample interpolation=yes interpolation-preserve=no +# fruit: 8-Bit/8-Bit+FRC display +# ordered: true 10-Bit/12-Bit display +# error-diffusion: high-end GPUs +dither=error-diffusion +dither-depth=auto +error-diffusion=sierra-lite # kernel choice; only used when dither=error-diffusion + +###### Antiring +scale-antiring=0.5 +dscale-antiring=0.5 +cscale-antiring=0.5 + # laptop # vo=gpu # gpu-api=opengl @@ -55,11 +71,11 @@ input-ipc-server=/tmp/mpvsocket # ao=pule,pipewire ao=pipewire,pulse -deband=no -deband-iterations=2 -deband-threshold=64 -deband-range=20 -deband-grain=64 +deband=yes +deband-iterations=4 +deband-threshold=35 +deband-range=16 +deband-grain=4 subs-with-matching-audio=no sub-fix-timing=yes @@ -68,6 +84,14 @@ sub-ass-override=scale sub-gauss=1.0 sub-gray=yes +###### High-quality screenshots +screenshot-format=webp +screenshot-webp-lossless=yes +screenshot-high-bit-depth=yes +screenshot-sw=no +screenshot-directory="/truenas/sudacode/pictures/mpv" +screenshot-template="%f-%wH.%wM.%wS.%wT-#%#00n" + [hdr] target-colorspace-hint=yes gpu-api=vulkan @@ -98,3 +122,6 @@ slang=ja,jpn,JA,JPN alang=ja,jpn vlang=ja,jpn sub-font="Noto Sans CJK JP" +sub-border-size=1 +sub-shadow-color=0.0/0.0/0.0/0.50 +sub-shadow-offset=2 diff --git a/shaders/ArtCNN_C4F16.glsl b/shaders/ArtCNN_C4F16.glsl new file mode 100644 index 0000000..4086dce --- /dev/null +++ b/shaders/ArtCNN_C4F16.glsl @@ -0,0 +1,1407 @@ +// MIT License + +// Copyright (c) 2024 Joao Chrisostomo, Kacper Michajłow + +// Permission is hereby granted, free of charge, to any person obtaining a copy +// of this software and associated documentation files (the "Software"), to deal 
+// in the Software without restriction, including without limitation the rights +// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +// copies of the Software, and to permit persons to whom the Software is +// furnished to do so, subject to the following conditions: + +// The above copyright notice and this permission notice shall be included in all +// copies or substantial portions of the Software. + +// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +// SOFTWARE. + +//!DESC ArtCNN C4F16 (Conv2D) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND LUMA +//!SAVE conv2d +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared F inp[1][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(1, 1); + inp[0][y][x] = F(LUMA_mul * texelFetch(LUMA_raw, input_base + ivec2(0, 0), 0).x); + } + } + + 
barrier(); + V4 result0 = V4(-0.0027198044, -0.013629392, -0.015712878, -0.050803013); + V4 result1 = V4(-0.02707489, -0.0062177293, 0.0026368732, -0.0029379292); + V4 result2 = V4(0.03127001, -0.0039273943, -0.0040966137, -0.0016518718); + V4 result3 = V4(0.0028380281, 0.00058883557, 0.013085538, -0.058857743); + const F inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const F inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const F inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const F inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const F inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const F inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const F inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const F inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const F inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += V4(-0.016452063, -0.1258466, 0.013886958, 0.036870774) * inp_0_0_0; + result0 += V4(0.04311634, 0.15515013, 0.12190506, 0.12543218) * inp_0_1_0; + result0 += V4(-0.0049624983, 0.1029244, -0.10124424, 0.06448426) * inp_0_2_0; + result0 += V4(0.001886782, 0.06120591, 0.020384936, 0.16804346) * inp_0_0_1; + result0 += V4(-0.04256893, -0.07616671, -0.37889892, 0.27856478) * inp_0_1_1; + result0 += V4(-0.20398517, -0.12900643, 0.113083735, 0.11175711) * inp_0_2_1; + result0 += V4(0.009553091, 0.13118562, -0.031063978, 0.09478131) * inp_0_0_2; + result0 += V4(0.066157505, -0.114692695, 0.22418123, -0.009412468) * inp_0_1_2; + result0 += V4(0.15508306, 0.011386595, 0.014014352, 0.09318008) * inp_0_2_2; + result1 += V4(0.08046117, -0.07086712, -0.102300294, 0.014950261) * inp_0_0_0; + result1 += V4(-0.06476857, -0.014190924, -0.017589286, -0.19119741) * inp_0_1_0; + result1 += V4(0.05054515, 0.115604624, 0.06517106, 0.13799176) * inp_0_2_0; + result1 += V4(-0.045681432, 0.08269155, 0.10319298, -0.026858954) * inp_0_0_1; + result1 += V4(0.11229104, -0.17059296, 0.13794285, 0.18026339) * inp_0_1_1; + 
result1 += V4(-0.1267971, 0.23877597, -0.18725446, -0.12132741) * inp_0_2_1; + result1 += V4(0.05785694, -0.015154775, 0.026422592, 0.002328838) * inp_0_0_2; + result1 += V4(0.07150728, -0.22784448, -0.12155527, 0.027110105) * inp_0_1_2; + result1 += V4(-0.08247087, 0.06362491, 0.08973536, -0.02196324) * inp_0_2_2; + result2 += V4(-0.06092033, 0.1256232, -0.11233013, -0.061837807) * inp_0_0_0; + result2 += V4(0.08898802, -0.028417582, 0.15791786, -0.01610648) * inp_0_1_0; + result2 += V4(0.06330266, -0.009340407, 0.017859828, -0.007937439) * inp_0_2_0; + result2 += V4(-0.17722517, 0.31189576, 0.32109433, 0.18112311) * inp_0_0_1; + result2 += V4(-0.2903746, -0.72364086, -0.3329427, -0.08360631) * inp_0_1_1; + result2 += V4(0.14228302, 0.11720193, -0.056604996, -0.027815754) * inp_0_2_1; + result2 += V4(0.035853237, 0.118430145, -0.12544365, -0.02719196) * inp_0_0_2; + result2 += V4(0.20537417, 0.07353585, 0.10881828, 0.1451791) * inp_0_1_2; + result2 += V4(-0.1517126, -0.010349405, 0.018765846, -0.09707698) * inp_0_2_2; + result3 += V4(0.052764144, -0.10130216, 0.22795214, -0.09385554) * inp_0_0_0; + result3 += V4(-0.16102873, 0.18050277, 0.36273104, 0.1743911) * inp_0_1_0; + result3 += V4(0.008320275, -0.031096114, 0.06665433, 0.047147725) * inp_0_2_0; + result3 += V4(0.039706435, -0.0059984834, 0.026533028, -0.19475575) * inp_0_0_1; + result3 += V4(0.017116806, -0.1657458, -0.4245533, 0.011194904) * inp_0_1_1; + result3 += V4(0.03566397, 0.1254953, -0.16895337, 0.20406392) * inp_0_2_1; + result3 += V4(-0.0622524, 0.11329407, -0.052762877, -0.081980705) * inp_0_0_2; + result3 += V4(0.08946176, -0.05226282, -0.15308078, -0.0015630769) * inp_0_1_2; + result3 += V4(-0.018317576, -0.06487258, -0.012865839, 0.13352033) * inp_0_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(0, 
1), result2); + imageStore(out_image, output_base + ivec2(1, 1), result3); +} + +//!DESC ArtCNN C4F16 (Conv2D-1-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d +//!SAVE conv2d_1 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.0035388642, 0.012181487, 0.06403471, 0.015263772); + V4 result1 = V4(0.048399653, -0.0074684187, -0.0068150507, 0.016319986); + V4 result2 = V4(0.015551343, 0.028928788, 0.0074838563, 0.012831508); + V4 result3 = V4(0.015546932, 0.0018076884, 0.003934822, -0.027352111); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 
inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.08193566, 0.39840552, -0.05933193, 0.029763913, 0.120781906, 0.13874644, 0.06285476, -0.031514462, -0.33653876, 0.23761259, -0.07119319, -0.08926567, 0.00014508692, -0.062654756, -0.13101529, 0.029373677) * inp_0_0_0; + result0 += M4(-0.2686895, 0.10908275, 0.024864523, 0.028138349, 0.63595426, 0.20497061, -0.0053157317, 0.09559526, -0.6010695, -0.52804697, -0.08165241, -0.07418531, -0.36249816, 0.09965129, 0.043142296, 0.11102198) * inp_0_1_0; + result0 += M4(0.32003805, -0.06369186, 0.110159315, -0.010411652, 0.14303263, -0.18286166, 0.17141442, -0.0774708, -0.2750923, 0.048123654, -0.042993017, 0.055669174, -0.08664134, -0.014772742, -0.09638268, -0.060853086) * inp_0_2_0; + result0 += M4(-0.18638985, -0.10025375, -0.01221694, -0.18347955, -0.22381034, -0.15570909, 0.22322272, -0.18700717, 0.23769893, 0.14806393, -0.008849564, 0.0136317285, 0.03139464, 0.08378959, -0.012119499, 0.026419694) * inp_0_0_1; + result0 += M4(-0.09444148, -0.16680825, -0.04191063, -0.11433058, -0.46190983, 0.24968515, 0.09260946, -0.039239544, -0.48942524, 0.65290695, 0.026454417, -0.3996515, 0.035578046, 0.03752698, 0.11413368, 0.12726994) * inp_0_1_1; + result0 += M4(-0.3939464, 0.011404807, -0.08643197, -0.07001899, -0.4240259, -0.11423647, -0.06039618, -0.045650464, 0.18176849, 0.118614994, 0.07916771, -0.14000084, -0.04808409, 0.06989854, 0.06425597, 0.038330052) * inp_0_2_1; + result0 += M4(0.088639356, 0.063344724, -0.0034504097, 0.2238218, -0.07661125, -0.10738507, -0.0092966715, 0.3010383, 0.31496724, -0.1979007, 0.05447602, -0.10734698, -0.053885452, -0.05719943, -0.113555916, -0.021155154) * inp_0_0_2; + result0 += M4(0.015520851, 0.026369756, -0.04167262, 
0.141523, 0.073253386, 0.084800765, -0.0676251, 0.5053454, 0.28553674, -0.15500426, -0.24915896, 0.9031177, -0.0045735966, -0.039383005, -0.060552903, 0.024590101) * inp_0_1_2; + result0 += M4(-0.21189246, -0.050623517, 0.013824571, 0.054410357, 0.18887533, -0.2435286, -0.11421549, -0.16462444, 0.0728174, -0.09657451, 0.07730208, -0.07939918, 0.034992587, -0.07169108, 0.04370187, -0.0785741) * inp_0_2_2; + result1 += M4(-0.08724563, -0.029360695, 0.065424606, 0.18016396, -0.066029646, 0.009851433, 0.044099204, 0.062524706, 0.075378865, -0.04025694, -0.00035143772, 0.02216928, 0.07692978, -0.07277084, -0.061999667, -0.12335496) * inp_0_0_0; + result1 += M4(0.15146391, -0.045693725, 0.08794338, -0.07766357, -0.13882384, 0.11807377, 0.16390486, 0.060984742, -0.050909836, 0.011076402, -0.0069654104, -0.008235624, 0.13997374, -0.055829335, -0.11395829, -0.045706417) * inp_0_1_0; + result1 += M4(0.11037505, 0.037779838, 0.041720603, -0.11670487, -0.10206224, 0.29574063, -0.017590221, -0.029810347, 0.08654991, 0.11194881, -0.09588386, 0.11034557, -0.11284499, -0.038090393, -0.060732067, 0.15201814) * inp_0_2_0; + result1 += M4(-0.02798946, 0.2645396, -0.05080384, 0.39022708, -0.07972038, -0.03486675, 0.1624059, 0.1826741, -0.0305445, 0.3158071, 0.0032137304, 0.06960887, 0.061508473, -0.060662374, -0.03728802, -0.10974534) * inp_0_0_1; + result1 += M4(0.13413881, -0.19690159, 0.25165883, -0.025285713, 0.19857527, -0.2321096, -0.056400586, -0.11435613, -0.1891792, 0.15364274, 0.95750797, -0.031228404, 0.17185828, 0.072887875, -0.11088333, -0.08581528) * inp_0_1_1; + result1 += M4(0.09028881, -0.1780539, -0.04785461, -0.09430586, -0.044199556, -0.17495096, 0.2255327, -0.04418362, 0.42351684, -0.17086548, 0.108544886, 0.063870065, -0.20677198, 0.0918337, -0.031405777, 0.026987633) * inp_0_2_1; + result1 += M4(0.03143219, -0.06746378, -0.077566706, -0.19247384, 0.16452655, -0.5051362, -0.16162011, -0.08145442, 0.05511902, 0.030584775, -0.071060166, 0.25326735, -0.016743116, 
-0.0618647, 0.1214063, -0.04310255) * inp_0_0_2; + result1 += M4(0.13270794, -0.12859413, -0.13721833, -0.011795724, 0.11956431, 0.026687238, -0.52203315, -0.317287, -0.012819699, -0.45424682, -0.681156, -0.18422177, 0.07963337, 0.04038403, 0.086956374, 0.0706985) * inp_0_1_2; + result1 += M4(0.2106671, -0.09430158, -0.077296756, 0.001207568, -0.019188594, -0.011531864, -0.046601746, -0.057146672, 0.0503799, -0.118843146, -0.124916956, -0.08522102, -0.14284284, -0.1193746, 0.06719082, 0.09910482) * inp_0_2_2; + result2 += M4(-0.2244822, -0.082729764, -0.44512755, -0.77702785, 0.070779085, -0.06795795, 0.048184644, -0.41027415, -0.21277706, -0.20790118, 0.36475337, -0.31860444, 0.014606301, -0.08359864, 0.03596085, 0.0350377) * inp_0_0_0; + result2 += M4(0.09447366, 0.12554698, 0.052572437, 0.004993876, 0.015338761, 0.008580391, 0.024699932, -0.18695894, 0.12486596, 0.16261359, 0.05223534, -0.49886906, 0.058645505, 0.11000217, -0.052211735, -0.10267668) * inp_0_1_0; + result2 += M4(0.09253685, 0.32692894, -0.11326509, -0.2243793, 0.055343658, 0.062875904, 0.1316403, -0.37698555, -0.06615555, 0.2947396, -0.30346048, -0.20655632, -0.052567784, -0.17170146, -0.10338503, -0.028746855) * inp_0_2_0; + result2 += M4(-0.12259729, -0.119727425, 0.593932, -0.10741678, -0.0150476275, -0.15803762, 0.43156016, -0.09719216, -0.07408, -0.12842028, -0.47880188, 0.41297135, 0.07315841, 0.08734928, -0.031542793, 0.0862864) * inp_0_0_1; + result2 += M4(-0.14790195, 0.028560948, 0.14077131, 0.15227696, -0.11203044, 0.1193981, 0.16548304, 0.07721256, -0.48270524, -0.14609018, 0.13051052, 0.16035795, 0.22310275, 0.08613812, 0.12101891, 0.0693605) * inp_0_1_1; + result2 += M4(-0.17909749, -0.024392027, 0.2227383, -0.057302292, -0.05009124, 0.30629346, -0.0658257, 0.10691373, -0.09005195, 0.26912916, -0.02555377, 0.18611579, 0.09474404, -0.046735127, 0.08628372, 0.14976539) * inp_0_2_1; + result2 += M4(-0.12682188, -0.033667836, -0.21387348, 0.11724357, 0.11241762, -0.10776379, 
-0.45622072, 0.36206225, 0.034357004, 0.0274606, 0.53226703, -0.054120746, -0.07173099, -0.019781826, -0.0004506044, -0.090236515) * inp_0_0_2; + result2 += M4(0.10396443, -0.05090273, 0.030880392, 0.13643251, 0.4523865, 0.081858695, -0.08280347, 0.18518096, 0.56079537, 0.007042201, -0.012337641, 0.0017952896, -0.19653215, 0.10902694, -0.0235898, -0.15462936) * inp_0_1_2; + result2 += M4(0.011347261, 0.16956125, -0.07598024, -0.010642945, -0.06959051, 0.097124174, -0.10528735, 0.023413276, 0.011072511, -0.11380183, -0.1546189, -0.018206634, -0.072076365, -0.09334556, -0.03711523, -0.061668754) * inp_0_2_2; + result3 += M4(0.20372537, 0.14578828, 0.20127167, -0.16066748, 0.09756872, -0.10025203, 0.18399055, 0.057970647, 0.03679455, -0.13061528, -0.13194819, -0.017791305, -0.027707439, -0.037850592, -0.0058791186, 0.15898317) * inp_0_0_0; + result3 += M4(-0.13326374, -0.048175838, -0.1211976, -0.047573894, 0.029398272, 0.038163513, 0.06364081, 0.09756068, 0.112353444, -0.06523655, -0.3399193, 0.007071915, -0.0023307495, 0.06515439, -0.008210844, -0.048217848) * inp_0_1_0; + result3 += M4(-0.21247563, 0.08523739, 0.04721741, 0.06442855, -0.051469017, -0.092593156, 0.047065668, 0.02163933, -0.20487121, -0.2948929, 0.14564759, 0.072847456, 0.009143655, 0.061654102, -0.008843048, -0.095890515) * inp_0_2_0; + result3 += M4(0.22976227, -0.0034405778, -0.33477315, 0.12545134, 0.17131741, -0.11558586, 0.03167751, 0.14242904, 0.1061916, -0.18220623, 0.07726241, -0.48172006, -0.14746118, -0.11912247, 0.030638449, 0.10207886) * inp_0_0_1; + result3 += M4(-0.06655945, -0.019838296, -0.038446557, -0.047108516, -0.30915856, 0.07429464, -0.20438327, 0.14802341, 0.47137445, 0.024445575, 0.42510328, 0.242163, -0.021400312, 0.107167594, -0.056022163, 0.020425789) * inp_0_1_1; + result3 += M4(-0.0074782637, 0.054402016, -0.121972315, 0.041444067, -0.35059676, -0.15080321, -0.29118222, -0.016145391, -0.3576716, -0.3522069, 0.043113176, 0.010357731, 0.14414723, -0.113717005, -0.09415485, 
-0.028949017) * inp_0_2_1; + result3 += M4(0.03853427, 0.03176998, -0.07919849, 0.018467484, 0.03600878, 0.56193393, 0.13832507, 0.07699603, -0.15650001, -0.07601528, 0.16394944, -0.026312442, -0.07145015, -0.036025092, -0.04234946, 0.041831832) * inp_0_0_2; + result3 += M4(-0.016900353, -0.28659436, 0.011943033, -0.07257182, 0.014030349, 0.035322875, -0.5988642, -0.14678574, -0.0044690417, 0.8888096, -0.23830332, 0.10747964, 0.02044547, 0.1279399, 0.0006579104, -0.011562968) * inp_0_1_2; + result3 += M4(-0.089198224, 0.16423313, -0.29691276, 0.07104331, 0.13190354, 0.0776772, 0.08241301, -0.14865209, -0.08948346, 0.1620836, -0.32379845, 0.0013747211, 0.04707559, 0.0037285136, -0.015344385, -0.014232466) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.85313725, -0.02435101, -0.06857936, 0.04679383, -0.2585699, 0.081624314, 0.24544875, -0.027587967, -0.7746935, 0.5622293, -0.09342312, -0.03688094, -0.34380323, 0.72687024, -0.048763245, -0.003689941) * inp_1_0_0; + result0 += M4(-0.35174468, 0.117986694, 0.08605906, 0.028830849, 0.64237136, -0.3769583, -0.024089484, -0.23862994, 0.8207976, -0.092174746, 0.04297148, -0.051756054, -0.29739568, -0.11195339, -0.14723086, 0.03295132) * inp_1_1_0; + result0 += M4(0.2954745, 0.21712531, -0.067807004, 0.029517183, 0.16259618, 0.014441043, 0.0127598, 0.029936556, -0.4073981, -0.48001292, 0.10198077, 0.17044066, 0.058579385, -0.16940872, -0.22117646, 0.0061707636) * inp_1_2_0; + result0 
+= M4(-0.37001958, -0.071665555, 0.10686925, -0.10744776, -0.11030434, -0.016945168, -0.14443113, 0.039766748, -0.041175894, -0.31643036, -0.009723037, 0.11083293, -0.35056636, 0.50091743, 0.21538898, 0.13894936) * inp_1_0_1; + result0 += M4(0.18551482, -0.38274184, 0.1090545, 0.09133414, -0.100317314, 0.26533842, 0.028536757, 0.07844555, 0.006583591, 0.27766275, 0.1254183, -0.0061147013, 0.8617392, -0.7546585, -0.23212102, 0.2814898) * inp_1_1_1; + result0 += M4(-0.17533015, 0.056518923, -0.11886858, -0.17416163, -0.21810603, -0.041996296, -0.13190891, 0.10978519, -0.13276191, 0.29193908, -0.10255887, -0.15144268, 0.39411002, 0.5364633, -0.07876772, 0.12273716) * inp_1_2_1; + result0 += M4(0.025226103, 0.14986138, -0.05295039, 0.12537077, 0.10823799, -0.15962936, -0.04351816, 0.06994498, 0.3133468, 0.14449136, -0.20122978, -0.04178362, -0.025069045, 0.052850995, -0.31893167, 0.31568733) * inp_1_0_2; + result0 += M4(0.10307432, -0.03794696, 0.11638587, -0.15721007, 0.0520565, -0.013159431, 0.0033045416, 0.16645943, -0.04602354, 0.07579619, 0.119559675, 0.10222658, -0.076188296, -0.03417925, 0.35578036, -0.90802264) * inp_1_1_2; + result0 += M4(-0.13523121, 0.14683475, -0.24159884, 0.011003018, 0.15668543, -0.012923501, -0.049195066, -0.15511718, 0.21970461, -0.40896636, 0.14699629, -0.10037102, -0.011684425, -0.44974482, 0.075924896, -0.13819264) * inp_1_2_2; + result1 += M4(-0.32133275, -0.1632966, 0.016118964, -0.004102593, 0.32084933, 0.41906273, 0.08610651, 0.17084497, 0.13008702, 0.09139067, 0.21345861, -0.12968206, 0.008954712, -0.07455759, -0.25342295, -0.13596231) * inp_1_0_0; + result1 += M4(0.110927545, 0.026440676, -0.057138063, -0.026707454, -0.23099862, 0.10929439, 0.18417938, -0.08928301, 0.10867742, -0.062411074, 0.17694812, 0.27520618, 0.14665566, -0.19123065, -0.0028814063, 0.020384334) * inp_1_1_0; + result1 += M4(0.13942137, 0.0722548, 0.085695975, -0.0482584, -0.058018155, -0.06788848, 0.12553318, -0.017362285, -0.28463066, 0.2797977, 
-0.1744807, 0.07061992, 0.19873491, -0.16651899, -0.06323969, -0.02578639) * inp_1_2_0; + result1 += M4(-0.025543625, -0.61818314, 0.05540194, -0.36864513, 0.13506746, 0.45087427, 0.02561734, 0.4824854, -0.12235725, -0.13946341, -0.06030317, 0.14183283, -0.25570124, -0.47644913, -0.019941723, -0.45477942) * inp_1_0_1; + result1 += M4(0.3645578, 0.068593346, -0.1665043, 0.16704038, -0.2967851, 0.026300274, -0.13397226, -0.32232535, 0.13193616, -0.22311744, -0.41460353, -0.28414023, 0.4073843, 0.07373801, -0.22364068, 0.12431164) * inp_1_1_1; + result1 += M4(0.25017032, 0.070454225, 0.13813335, 0.019375844, -0.096448295, 0.072787635, 0.0041182754, -0.15815192, -0.2322587, -0.19746271, 0.13508892, 0.14120723, 0.11005683, 0.08688148, -0.15526778, -0.075340524) * inp_1_2_1; + result1 += M4(-0.14920484, -0.48791856, -0.023223, -0.3027848, 0.3378221, 0.4793663, -0.14946601, 0.9567044, -0.18527344, -0.119982645, -0.08596696, -0.17026097, 0.23330817, 0.036837753, -0.08102003, 0.29802063) * inp_1_0_2; + result1 += M4(0.10104728, 0.017842278, 0.20009801, 0.2362712, -0.16312838, -0.04045318, -0.3592395, -0.20366094, 0.2688829, 0.30382335, 0.08821922, -0.27768466, -0.07204707, 0.67338127, 0.9684179, 0.26206905) * inp_1_1_2; + result1 += M4(0.20085827, -0.1115579, -0.20676771, -0.14104019, -0.25027877, 0.13877366, -0.032097857, 0.011562554, -0.06354945, 0.1315248, 0.17668413, 0.061860748, -0.24132724, -0.11776977, 0.18664834, 0.05808953) * inp_1_2_2; + result2 += M4(-0.072219275, 0.024704212, 0.6167852, -0.5133586, 0.23397118, 0.12476223, -0.24312721, 0.7445347, -0.19348057, -0.09359127, -0.8927323, -0.27338013, -0.08031656, -0.08860313, 0.32231623, -0.64860487) * inp_1_0_0; + result2 += M4(-0.045371484, 0.12290978, 0.19355193, -0.03915953, -0.10403266, -0.26496485, 0.008814081, -0.16285874, -0.18879507, 0.1972924, 0.12899448, 0.15576236, -0.21710408, -0.008091758, 0.0434765, -0.1066743) * inp_1_1_0; + result2 += M4(-0.002016541, -0.0006886421, 0.33393008, -0.039007384, 
0.020184148, -0.0028074265, 0.13437714, 0.09344798, 0.20083073, -0.29304448, -0.07516481, 0.16750409, 0.067934446, 0.062371586, -0.09625756, 0.63305384) * inp_1_2_0; + result2 += M4(-0.38875118, -0.0530316, -0.2627638, -0.37096834, 0.28227875, 0.057058726, -0.0007648176, 0.50170916, -0.014582225, -0.08303465, 1.2882401, -0.14439599, -0.5612461, -0.12507576, 0.7443172, 0.2275837) * inp_1_0_1; + result2 += M4(-0.06241773, 0.23984735, -0.38247794, -0.193146, -0.023529753, -0.26548344, -0.0008831312, 0.054739162, 0.50808966, 0.04970531, 0.28555724, -0.07511468, 0.21564315, 0.14087324, -0.31117678, -0.52685535) * inp_1_1_1; + result2 += M4(-0.067698725, -0.12012657, -0.18702506, 0.012525038, 0.11423368, 0.19669291, 0.0687259, -0.08449188, 0.114131555, 0.08787378, 0.027727695, -0.08600934, -0.1309175, 0.026612828, -0.078773305, 0.4300998) * inp_1_2_1; + result2 += M4(-0.07888591, -0.19316435, 0.07030573, -0.23898849, 0.30641487, -0.050587706, -0.067026295, 0.50440204, -0.080069296, -0.09858528, -1.2006693, 0.22419576, 0.69720376, -0.4077811, -0.82145584, -0.3318518) * inp_1_0_2; + result2 += M4(0.253429, 0.034562856, -0.043068126, 0.15730365, 0.18888126, -0.21013, -0.13781698, 0.21707365, -0.19726713, 0.027488727, 0.18039607, 0.11479809, -0.41453183, 0.31391656, 0.0070650936, 0.076380774) * inp_1_1_2; + result2 += M4(0.003429857, -0.018602068, -0.066684365, 0.11482386, -0.036528666, -0.029451601, -0.052084677, -0.035276096, -0.18110622, 0.20486076, 0.20484242, -0.0025528024, -0.19367853, 0.24121977, 0.025350042, 0.10913147) * inp_1_2_2; + result3 += M4(-0.0023735664, 0.15035935, 0.12993571, 0.20475487, 0.0019596012, -0.09204715, -0.13434508, -0.2821397, -0.05906947, 0.21287656, 0.30251858, -0.05017008, 0.03126201, 0.002017435, -0.50526565, 0.17320465) * inp_1_0_0; + result3 += M4(0.099262066, 0.12742217, -0.16422229, 0.03186198, 0.12362506, -0.14565836, -0.01895703, 0.17308953, 0.18997124, -0.008680871, 0.5007363, -0.06796606, 0.11387236, 0.0110532595, 0.027245427, 
-0.02858506) * inp_1_1_0; + result3 += M4(-0.1043227, -0.009697204, -0.14678726, 0.025163496, -0.195235, -0.03975564, 0.020124005, 0.036363356, 0.2044253, -0.08100828, -0.18540438, 0.024970459, -0.06662393, -0.24664907, 0.1844767, 0.039760955) * inp_1_2_0; + result3 += M4(0.03556496, 0.40731633, -0.009378648, 0.35368907, 0.054531943, -0.25538638, 0.23750697, -0.7583463, 0.19742353, -0.098816276, -0.41828468, 0.54874414, -0.07079365, 0.020870816, -0.64631456, 0.61903435) * inp_1_0_1; + result3 += M4(-0.3990005, 0.00885162, -0.3252981, -0.072892606, 0.5868726, 0.062424455, 0.12871675, 0.32273144, -0.5357227, 0.08173042, -0.20361531, -0.15989196, -0.7643352, -0.024472103, -0.46516174, -0.58503497) * inp_1_1_1; + result3 += M4(0.1232718, 0.06953096, 0.17959209, 0.023106743, -0.18714033, -0.09933013, -0.032718066, 0.070490085, 0.00089770433, -0.053541496, -0.09406766, -0.0057063233, 0.38167843, -0.14396475, 0.5196705, -0.16198893) * inp_1_2_1; + result3 += M4(0.0140656475, 0.21922494, -0.056840483, -0.07001231, -0.120163955, -0.22476105, 0.072396405, -0.06738373, -0.09434732, 0.123775706, 0.09688478, -0.159715, 0.0009263281, 0.38566205, 0.1203647, -0.082159035) * inp_1_0_2; + result3 += M4(-0.058063142, -0.13751893, -0.012188545, -0.10500652, 0.17686076, 0.042373944, -0.23056524, 0.10845812, -0.019570937, -0.19659866, -0.14402579, -0.13492614, 0.26653746, -0.038438268, 0.6654084, 0.13422534) * inp_1_1_2; + result3 += M4(0.051074985, 0.01658446, 0.27970675, 0.06717866, -0.029654497, -0.041104205, -0.031459272, 0.02453557, 0.14207277, 0.118784904, 0.08530623, 0.045611463, -0.036815416, 0.44440648, 0.41889176, 0.040619373) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = 
inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.041046668, -0.08714282, -0.073594816, 0.010970952, -0.1882758, 0.27579176, 0.03536449, -0.08542214, 0.3048594, 0.4530526, 0.0013206154, -0.028139513, 0.8478168, 0.23004742, 0.0076424624, -0.005963699) * inp_2_0_0; + result0 += M4(-0.675687, -0.18131071, -0.11496222, 0.04182087, -0.031031555, -0.46466836, -0.06559829, -0.03957504, 0.044670437, -0.38225058, 0.06304581, 0.040416148, -1.1025981, -0.18210213, 0.047893796, 0.09789689) * inp_2_1_0; + result0 += M4(-0.25182498, 0.11422446, 0.11699884, 0.001959186, -0.18557777, 0.25785574, 0.025503788, -0.026508162, -0.70701927, -0.19959773, -0.16261607, 0.044826515, 0.4344687, 0.07016805, 0.06883519, 0.01511665) * inp_2_2_0; + result0 += M4(0.066674605, 0.19236362, -0.0785282, -0.05095323, 0.18426083, -0.029129753, -0.10607958, -0.026322767, 0.08938068, -0.46208933, 0.15560026, -0.15441328, -0.20653039, -0.031048529, 0.18270804, -0.052175336) * inp_2_0_1; + result0 += M4(-0.17021075, 0.44645318, 0.064337924, -0.35476676, -0.06049966, 0.14457396, 0.23315272, -0.61046785, -0.16183764, 0.7003692, 0.15736891, -0.4137998, 0.23982742, 0.24342622, -0.20881954, -0.21306111) * inp_2_1_1; + result0 += M4(-0.12433247, 0.17513616, 0.088211484, -0.034301586, 0.17206079, -0.12319476, -0.0711395, -0.09247507, 0.017651413, -0.17906149, -0.119941995, 0.22451276, -0.047592435, 0.09213579, -0.062360976, -0.013997644) * inp_2_2_1; + result0 += M4(0.18996708, 0.01084998, -0.26635185, 0.122841895, 0.010606524, -0.027477054, 0.019549975, 0.03288411, -0.012691764, 0.051538102, -0.046197236, 0.06947832, -0.11301016, 0.09755053, -0.07446157, 0.1486752) * inp_2_0_2; + result0 += M4(-0.36824858, 0.05843571, -0.2618618, 0.7284761, -0.21758777, 0.15616763, 0.1021092, 0.39711222, 0.033237204, 0.023642745, 
-0.21918292, 0.5568767, 0.13701046, -0.25721508, 0.082974575, 0.0041465224) * inp_2_1_2; + result0 += M4(0.09509355, -0.15123545, -0.034223463, -0.04543954, -0.079144716, 0.09071367, 0.09338266, 0.17455119, 0.1773881, -0.053871572, 0.037042413, -0.17526062, -0.070509546, -0.19783144, 0.011318544, -0.026450291) * inp_2_2_2; + result1 += M4(-0.061877683, -0.12305839, -0.20263477, -0.11488986, 0.24543491, 0.32654366, 0.10685588, 0.11506586, -0.10795856, 0.03018991, 0.059933174, 0.0853006, -0.20264159, -0.043828856, -0.20878649, 0.14681698) * inp_2_0_0; + result1 += M4(-0.099625036, 0.20434903, 0.07796133, 0.06736927, 0.07125978, 0.05099109, 0.22723898, -0.08742187, 0.11490085, -0.04678864, -0.13050777, -0.08809224, 0.10186953, 0.16114867, -0.1435795, -0.05920464) * inp_2_1_0; + result1 += M4(0.07486631, 0.0044751903, -0.093036935, 0.027565863, -0.07470142, 0.17695644, -0.07382289, -0.044591907, -0.21034206, -0.25844106, 0.18035167, 0.059543654, -0.06836321, -0.14411914, 0.1548659, -0.03892513) * inp_2_2_0; + result1 += M4(0.117224984, 0.17542, -0.00016663033, -0.20314355, 0.22289772, 0.30088758, -0.032968026, -0.15414216, -0.140072, 0.14610891, 0.03125237, 0.3250524, 0.03702276, 0.10557298, 0.08998342, -0.43446854) * inp_2_0_1; + result1 += M4(-0.10302777, 0.4501756, 0.8351375, -0.017320178, -0.14834926, -0.13270089, 0.9023029, -0.0824228, 0.09006571, 0.11064118, 0.35334682, -0.30232978, 0.12792541, -0.0071462905, 0.4237898, 0.38528624) * inp_2_1_1; + result1 += M4(0.36576793, -0.050644517, 0.04195809, 0.108811006, -0.33933258, -0.048364114, 0.15662737, -0.09251479, -0.20477468, 0.2541265, 0.17623655, 0.20086327, -0.111452036, -0.09789033, -0.15870745, 0.027849512) * inp_2_2_1; + result1 += M4(0.20742778, -0.14416832, -0.13775797, 0.58929, 0.16418126, 0.49148947, -0.18096113, 0.68119305, -0.2531042, -0.17075492, -0.12018323, 0.12608007, 0.021732088, -0.37607798, 0.0010915091, 0.001743941) * inp_2_0_2; + result1 += M4(-0.15006953, -0.28072268, -0.44455764, 0.027220342, 
0.08871589, -0.19202746, -0.5691258, -0.22697172, 0.5984513, -0.021040866, -0.5640603, -0.69894254, 0.10230523, 0.37776676, -0.16448745, -0.34962857) * inp_2_1_2; + result1 += M4(0.28793243, -0.27053738, 0.037647776, 0.10638764, -0.29987827, -0.10918723, -0.15849937, 0.032926988, -0.276323, -0.30320406, -0.06410051, 0.079027995, -0.1144192, 0.0686072, 0.13253035, 0.16962466) * inp_2_2_2; + result2 += M4(-0.104575686, -0.04030638, 0.38205162, -0.1646444, 0.0070794793, 0.086107545, 0.09008801, -0.26022068, -0.08264631, 0.0025685597, 0.45367503, 0.036392443, -0.05385623, 0.0043640602, 0.88977754, -0.6094777) * inp_2_0_0; + result2 += M4(0.17220014, -0.104757294, 0.28872848, -0.9140526, 0.07250322, -0.03486389, 0.0519809, -0.28910607, 0.13334726, -0.18156597, -0.48792294, 0.45706385, 0.114385955, 0.06414442, -0.40856388, 0.26286653) * inp_2_1_0; + result2 += M4(0.06838794, 0.0037464432, -0.25175664, -0.10634569, -0.07736329, 0.04136653, -0.09635174, 0.042798392, -0.089459404, 0.1431562, -0.35529405, -0.58673966, -0.009117467, -0.08846847, -0.13101909, -0.0941622) * inp_2_2_0; + result2 += M4(0.014403663, -0.09284215, -0.22324999, 0.5977427, -0.13145088, 0.045327898, -0.2159109, 0.58904, -0.14557627, 0.047140498, 0.37750348, 0.04514063, -0.07165266, 0.00403441, -0.20610464, -0.22565311) * inp_2_0_1; + result2 += M4(-0.34951925, -0.20195192, 0.052249074, 0.004859058, -0.4837092, -0.56432015, -0.14240249, -0.089294374, -0.32763055, -0.6932184, 0.18841206, -0.10697703, -0.12905538, -0.012168624, 0.33363688, -0.23945247) * inp_2_1_1; + result2 += M4(-0.19418816, -0.07137613, 0.016112942, -0.06583376, 0.010781973, 0.64119726, 0.2163896, 0.053818654, 0.19992511, 1.0749966, 0.37210134, -0.114605546, 0.12615307, 0.045438178, -0.09376032, 0.095737554) * inp_2_2_1; + result2 += M4(0.1762724, -0.12271588, 0.32391888, 0.05773013, 0.24969184, 0.04550068, 0.14141926, 0.3324033, 0.10539948, -0.22236584, 0.063619636, 0.37273255, 0.17779888, -0.049786404, -0.2504475, 0.6257438) * 
inp_2_0_2; + result2 += M4(0.20685196, -0.0106152035, -0.16097048, -0.011148921, 0.29720846, -0.2017546, -0.055421192, 0.14278509, 0.4991777, 0.1290137, -0.6009226, 0.12703991, 0.019506518, -0.09236414, -0.16110387, 0.15518974) * inp_2_1_2; + result2 += M4(-0.051044676, -0.0802801, -0.16391027, -0.20129019, 0.07025838, -0.08146353, -0.13828063, 0.089377195, -0.26447552, -0.09614584, -0.004125906, -0.071870096, -0.24505717, 0.08601064, -0.007302386, 0.09454271) * inp_2_2_2; + result3 += M4(0.08847961, -0.17847943, -0.69526863, -0.10000524, 0.022599213, -0.106843226, -0.32798478, -0.30478817, 0.116008244, 0.037003428, 0.00491019, 0.012982513, 0.14008689, -0.12109373, -0.114603855, 0.044905365) * inp_2_0_0; + result3 += M4(0.17639944, -0.044862606, -0.17100137, -0.005114512, 0.2445843, -0.058113806, -0.18633145, 0.22324812, 0.07353126, -0.08040312, 0.46093383, -0.1881027, 0.020793755, 0.05615095, -0.12523803, -0.11003187) * inp_2_1_0; + result3 += M4(0.015362869, 0.11070844, 0.18635881, 0.049795542, -0.18239588, -0.06503216, -0.004792109, 0.09085003, -0.24347839, 0.0014260579, -0.35534698, -0.01901228, -0.11597512, -0.14712879, -0.15724897, 0.08272095) * inp_2_2_0; + result3 += M4(0.03369274, -0.09148342, -0.11649345, -0.8705563, 0.07332814, -0.07007546, -0.118292294, -0.5086767, -0.09837098, -0.086299285, 0.39339754, -0.34102294, -0.14108673, 0.3166342, -0.09888971, 0.17531094) * inp_2_0_1; + result3 += M4(0.44183612, 0.03237536, 0.17856692, 0.11106832, 0.45943972, -0.4042934, 0.42762074, 0.78249615, 0.49094617, 0.08979736, 0.63991433, 1.1504385, -0.19337255, -0.028499793, 0.0188026, 0.13573536) * inp_2_1_1; + result3 += M4(-0.07735287, -0.10227065, -0.11877216, 0.12290771, -0.8072676, 0.0721539, -0.1910864, -0.089940324, -0.9754005, 0.3272343, 0.04703304, -0.093180224, -0.30274558, 0.3410099, 0.17829552, -0.1283383) * inp_2_2_1; + result3 += M4(-0.014644263, -0.16843987, 0.10283902, -0.23915698, 0.04944409, -0.28421712, 0.029477706, -0.20114663, 0.04234802, 
-0.10247694, 0.08606297, -0.00060528243, 0.16025454, -0.113197796, 0.32325915, -0.09360282) * inp_2_0_2; + result3 += M4(0.15988652, 0.43129408, 0.003102661, 0.13530524, 0.20106629, 0.35276395, -0.2581822, 0.27712944, 0.092174165, 0.5860203, -0.6644479, -0.30149898, 0.28493616, 0.2263659, -0.103455596, -0.13312685) * inp_2_1_2; + result3 += M4(0.05288319, 0.076428, -0.18710244, -0.093296796, -0.21877469, -0.15173075, -0.16969322, 0.05675821, 0.34267446, -0.25818372, -0.3879385, 0.057327595, 0.05748257, -0.44461763, 0.24332774, 0.18331102) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.33035442, 0.008719723, 0.09506913, -0.05596779, 0.6257054, -0.4622823, 0.19758332, -0.009717658, 0.11556571, -0.008927558, 0.0506363, 0.011549255, 0.022223158, 0.16494507, -0.023656936, -0.012043801) * inp_3_0_0; + result0 += M4(-0.3018259, -0.16688901, -0.08174471, 0.031225208, -0.3682067, 0.33880973, -0.029750831, 0.052449267, 0.24696672, -0.124532506, -0.040378094, -0.02887898, 0.08495422, -0.10733539, 0.033680625, -0.0040187235) * inp_3_1_0; + result0 += M4(0.28583634, 0.06151723, -0.056340285, -0.07114769, 0.40981525, -0.027857127, 0.23838963, -0.121739745, -0.07850837, 0.05227717, -0.03982672, 0.015378227, 0.29068476, -0.04168, 0.045381863, -0.00013727625) * inp_3_2_0; + result0 += M4(-0.041488778, 0.10742621, 0.037410427, 0.002719236, 0.23568422, -0.2532835, -0.14904994, -0.02132816, -0.26083633, 0.02395297, 0.013597459, -0.022430388, 
0.0039781285, -0.052303746, -0.033815533, -0.08052908) * inp_3_0_1; + result0 += M4(0.19898818, -0.062810175, -0.0030155992, -0.014311552, -0.44702345, 0.43076748, 0.13032986, 0.04623066, -0.4599223, 0.39305303, 0.076502815, 0.01207224, -0.2322498, 0.07225618, 0.09567222, 0.074906886) * inp_3_1_1; + result0 += M4(0.14233728, 0.04341192, -0.14022432, 0.074965544, -0.42312324, -0.21910575, -0.04191498, -0.16155356, 0.016639965, 0.08997261, -0.030961918, 0.14126752, -0.16792814, 0.10337423, 0.07536254, -0.027254093) * inp_3_2_1; + result0 += M4(-0.10881682, 0.0070124045, -0.0734743, 0.02380105, -0.08528868, 0.2052196, 0.28235316, -0.09937192, -0.120403625, -0.18133068, -0.11513659, 0.2849305, -0.093126595, 0.09221593, -0.001545093, 0.118906654) * inp_3_0_2; + result0 += M4(0.07010447, -0.002349371, 0.07754369, -0.59997034, 0.057434276, -0.013308527, -0.12963523, 0.44178784, 0.29675305, -0.008670963, -0.14948617, 1.4333277, -0.048508614, 0.077688985, -0.03507625, 0.398176) * inp_3_1_2; + result0 += M4(-0.041430607, -0.0056431303, -0.03318371, -0.14079575, 0.08872225, 0.03580239, -0.11937835, -0.055355314, -0.23013176, -0.011193484, -0.0024156924, 0.2336995, -0.08273895, 0.021009317, -0.15586923, 0.20260328) * inp_3_2_2; + result1 += M4(0.0513188, -0.06831208, 0.071969114, 0.04630944, -0.10447119, 0.057457622, 0.087569036, 0.111861736, -0.110252105, 0.13196746, 0.07982998, 0.07918412, 0.07207178, 0.06784348, 0.06167251, -0.0048216507) * inp_3_0_0; + result1 += M4(-0.11775122, -0.068306886, -0.1314514, -0.022869237, 0.00013730286, 0.119652584, 0.08880258, 0.17652866, 0.041738562, -0.20556526, -0.09664171, -0.04788704, -0.25071782, -0.040533535, 0.007784405, 0.062077902) * inp_3_1_0; + result1 += M4(-0.16064279, -0.11079397, 0.10935189, -0.012442423, -0.2100082, 0.16263524, 0.03739031, -0.10447196, 0.08221832, -0.081931755, -0.015653074, -0.03437766, 0.22324844, -0.04340437, -0.03868832, -0.07421524) * inp_3_2_0; + result1 += M4(-0.0006676013, 0.040496968, -0.029079301, 
-0.085848354, 0.32673135, 0.02512588, 0.13175364, -0.27145657, -0.29334694, 0.13588892, -0.023815535, 0.2919419, 0.19565086, 0.4451977, 0.008018119, 0.44960222) * inp_3_0_1; + result1 += M4(-0.022897674, 0.022049528, 0.063053586, 0.12857682, -0.08483499, -0.03945858, 0.070367396, 0.106271245, 0.0042700917, -0.02905016, -0.12511766, -0.19536735, -0.3540937, 0.019095879, -0.015849894, 0.06366033) * inp_3_1_1; + result1 += M4(-0.01652925, -0.042448483, 0.008769335, -0.07717558, -0.052162528, -0.322415, 0.11697755, -0.014363827, 0.037944168, -0.029346848, 0.027509725, -0.08859583, 0.50523734, -0.026561983, 0.052579824, 0.0062967185) * inp_3_2_1; + result1 += M4(0.2831015, 0.29757833, 0.05384404, 0.07900192, -0.039041176, 0.29436517, -0.04795067, 0.28521034, -0.00084280485, -0.8624592, -0.2333652, 0.28047234, 0.13323455, 0.13980593, -0.1040817, 0.41841346) * inp_3_0_2; + result1 += M4(-0.056748446, 0.22499406, 0.47074968, 0.0529144, -0.18061697, -0.102058284, -0.45679823, -0.30751905, 0.56470495, -0.6227711, -1.0454521, -0.232476, -0.31827578, -0.16248211, -0.13230376, -0.018044606) * inp_3_1_2; + result1 += M4(-0.27055663, 0.040104035, 0.14919373, 0.020736083, 0.01568136, 0.009609554, -0.04672135, -0.019085662, 0.061935153, -0.2874959, -0.22337474, -0.06617894, 0.24911705, -0.18539925, -0.10120979, -0.028026477) * inp_3_2_2; + result2 += M4(0.024042394, 0.073262535, 0.29006875, 0.14790326, 0.27991506, 0.08672429, 0.63894117, 0.23894568, 0.029150546, -0.003545572, -0.1935614, 0.31723386, -0.026120424, 0.042341888, 0.021989973, 0.39239773) * inp_3_0_0; + result2 += M4(0.12542348, -0.12852398, 0.08891283, -0.14603676, -0.13592839, -0.054619603, 0.016557576, -0.5885332, -0.09488814, -0.07046842, 0.068331644, 0.10981448, -0.007638868, -0.13542384, -0.040854737, -0.005702912) * inp_3_1_0; + result2 += M4(0.07082901, 0.3306401, 0.14118254, 0.15615349, 0.0026882638, -0.15104243, 0.16891389, -0.18970816, 0.029838756, 0.13553977, 0.0018116818, -0.05020311, 0.08921652, 0.1348939, 
0.043923832, -0.12109734) * inp_3_2_0; + result2 += M4(-0.034977324, 0.020053409, -0.37609595, -0.054664034, 0.15570554, 0.28191614, -0.6908297, 0.14370124, 0.08973948, -0.14156595, 0.041179802, -0.0043907193, 0.0063222884, 0.08350338, 0.0016131507, -0.056665104) * inp_3_0_1; + result2 += M4(-0.10248851, -0.1634687, -0.26851672, -0.46094584, 0.13998966, -0.2924333, 0.07655084, 0.1363661, -0.13416262, 0.08360797, -0.0077458336, 0.052660167, 0.064197175, -0.35289478, -0.004854883, 0.09082584) * inp_3_1_1; + result2 += M4(-0.095027156, 0.04068739, 0.03084716, -0.03596515, -0.13508861, 0.04214646, -0.3288225, 0.13073072, 0.1476837, 0.22203143, 0.14448355, -0.24459559, -0.17169268, -0.15294273, -0.10575014, 0.043388218) * inp_3_2_1; + result2 += M4(0.029903082, 0.061882522, 0.008157312, 0.36121556, -0.07368661, 0.08575936, 0.35597792, 0.34465766, 0.104644366, -0.11097311, 0.17444994, -0.10731304, 0.1298015, -0.025148133, 0.1390958, 0.045870513) * inp_3_0_2; + result2 += M4(-0.368986, -0.10517477, -0.11623787, 0.16291271, 0.27432486, -0.06225037, -0.43164015, -0.07802707, 0.6406274, 0.15081723, 0.038465872, 0.071604036, 0.19591734, -0.15255238, 0.13270366, -0.0070306635) * inp_3_1_2; + result2 += M4(-0.43216032, -0.039325733, 0.11141706, 0.12786095, 0.018126328, -0.07048143, 0.16246274, -0.09758973, 0.21826117, -0.11532947, -0.16299699, -0.035572365, 0.13867931, 0.18741262, -0.030538183, -0.04330623) * inp_3_2_2; + result3 += M4(-0.016080486, 0.032022443, -0.165704, 0.07246584, -0.08014878, -0.35844275, 0.113061614, 0.065997146, 0.02371046, -0.0008155743, 0.07187625, -0.08876956, -0.021193719, -0.033109672, -0.07381202, -0.1332826) * inp_3_0_0; + result3 += M4(0.04180735, -0.10776659, -0.027806621, 0.03553281, -0.023503449, 0.0169977, -0.27451426, 0.13919999, -0.042250317, 0.08521528, 0.17336805, 0.094439976, 0.18615168, 0.0021308872, -0.11744622, -0.0066396925) * inp_3_1_0; + result3 += M4(-0.15732574, 0.032522585, -0.09444964, 0.01659268, -0.09113259, 0.1305735, 
-0.11529496, 0.06343632, -0.046901505, -0.05037784, -0.07369559, -0.003344642, 0.07115879, 0.024641449, -0.08119741, -0.0030102434) * inp_3_2_0; + result3 += M4(-0.053414203, 0.29699224, 0.22554293, -0.009535028, -0.034720074, 0.2417781, 0.24099764, -0.4626596, 0.13475932, -0.08492695, 0.015628448, -0.20312022, 0.10430628, -0.012566143, 0.055538982, -0.3632165) * inp_3_0_1; + result3 += M4(0.15908659, -0.048262477, -0.03419863, 0.1971502, 0.59373474, 0.040420167, -0.006936596, -0.02301966, 0.11121678, 0.12800483, 0.26782277, 0.22499534, 0.13175733, 0.031205691, -0.024721615, -0.60766846) * inp_3_1_1; + result3 += M4(-0.120825715, 0.15550387, 0.2964152, 0.045677517, -0.16462475, 0.082349055, 0.025853585, 0.038958352, -0.3481213, 0.024049724, -0.31659842, 0.16717331, 0.1698046, 0.08965835, 0.26032227, 0.0028352945) * inp_3_2_1; + result3 += M4(0.048251737, -0.3381504, -0.06695844, -0.157471, 0.00037351192, -0.23412548, -0.046711236, -0.07236172, 0.006832392, 0.35861197, -0.20628686, -0.060990233, 0.082007684, -0.17143841, -0.121094696, -0.1463941) * inp_3_0_2; + result3 += M4(0.09094426, -0.522618, 0.32228535, -0.094180234, -0.119871415, 0.044149384, -0.47617498, 0.009163124, 0.12564674, 0.5748051, -0.43634674, 0.10976416, 0.099546134, 0.0657549, 0.03073671, -0.026292121) * inp_3_1_2; + result3 += M4(-0.19512002, -0.29417554, 0.16560094, 0.06612767, 0.061374467, -0.08437194, 0.2300457, 0.13011362, -0.19942062, 0.13436554, -0.27281252, -0.03332893, -0.028906567, 0.13050336, -0.08008115, 0.07068302) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 (Conv2D-2-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND 
conv2d_1 +//!SAVE conv2d_2 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.007665273, -0.012706782, -0.01845592, 0.026948148); + V4 result1 = V4(-0.004221884, 0.016139362, -0.014981546, 0.016426912); + V4 result2 = V4(0.023174407, 0.05587216, -0.036808174, -0.002717008); + V4 result3 = V4(-0.036521614, -0.027948106, 0.005269135, 0.016757237); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = 
inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.039672762, 0.14756373, -0.08448369, 0.017731339, 0.025569528, -0.040744573, 0.013367848, -0.019573305, -0.16450569, 0.33285397, -0.11215605, -0.028131716, 0.016628815, 0.023166431, -0.00037328724, -0.08177501) * inp_0_0_0; + result0 += M4(-0.065025754, -0.104294226, 0.094719954, 0.038185492, -0.09666806, 0.027351536, -0.038861245, 0.004919656, 0.19828482, -0.22604604, 0.024477452, -0.10591664, -0.19293559, 0.4599996, 0.04217503, 0.16875263) * inp_0_1_0; + result0 += M4(0.11909007, 0.022196636, 0.034610387, -0.018519526, -0.06364373, -0.008448898, 0.015312234, -0.0006501346, 0.016660782, 0.11387573, -0.049037285, 0.024658464, 0.034969676, 0.10625149, 0.053557772, 0.020835) * inp_0_2_0; + result0 += M4(-0.0125005925, -0.30383512, 0.118058, -0.0622122, -0.053739194, 0.02854181, 0.021767799, -0.023679044, 0.1428111, 0.22441542, 0.13784951, 0.055275932, 0.06970613, -0.03743594, -0.049048167, -0.018928634) * inp_0_0_1; + result0 += M4(-0.061673142, 0.35783702, -0.2123013, -0.0029690831, -0.028315723, -0.014267534, -0.029230714, 0.033998776, -0.017710077, -0.12725465, 0.055828135, 0.16664071, -0.6307306, 0.087453276, -0.24898805, 0.04119017) * inp_0_1_1; + result0 += M4(-0.046845675, -0.034220554, 0.085932806, 0.083577596, -0.014423473, 0.24495147, 0.029078502, 0.05503181, -0.16131906, -0.10079813, 0.042977642, -0.0016745959, -0.65428495, 0.022565061, 0.067007095, 0.03766914) * inp_0_2_1; + result0 += M4(0.06490114, 0.2199838, -0.22797251, -0.23349749, -0.010567795, 0.07199016, 0.0155491065, 0.04098838, 0.101175986, 0.12190727, -0.072651304, -0.14695418, 0.090389036, -0.28267708, 0.05694964, -0.012954298) * inp_0_0_2; + result0 += M4(0.47807366, -0.030264005, 0.49982014, 0.33034417, 0.11898345, 0.19849163, 0.09678157, -0.08528741, -0.2896773, -0.18903524, -0.19259109, -0.20551237, 
0.12084159, 0.02699669, 0.014437785, 0.032559108) * inp_0_1_2; + result0 += M4(-0.45953196, -0.099686995, -0.48402756, -0.29487053, 0.048139166, 0.025708836, -0.06933556, -0.0635896, 0.27754197, 0.049773578, 0.12305871, 0.106278256, -0.2843809, 0.073834695, -0.0054634786, 0.007431036) * inp_0_2_2; + result1 += M4(0.085994475, -0.1193417, 0.0071456973, -0.0188979, 0.04183363, 0.12310363, 0.05413761, 0.04909667, -0.30297938, 0.013713022, 0.033152174, -0.11379657, -0.18750672, -0.22004475, 0.072046556, 0.35643157) * inp_0_0_0; + result1 += M4(-0.044690162, -0.058702532, 0.007017294, -0.041176673, 0.048408784, 0.080121264, 0.14161503, 0.12842357, 0.16440009, -0.21827607, 0.108833574, -0.044027567, -0.7746953, -0.8959941, 0.12757428, -0.1544348) * inp_0_1_0; + result1 += M4(0.042872313, 0.14205654, -0.03782293, 0.14235368, 0.130305, 0.009863965, -0.036303528, 0.1701927, -0.032293867, 0.22456177, -0.062228113, 0.2358024, -0.16976565, -0.43414745, -0.21161576, 0.099397495) * inp_0_2_0; + result1 += M4(-0.17363705, 0.0061433585, -0.13879266, 0.051511798, -0.022545822, 0.10734877, 0.06815579, -0.027122574, 0.04138703, -0.15504237, 0.16342735, -0.072404325, -0.20245026, -0.052299656, -0.02321829, 0.002982435) * inp_0_0_1; + result1 += M4(0.02651482, 0.12583537, 0.45761207, -0.095229685, -0.09167909, 0.25368944, 0.1494136, 0.017393095, -0.22577058, -0.07560319, -0.5818347, -0.5617876, -0.20395924, -0.37043095, 0.25695607, 0.45370623) * inp_0_1_1; + result1 += M4(0.15493771, -0.1451798, -0.32017693, 0.106086396, 0.14634423, 0.22603515, 0.07768741, -0.010450286, 0.002767987, 0.46913233, 0.23929594, 0.44290265, -0.05627698, -0.33913442, 0.029245248, -0.02599956) * inp_0_2_1; + result1 += M4(-0.0021248949, 0.3092833, 0.15976787, 0.17359373, 0.12920043, 0.106215686, 0.111749046, 0.032766804, 0.0702469, -0.12661065, -0.1285257, -0.08318957, -0.06495591, 0.021884361, -0.043050367, -0.048703246) * inp_0_0_2; + result1 += M4(-0.20655625, -0.51618236, -1.0094728, -1.0106137, 
0.18894927, 0.06065753, 0.12400759, -0.07092802, 0.30361733, -0.16834623, -0.015209634, -0.0769189, -0.21808125, -0.07767393, 0.054584887, -0.3680687) * inp_0_1_2; + result1 += M4(-0.33314708, -0.15586081, 0.6099683, 0.13461177, 0.057432342, 0.22775277, 0.21322937, 0.0532397, 0.21244651, -0.0720669, 0.020412793, 0.037264194, 0.06017442, -0.2044945, 0.040000513, 0.19136631) * inp_0_2_2; + result2 += M4(-0.022256808, 0.04888811, -0.022015247, -0.092115186, 0.020818705, -0.028380645, 0.06185778, 0.08197749, -0.15860432, 0.108361594, -0.19694375, 0.07381369, 0.15101261, 0.14137074, -0.088994004, -0.5152534) * inp_0_0_0; + result2 += M4(0.06987822, -0.082000196, 0.02866381, 0.02108778, -0.051829483, -0.10683904, 0.12230972, 0.06575793, 0.090399876, -0.09562653, 0.043466404, 0.045909394, -0.020149088, -0.023214703, -0.30334076, -0.152464) * inp_0_1_0; + result2 += M4(0.0811315, -0.031609118, 0.01223644, 0.037147917, -0.18350898, -0.07458222, 0.089401655, 0.04162907, 0.103615806, -0.10315151, -0.07726605, 0.19025756, 0.1799963, -0.01810218, -0.14209187, -0.16685213) * inp_0_2_0; + result2 += M4(0.36047256, 0.1324033, -0.035303097, -0.029761754, -0.08453878, -0.092538394, 0.048813272, 0.2952445, -0.16890605, -0.24446781, -0.2384415, -0.051971577, 0.17304648, 0.015542306, -0.4414377, -0.20117971) * inp_0_0_1; + result2 += M4(-0.045148943, -0.3111919, 0.11992417, -0.027939236, -0.18373263, -0.015571242, 0.16786881, 0.19525638, 0.017805958, -0.23059563, -0.410443, -0.16854092, 0.1441553, -0.45532706, -3.1361716, -0.3325092) * inp_0_1_1; + result2 += M4(-0.38618526, 0.13740632, -0.08181973, 0.03373343, -0.14354973, -0.21948239, 0.18439542, 0.15648417, -0.085576214, 0.26852188, -0.26260558, 0.039526124, 0.25491875, 0.045001876, 0.11680835, -0.30998042) * inp_0_2_1; + result2 += M4(-0.22676072, -0.19009703, 0.22159863, -0.30039275, -0.02362561, -0.11382714, 0.12698817, 0.44949046, 0.26380983, 0.025303096, -0.06650232, 0.036743466, -0.23880884, 0.034025613, 0.016137755, 
-0.020864155) * inp_0_0_2; + result2 += M4(0.35370076, 1.4717959, -0.39453936, 0.012876503, -0.22790988, 0.013500226, -0.023526462, 0.40373355, -0.12799382, -0.35260844, 1.2150608, -0.2795026, 0.09862312, -0.31711802, -0.38266385, -0.4625872) * inp_0_1_2; + result2 += M4(-0.006961403, -0.38303775, -0.023807812, -0.032239847, 0.1080835, -0.20735481, 0.20969796, 0.23094925, -0.05239786, 0.12599377, 0.20246367, 0.14485277, 0.13914481, 0.018579604, -0.0628238, -0.22654083) * inp_0_2_2; + result3 += M4(-0.008393504, 0.06399756, -0.0042330017, -0.038735587, 0.009515421, -0.009107273, 0.033609197, 0.017786147, -0.056026146, -0.015695263, -0.101369716, -0.047951315, -0.0045006033, -0.024499964, -0.059617385, -0.050731726) * inp_0_0_0; + result3 += M4(0.05816133, -0.016608475, -0.008917803, 0.0039858357, 0.04840855, -0.03989783, 0.021003753, 0.11802983, 0.04186096, -0.02740838, 0.03711145, -0.15018326, 0.06298314, -0.13889475, 0.0056237825, -0.1520681) * inp_0_1_0; + result3 += M4(-0.0464783, 0.0043105236, 0.05190762, -0.016212137, 0.08643694, 0.044873476, 0.01192245, 0.073939085, -0.050208796, -0.06378546, 0.040115822, -0.10028227, 0.17046078, 0.104430355, 0.04660742, 0.004472599) * inp_0_2_0; + result3 += M4(0.01869681, 0.17765687, -0.01132854, -0.028719053, 0.03712774, -0.03786645, 0.021126691, 0.03835777, 0.07792008, 0.21017025, -0.017897833, -0.09897833, -0.08394025, 0.14385825, 0.021313882, -0.0965509) * inp_0_0_1; + result3 += M4(0.26953533, -0.046034764, -0.04922047, 0.2146039, -0.06167827, 0.10177388, -0.00028696132, 0.24834304, 0.21333528, 0.09260683, -0.062288165, 0.011650751, -0.35006827, 0.34293538, 0.45763996, -0.2745375) * inp_0_1_1; + result3 += M4(-0.248477, 0.13341399, 0.046218965, -0.23830393, 0.046279684, -0.04249783, 0.05034412, 0.22284749, 0.19501184, -0.013352284, -0.08176439, 0.062934145, -0.38506672, 0.22943279, 0.09323349, 0.055179156) * inp_0_2_1; + result3 += M4(-0.16656476, -0.9840606, -0.20659976, -0.763574, -0.043892097, -0.44524747, 
-0.019569376, 0.08370716, -0.00852045, -3.123414, -0.08242622, 0.15859091, 0.057629827, 0.21355532, 0.048139296, 0.13085455) * inp_0_0_2; + result3 += M4(0.16033624, -0.8272528, 0.20588383, 0.8193101, 0.07821069, -0.8910632, 0.08296487, 0.28125536, -0.024175977, -3.1040792, 0.06526852, -0.1698219, -0.008097565, 0.17878205, -0.021604018, -0.03205016) * inp_0_1_2; + result3 += M4(0.30415177, -0.04037523, -0.30204728, 0.1479439, 0.08117435, -0.59381247, -0.028565824, 0.3110151, 0.07412945, -2.6523457, 0.13584737, -0.14663945, -0.13277556, 0.3445814, -0.08542846, 0.10787985) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.014861815, 0.066454895, -0.018906003, -0.023595516, -0.016467934, 0.08245411, 0.058886092, -0.00517167, 0.0736858, -0.33098358, -0.053136736, 0.042932037, -0.023391662, -0.0154059855, 0.0027027188, 0.04671472) * inp_1_0_0; + result0 += M4(0.12285722, 0.02999312, -0.024734395, 0.052841812, -0.07606859, 0.532711, 0.029948376, 0.07419315, -0.1194898, -0.7954723, -0.117610976, -0.0037800272, 0.046508733, 0.15742284, -0.030505521, -0.06849125) * inp_1_1_0; + result0 += M4(0.10988922, -0.021709241, 0.0027044513, -0.087975435, -0.037619695, 0.1729772, 0.043288194, -0.00652201, 0.215917, -0.13082863, 0.0029795505, 0.026782269, 0.18413892, 0.009974911, 0.07329704, 0.057529766) * inp_1_2_0; + result0 += M4(-0.068852276, -0.015672447, 0.08639786, 0.015099182, -0.14214975, 0.03751679, 0.01517611, 0.017874567, 0.010275957, 
-0.33464134, 0.023621306, 0.06633157, 0.18977083, 0.014755853, -0.021573516, -0.025924493) * inp_1_0_1; + result0 += M4(0.18194625, 0.21327859, -0.022046618, -0.0863755, -0.10154144, 0.11552613, -0.02150014, 0.08803059, 0.33497876, 0.11428454, 0.7498792, 0.24571484, 0.11873142, -0.40479037, 0.12675676, 0.076739) * inp_1_1_1; + result0 += M4(-0.38466164, -0.03697603, -0.037561305, -0.043681134, -0.6816189, 0.13083659, 0.07451801, -0.003327551, 0.5126916, -0.09917474, -0.0708578, 0.01648595, 0.423934, -0.34497714, -0.02784395, 0.010498842) * inp_1_2_1; + result0 += M4(-0.08783385, 0.033599894, 0.006346594, -0.006446634, -0.016138535, 0.045155555, -0.04009477, -0.018183654, -0.013776878, -0.014323365, 0.05841988, 0.076961026, -0.047537193, -0.0663202, 0.03427056, 0.03428585) * inp_1_0_2; + result0 += M4(-0.09914099, -0.032711275, 0.097858556, 0.117271565, -0.056332853, 0.09818337, -0.05306024, -0.04881118, 0.23671569, 0.02282729, 0.025347842, 0.03629352, -0.075708866, -0.023583038, 0.03354702, 0.007265923) * inp_1_1_2; + result0 += M4(0.36997548, 0.052172437, -0.023425005, 0.042993546, -0.08452691, 0.12523419, -0.044003073, -0.0430429, 0.016587403, -0.14865886, -0.03721655, -0.031733558, 0.021108441, -0.041968603, 0.0120479325, 0.0014579248) * inp_1_2_2; + result1 += M4(0.32410297, 0.16156995, -0.2704675, -0.15474492, -0.0051417057, 0.0736679, -0.027583983, 0.042698298, 0.029605344, -0.097892836, -0.042276148, -0.17086019, 0.05914977, -0.0958991, 0.024540406, -0.014890719) * inp_1_0_0; + result1 += M4(-0.17057064, -0.06878893, 0.09484002, -0.46547592, 0.16778767, 0.21305582, 0.055226404, 0.14098307, -0.24932669, -0.6438276, 0.1469775, 0.15965456, 0.13635448, -0.10718979, 0.08083247, -0.47670645) * inp_1_1_0; + result1 += M4(0.033564653, 0.10775614, -0.082825914, -0.10517869, 0.19951133, 1.1163155, -0.15247913, 0.20495285, 0.057683297, -0.844752, 0.16111496, -0.44034448, -0.20139556, -0.9145029, -0.13836655, 0.1408168) * inp_1_2_0; + result1 += M4(0.103660226, 
0.21737917, -0.16172896, 0.13338298, -0.018703043, -0.07260912, -0.040737107, 0.034949742, -0.19936053, 0.051139116, -0.020942764, 0.009280968, 0.027868485, 0.002934873, -0.07566193, -0.104706034) * inp_1_0_1; + result1 += M4(0.35724416, -0.077911, 0.09947001, -0.6117375, 0.21342002, 0.060938604, -0.20370094, 0.3130246, -0.47341087, -0.30221367, 0.4240177, -0.0758348, -0.12976281, 0.024794862, -0.07694939, 0.101710096) * inp_1_1_1; + result1 += M4(-0.14973663, -0.2178218, -0.022833738, 0.5495507, -0.014890054, 0.36719897, 0.0068603246, 0.8096376, 0.054707617, -0.11853919, -0.20341462, -0.7495799, -0.03551902, -0.3992545, -0.40176797, -0.058236588) * inp_1_2_1; + result1 += M4(0.1114995, 0.018287987, -0.1068866, 0.30490544, 0.026842179, 0.09772784, 0.021783939, 0.06514757, -0.02939784, 0.0063857757, 0.052597906, -0.029246058, 0.03607791, -0.026882924, 0.0045780633, -0.015172184) * inp_1_0_2; + result1 += M4(-0.040682446, -0.045952864, 0.14679994, 0.3277869, -0.010540915, -0.075695984, -0.047419466, 0.34779298, 0.02479446, -0.020837042, -0.0089015765, -0.34170833, 0.08684945, -0.019799326, 0.009023451, -0.073233105) * inp_1_1_2; + result1 += M4(-0.05574628, 0.18257698, 0.121048525, -0.3028285, 0.021456659, -0.1035951, -0.032101694, 0.4428228, -0.14607942, 0.017202685, -0.027647339, -0.24124599, 0.05897191, -0.095147684, -0.052099764, -0.19641311) * inp_1_2_2; + result2 += M4(-0.0677571, -0.14728205, 0.2918349, 0.17206684, 0.09093841, 0.017973123, -0.0043883957, -0.15070698, 0.13623445, -0.03267367, -0.035259522, 0.2057031, 0.10146496, -0.043358415, -0.059748214, 0.09960731) * inp_1_0_0; + result2 += M4(-0.084727354, 0.11521498, 0.00149433, 0.027532067, 0.048819114, -0.105092816, -0.009181161, -0.13722752, -0.44462013, -0.22134246, 0.10355644, 0.08042798, -0.004623407, -0.16590333, -0.11398178, 0.008029647) * inp_1_1_0; + result2 += M4(-0.0021335448, -0.15116176, 0.20302649, 0.055204622, 0.07024495, 0.056478035, 0.09759212, 0.033892937, 0.0037432178, 0.07928205, 
-0.04295959, 0.11223701, -0.22060403, -0.042706113, -0.28266382, -0.025342258) * inp_1_2_0; + result2 += M4(-0.18853788, -0.37525776, 0.33662406, 0.0021643888, 0.046762835, 0.043696124, -0.0014363487, -0.28293067, -0.16980772, 0.048948396, 0.3054481, -0.25124067, -0.12796396, -0.13256674, 0.061534125, 0.13214476) * inp_1_0_1; + result2 += M4(0.15168403, -0.30957776, -0.2828841, 0.25446436, 0.55487597, -0.07893502, -0.5719077, -0.7259194, -0.109957784, 0.36705047, 0.23906712, 0.019667521, -0.15451595, 0.08622951, 0.4389705, 0.56009406) * inp_1_1_1; + result2 += M4(-0.062005397, 0.08156719, -0.16399525, -0.06189081, 0.06525984, 0.09745813, 0.39185095, -0.29123664, -0.15941338, 0.08956102, -0.21950622, 0.11557442, 0.38353565, 0.1466502, -4.3374176, 0.34140408) * inp_1_2_1; + result2 += M4(0.092709705, -0.15493768, -0.012704912, -0.117980175, 0.07436645, -7.8802695e-05, -0.058275957, -0.18827915, -0.0631416, -0.0373527, -0.11127798, -0.009910854, -0.011067589, -0.0053280033, 0.022658903, 0.06333271) * inp_1_0_2; + result2 += M4(0.0916497, 0.1943221, 0.37540963, -0.046307754, 0.00953411, 0.066546984, 0.2116024, -0.5158029, -0.032494158, 0.14182144, -1.8395805, 0.3173581, -0.09340417, -0.10758007, -0.15254256, 0.32740375) * inp_1_1_2; + result2 += M4(0.025273405, 0.08492187, -0.14413005, -0.05747447, 0.089801, -0.03564784, -2.2446504, -0.4472199, -0.12965105, 0.009225538, 0.10549652, 0.11036174, -0.115849234, -0.099777445, 0.12770584, 0.31634042) * inp_1_2_2; + result3 += M4(0.021053081, -0.055306282, -0.081807986, -0.21331595, -0.000998926, 0.008907352, 0.016980026, 0.009302538, 0.04861071, -0.0046227667, -0.0016314664, -0.07899752, -0.078419186, -0.11081667, -0.030900553, 0.02087226) * inp_1_0_0; + result3 += M4(0.1846625, 0.099488035, -0.05193646, -0.095876545, -0.0011387762, 0.015150568, -0.010261407, -0.013941359, -0.042803578, 0.059049208, -0.07620146, -0.102711946, -0.034578953, 0.20519276, 0.097422205, 0.025764102) * inp_1_1_0; + result3 += M4(-0.43959314, 
0.16758272, 0.035562072, -0.07742551, -0.38682875, 0.046922028, 0.08865273, -0.044875767, -0.80026156, -0.06039983, 0.024169726, -0.13747011, -0.55590475, -0.23130962, -0.04149803, -0.08241675) * inp_1_2_0; + result3 += M4(0.030927973, -0.6119503, 0.10466902, -0.12390426, 0.034730162, -0.10333266, 0.02035231, 0.013106206, -0.05916547, -0.777083, -0.006414744, -0.011363021, 0.035848703, 0.36386737, -0.002772792, -0.0480502) * inp_1_0_1; + result3 += M4(0.5065, 0.19396274, 0.14151096, -0.35221586, 0.09600475, -0.014168858, -0.034725133, 0.05604017, -0.13955177, -1.0448937, -0.19251399, 0.007042205, 0.14856394, 0.38436663, -0.0064019714, -0.014204183) * inp_1_1_1; + result3 += M4(-0.061922383, -0.12842242, -0.07295167, -0.0075706756, 0.10817202, -0.1655033, 0.07266308, -0.022521412, -0.093321756, -0.876699, -0.018780176, -0.14927478, -0.03584319, -0.5748604, -0.024849145, -0.17630738) * inp_1_2_1; + result3 += M4(-0.025384348, 0.49858052, -0.075553015, 0.025753077, 0.002560775, -0.37545115, -0.028084433, 0.030594576, 0.0049141925, 0.15890612, 0.08069018, -0.08922643, 0.036730718, -0.2823979, 0.031380307, 0.031606745) * inp_1_0_2; + result3 += M4(0.23545441, -1.2197607, -0.025337541, 0.21307686, -0.09559411, -0.8597017, 0.034877297, -0.015559628, 0.058392383, 0.3864891, -0.053282253, -0.055226818, -0.007128761, -1.8220773, 0.02058869, 0.017222092) * inp_1_1_2; + result3 += M4(0.080354765, -0.09153391, 0.029530875, 0.03370949, -0.07208025, 0.2936868, -0.05797227, 0.013, 0.052441202, -1.7494535, 0.052883293, 0.008096113, -0.028412474, -2.4877417, 0.005800512, 0.025508739) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 
inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.03952951, 0.038941756, 0.09056351, 0.097450286, -0.1596078, -0.1410198, 0.168562, -0.026641607, -0.054110724, -0.0563214, 0.034391247, 0.021438785, 0.0057072574, -0.107405394, -0.04044469, 0.044145353) * inp_2_0_0; + result0 += M4(0.11733438, -0.20137449, -0.040039547, 0.02093038, -0.2984962, 0.2671289, -0.19594978, -0.06000205, -0.041333724, -0.114821054, 0.00012655034, -0.018803762, 0.02485363, -0.010562574, 0.06306494, -0.0020644043) * inp_2_1_0; + result0 += M4(-0.036415216, 0.10247068, -0.030816095, -0.040820822, -0.04745717, 0.020836288, 0.06765466, 0.007323091, -0.06571431, 0.027249105, -0.051204715, -0.019635567, 0.05453804, -0.12017959, -0.035392873, 0.028308189) * inp_2_2_0; + result0 += M4(-0.04156831, 0.28028694, 0.06831695, 0.022350814, 0.13675615, 0.15137945, -0.0084258355, 0.53870726, -0.07335624, 0.00800944, 0.012506781, 0.057974383, 0.013222071, -0.14250757, -0.007383215, 0.031982966) * inp_2_0_1; + result0 += M4(0.65670925, -0.30265868, 0.2362948, 0.12972662, 0.20985337, -0.45745087, 0.22702388, 0.083776616, -0.06499208, 0.03460006, -0.041461278, -0.025413781, 0.019352706, -0.45709613, 0.014837353, 0.027197322) * inp_2_1_1; + result0 += M4(0.57660085, -0.09744273, -0.009441254, -0.03757566, 0.019752283, -0.067605585, -0.009568382, 0.07353522, -0.064801805, 0.13704818, -0.034330864, 0.0051319897, 0.20990741, -0.33425754, -0.016691428, -0.028612768) * inp_2_2_1; + result0 += M4(-0.10979933, 0.18432014, -0.074066855, 0.0054639196, 0.098094076, 0.064506084, 0.26912084, 0.16957463, 0.07098004, 0.023026804, 0.071376055, 0.034128394, 0.059867695, -0.08107985, 0.10168895, 0.08820417) * inp_2_0_2; + result0 += M4(-0.2552831, -0.052631672, 0.050921284, -0.016037157, -0.116781406, -0.07262549, -0.0022834113, -0.088421635, 0.15951507, 0.00042410966, 0.07465069, 
0.0019270786, 0.10275644, -0.3381453, 0.24874882, 0.10901488) * inp_2_1_2; + result0 += M4(0.36554116, -0.027189862, 0.0032612395, 0.004169092, -0.042129308, 0.044692904, 0.040775307, 0.010006452, -0.021286374, 0.073701605, -0.0044975975, 0.0043594157, 0.54600775, -0.14487681, 0.062218707, 0.01976116) * inp_2_2_2; + result1 += M4(0.014763889, 0.11339801, 0.032690678, -0.08592508, 0.103032224, -0.09282646, -0.098232545, 0.3981169, -0.03748985, 0.06707042, 0.019140782, 0.06538452, 0.0027186018, -0.0030862922, 0.029157702, -0.006268967) * inp_2_0_0; + result1 += M4(-0.16860075, -0.18705767, 0.29325658, 0.07206259, -0.2872574, 0.5612131, 0.04638324, 0.49310178, -0.19112644, 0.17206986, 0.0029015448, -0.059934225, 0.028581057, -0.13357182, -0.038109895, 0.0005232052) * inp_2_1_0; + result1 += M4(0.15277332, 0.007269086, 9.9966186e-05, 0.23408552, 0.14690994, -0.058067933, 0.008219528, 0.19074975, -0.1848797, 0.024352368, 0.05464677, 0.06272763, 0.008818596, 0.08902247, 0.035453882, -0.11298582) * inp_2_2_0; + result1 += M4(0.15972948, -0.15435955, 0.053044003, -0.048703156, 0.07449017, 0.52491075, 0.29206496, -0.09729822, -0.14646658, 0.11030144, 0.08527744, 0.10426317, -0.13405898, 0.060408086, 0.06603381, -0.0022193235) * inp_2_0_1; + result1 += M4(0.26860082, 0.7463653, -0.14953612, -0.47049257, -0.031829864, -0.8885134, 0.14411287, -1.1775255, 0.014824517, 0.16122791, 0.1182362, 0.1877675, -0.027240504, 0.21426389, -0.030941296, -0.14024088) * inp_2_1_1; + result1 += M4(-0.05250066, 0.18955119, -0.00546335, 0.2086277, 0.026105952, 0.09914598, -0.120411806, -0.24279192, -0.15098634, 0.12038881, 0.24426264, 0.08256465, -0.1532883, 0.08571956, -0.05187043, -0.50765544) * inp_2_2_1; + result1 += M4(0.1040866, -0.05975824, 0.023336973, -0.032634534, -0.05037019, 0.14335546, 0.12934166, 0.6264734, -0.03757042, 0.113765046, 0.07949648, 0.14570814, -0.041041322, 0.060453493, 0.08972462, 0.048948) * inp_2_0_2; + result1 += M4(-0.00400568, 0.06874304, -0.06918383, 0.535076, 
0.20119326, 0.4890317, 0.08677889, 0.06478608, -0.071693674, 0.14588821, 0.000260698, 0.06933203, 0.012584373, 0.1483624, 0.17692986, -0.21019499) * inp_2_1_2; + result1 += M4(-0.0102418875, 0.10566752, -0.061612416, -0.28907233, 0.0599261, -0.07173808, 0.046218887, -0.09600095, -0.1028075, 0.20061518, 0.07601999, 0.15499063, -0.029355908, 0.16779986, -0.15463807, -0.5739547) * inp_2_2_2; + result2 += M4(0.19928946, -0.033282038, 0.057147387, 0.115399025, 0.020315133, 0.02849115, 0.09572222, -0.044312302, 0.006143764, 0.12822536, 0.097994566, -0.124979936, -0.0746315, 0.026666824, 0.004227371, 0.08828524) * inp_2_0_0; + result2 += M4(0.19336012, 0.37895447, 0.15984185, 0.09104523, 0.124388486, 0.048203543, 0.2084745, 0.11253485, -0.07148966, 0.14339097, 0.08032688, -0.17872952, -0.049673792, -0.008513587, 0.025794912, 0.03211732) * inp_2_1_0; + result2 += M4(-0.26330376, 0.19026726, 0.1857569, 0.1315198, 0.064501986, 0.10317745, -0.0176552, 0.02821371, -0.18644843, 0.1889562, 0.10001778, -0.104555264, 0.064582534, 0.06963303, 0.0025069967, -0.0014127698) * inp_2_2_0; + result2 += M4(0.066179745, 0.013192936, 0.030699657, 0.044947155, -0.29488063, -0.17109951, 0.1126733, 0.14376812, -0.078351244, 0.14674957, 0.07026974, -0.16070388, -0.2022285, 0.0499185, 0.03827287, 0.116912186) * inp_2_0_1; + result2 += M4(-0.073056035, 0.3671889, 0.25542954, -0.17342108, 0.025615497, -0.12021865, 0.13177577, -0.2007023, -0.13627052, 0.2357552, 0.13015415, -0.35278785, -0.43087515, 0.169868, 0.06493807, 0.04443809) * inp_2_1_1; + result2 += M4(-0.045416348, -0.025851315, 0.007347807, -0.004663971, -0.062454782, -0.038503435, -0.10300142, -0.050885145, -0.22055164, 0.079387955, 0.27758706, -0.20710965, -0.20509078, 0.24001168, 0.04358121, -0.028955676) * inp_2_2_1; + result2 += M4(0.26075888, 0.013541241, 0.06371779, -0.051259648, -0.110951304, 0.039574105, 0.56873083, 0.084856056, -0.11592972, 0.068496436, 0.12595423, -0.09547746, -0.13057609, 0.07384179, 0.014910358, 0.07805904) 
* inp_2_0_2; + result2 += M4(-0.12786224, 0.26142845, 0.24205787, -0.18063907, -0.320074, 0.08904255, -0.41527358, -0.21437109, -0.0011689005, 0.1619207, 0.12261965, -0.45217648, -0.52569383, 0.107322425, 0.19049393, 0.08988259) * inp_2_1_2; + result2 += M4(-0.09822684, -0.045753952, -0.009845761, 0.14947642, 0.06210613, -0.06658182, 0.2632897, 0.08839577, 0.09217471, 0.11952383, -0.01280119, -0.3180698, -0.4636886, 0.10647941, -0.05618376, 0.095478706) * inp_2_2_2; + result3 += M4(-0.07195442, -0.026333254, 0.12311325, 0.12909564, 0.084573925, -0.054440748, 0.053060867, 0.17208287, 0.05446062, -0.03114994, 0.044506367, -0.026369767, 0.01629298, -0.007789797, -0.018678132, -0.06553193) * inp_2_0_0; + result3 += M4(-0.24843477, -0.042103805, -0.018636895, 0.09162976, 0.08486336, 0.08406515, -0.10784883, 0.21382321, 0.07368658, 0.006697408, 0.028386468, -0.09322328, -0.012220106, 0.044635873, 0.045417525, -0.0190928) * inp_2_1_0; + result3 += M4(-0.026487457, -0.019765217, -0.055956613, -0.12057359, 0.061001785, -0.011873475, 0.019730749, -0.020624056, 0.0407704, 0.03941482, -0.050869886, -0.07624975, -0.02593104, 0.003896486, -0.019085458, -0.025894178) * inp_2_2_0; + result3 += M4(0.11962663, 0.27838814, 0.061310023, 0.17531951, -0.07656211, 0.065626204, 0.14210185, 0.12210379, -0.019672073, 0.062481478, 0.0018487858, 0.011222493, -0.029829169, 0.022130238, -0.0002840079, -0.04773493) * inp_2_0_1; + result3 += M4(0.49700227, 0.27449438, 0.33256647, 0.13850217, 0.24635719, 0.20387016, 0.17043021, -0.0163939, -0.1460736, -0.053372465, -0.038251426, -0.13872208, 0.067372546, -0.07736337, -0.009627407, -0.0026862074) * inp_2_1_1; + result3 += M4(0.1817412, 0.22691032, -0.043124903, -0.035016127, 0.054409128, 0.05345417, -0.042170398, 0.059411958, 0.06607303, -0.062856466, 0.096283935, 0.045097217, 0.025960647, 0.08227504, -0.0507895, 0.043821495) * inp_2_2_1; + result3 += M4(-0.031986434, 0.012987435, -0.08489054, -0.026731597, -0.0078079957, -0.13354276, 0.060593486, 
0.060747415, -0.010851016, 0.4664801, 0.06491011, -0.023194442, -0.04618695, -0.007261282, 0.070509985, -0.0035181446) * inp_2_0_2; + result3 += M4(-0.018880002, -0.550916, 0.07930929, 0.0028127227, 0.11175226, -0.73254424, 0.013858653, 0.111013226, 0.008463192, 0.122215405, 0.025371715, -0.14817141, -0.009153332, -0.5058772, 0.2843366, -0.09837672) * inp_2_1_2; + result3 += M4(0.06638847, -0.379183, 0.07764303, -0.08592844, 0.056915276, -0.20073003, 0.05886113, 0.012288142, 0.07630634, 0.86829257, -0.07294268, -0.17273578, -0.019856475, -0.8567808, 0.064931154, -0.130162) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.07428233, -0.11267418, 0.037147317, 0.012798383, -0.019355856, 0.2063775, -0.04869492, 0.023931865, 0.01826915, 0.061503474, 0.0725478, -0.016411101, 0.101941735, -0.07801213, 0.04161863, 0.0091594625) * inp_3_0_0; + result0 += M4(-0.010983235, -0.16873623, 0.09934868, 0.1475657, 0.3739511, -0.26998657, -0.0023212505, -0.13427515, -0.12743473, 0.32550758, -0.00587959, 0.020362807, 0.14574823, -0.055605818, -0.089228176, 0.07283733) * inp_3_1_0; + result0 += M4(-0.029632267, -0.006311438, 0.03683852, 0.0460545, -0.30349982, -0.22447036, -0.104302175, 0.006356504, -0.13840042, 0.165813, -0.03996628, -0.0009846408, 0.17081043, -0.005697063, 0.0636153, -0.015204903) * inp_3_2_0; + result0 += M4(-0.0288406, -0.33211818, 0.21823318, -0.4359618, 0.13476162, 0.2285806, -0.03546847, -0.036070306, -0.25634402, 
0.13865985, -0.043487567, 0.011144803, 0.005096203, -0.04584228, -0.0008283112, -0.05267128) * inp_3_0_1; + result0 += M4(-0.10899708, 0.3470446, 0.0151194865, 0.025779225, 0.016572125, -0.08544362, 0.11226876, 0.027983677, -0.22979917, -0.041324202, 0.07830652, 0.1347805, -0.32296747, -0.0066952063, 0.06512874, 0.55718046) * inp_3_1_1; + result0 += M4(0.13161051, -0.019632412, -0.007245154, -0.046875164, -0.0063375905, 0.12709594, 0.048449367, 0.051778726, -0.24015811, 0.21853109, 0.052569073, 0.061736215, -0.197316, 0.1515158, -0.027146904, -0.044522174) * inp_3_2_1; + result0 += M4(0.048434425, 0.22990787, -0.01401221, -0.09624674, 0.011959234, 0.24457654, -0.06643086, -0.07578145, -0.13297154, -0.036548138, 0.049699903, 0.06231048, -0.110873826, -0.076110214, 0.002417552, 0.06022659) * inp_3_0_2; + result0 += M4(-0.41839388, 0.22337331, 0.039156444, 0.0853396, 0.021588642, 0.0067923763, -0.12538072, -0.0549457, -0.1382161, -0.018326575, 0.041040212, 0.0237146, 0.05310075, 0.12090509, 0.08417775, 0.0426096) * inp_3_1_2; + result0 += M4(0.01903611, -0.03635987, -0.02728464, -0.0124920765, 0.012841934, -0.0045961696, 0.029713307, -0.040158134, -0.16160838, 0.07344862, 0.058719117, 0.05547189, 0.22943653, -0.039776597, 0.019647159, 0.049335755) * inp_3_2_2; + result1 += M4(-0.050886225, 0.010773032, 0.068307996, 0.05066938, -0.10175775, 0.11504418, 0.057479113, -0.07015231, -0.011961269, 0.05447044, -0.024111401, 0.03896853, 0.011676859, -0.00091025315, 0.0037686634, 0.01574372) * inp_3_0_0; + result1 += M4(0.0011024862, -0.6409941, -0.04154058, -0.29942003, -0.04070786, 0.6291146, -0.31498915, -0.22144635, -0.10045137, -0.06473676, 0.0025352717, 0.03836787, 0.11647241, -0.06366675, -0.12816723, -0.26756752) * inp_3_1_0; + result1 += M4(0.059803132, 0.04112017, -3.865815e-05, -0.21099187, -0.0766396, 0.49812844, 0.23124191, 0.19388396, -0.10059807, 0.13539618, 0.012365532, 0.26512218, 0.27849954, -0.4466902, -0.14386821, 0.013069269) * inp_3_2_0; + result1 += 
M4(-0.0011572625, -0.08685813, 0.03506645, 0.32730153, 0.05965957, -0.030346887, -0.033162106, 0.10434774, 0.087460466, -0.04626651, -0.016391698, -0.055453468, 0.09741922, 0.04287869, -0.030375898, -0.033166446) * inp_3_0_1; + result1 += M4(0.20846428, -0.74136734, 0.5844527, 0.08609542, -0.015801225, 0.030329805, 0.13481435, -0.0682619, 0.12169573, 0.23842777, 0.006281105, -0.050572608, -0.20900005, -0.37843063, 0.59546393, 0.07246317) * inp_3_1_1; + result1 += M4(0.07766126, -0.089687124, -0.02369101, -0.39898276, 0.08709351, 0.15610176, -0.14815669, 0.13425788, 0.032636512, 0.011805772, 0.1855222, 0.49408266, 0.2102859, -1.2030262, -0.12703134, -1.5024164) * inp_3_2_1; + result1 += M4(0.08445707, -0.13061571, -0.09417561, -0.48509976, 0.07966434, 0.023925027, 0.032142166, 0.044588283, 0.011262317, -0.011922964, 0.09275115, -0.019332774, -0.08464665, -0.036373246, 0.057657905, 0.008083529) * inp_3_0_2; + result1 += M4(-0.013658516, 0.17535844, 0.43256798, -0.3588802, 0.21435346, 0.15809372, 0.05006835, -0.043844294, 0.04974172, 0.21411541, 0.03997919, 0.14509, 0.05745982, -0.02040189, 0.12265856, -0.26175705) * inp_3_1_2; + result1 += M4(-0.012978171, -0.06615713, -0.016302722, -0.07360273, 0.1120467, 0.2523338, 0.013040222, 0.07845912, 0.12137823, 0.13015787, 0.036681052, 0.09809164, 0.014065165, -0.122808255, -0.039797485, -0.46501014) * inp_3_2_2; + result2 += M4(-0.080871835, -0.22307916, 0.07004091, 0.06692253, -0.25825113, -0.030632246, 0.07111695, 0.44181773, 0.09049517, -0.008341272, 0.044914108, -0.18295835, -0.014715955, -0.008019641, -0.03798547, -0.074919805) * inp_3_0_0; + result2 += M4(-0.060306337, -0.19063218, -0.20212461, -0.011923865, 0.2857088, 0.009115366, 0.11899254, 0.14336674, 0.18231158, -0.13981315, 0.045094874, -0.09755735, 0.040069308, 0.016306436, -0.21158268, -0.06527811) * inp_3_1_0; + result2 += M4(-0.00039039235, -0.03416186, 0.018411878, -0.010035256, 0.0074744555, -0.30681312, 0.04060132, 0.08147552, 0.033693682, -0.037743136, 
0.009858464, -0.057877015, -0.015383695, -0.07576271, -0.03201459, -0.07223331) * inp_3_2_0; + result2 += M4(0.15047242, -0.10756204, 0.09433242, 0.14607352, 0.028909385, 0.07892575, 0.007390004, 0.14807044, 0.056910306, -0.037883703, 0.050295055, -0.35840037, -0.019727677, -0.0066186097, -0.0021540523, 0.017334) * inp_3_0_1; + result2 += M4(0.14233728, 0.24207225, -0.05877726, 0.11620321, 0.10720529, 0.0008283299, -1.5752418, 0.08940047, 0.36390868, -0.36308664, -0.010029068, -0.27397126, 0.06675105, 0.07950608, -0.11110028, 0.10758905) * inp_3_1_1; + result2 += M4(-0.0076967604, -0.0063465773, 0.07495261, 0.060014434, -0.21927468, -0.16195607, 0.004462335, 0.1700076, 0.18680118, -0.08768889, 0.08070937, -0.13451485, 0.027677529, -0.37147608, 0.0492793, 0.20355256) * inp_3_2_1; + result2 += M4(0.28913042, -0.1857833, -0.19982226, 0.0047614267, -0.040002443, 0.013629103, 0.14590615, -0.1875878, 0.13732162, -0.0996179, 0.08447261, 0.059818078, 0.12112791, 0.04442736, -0.036067992, 0.009009383) * inp_3_0_2; + result2 += M4(0.074754044, -0.24406068, 0.5842961, 0.01011099, 0.06859522, 0.106121376, 0.20751011, -0.078184746, 0.06569143, -0.05616781, 0.43368873, -0.18342853, 0.0648663, 0.08838746, -2.5457027, -0.032766283) * inp_3_1_2; + result2 += M4(-0.016084341, 0.049012687, -0.0840192, -0.009945125, -0.13082097, -0.026519094, 0.22928171, 0.109046146, 0.1913399, -0.06577869, 0.05957043, -0.111836284, 0.21928439, -0.044628173, 0.007977876, -0.08064955) * inp_3_2_2; + result3 += M4(0.07694559, -0.0138822915, 0.06503231, -0.03360788, -0.07092503, -0.00048928615, -0.026823722, -0.02658003, 0.02215056, 0.031604793, 0.04115292, 0.040732138, -0.008415167, 0.054748695, 0.03447441, 0.018476207) * inp_3_0_0; + result3 += M4(-0.036803186, -0.05286142, 0.007957323, -0.017383374, 0.17671868, 0.27140468, 0.13692562, -0.012053789, 0.10316045, -0.013202491, -0.016275119, 0.01879904, -0.062531106, 0.029337812, -0.078415155, -0.0249412) * inp_3_1_0; + result3 += M4(0.018963913, 
-0.010214533, 0.018063482, 0.031577088, 0.05999718, -0.113296494, -0.09365664, 0.26440683, 0.08826179, 0.016142845, 0.0216411, -0.101425715, 0.009847335, -0.008299357, 0.074420415, 0.011775249) * inp_3_2_0; + result3 += M4(-0.39081585, -0.0838673, 0.27916974, -0.07050347, -0.020497013, -0.1974258, -0.11615982, -0.04604486, 0.0473447, -0.029950554, 0.007203267, 0.039071508, 0.05709263, 0.024631454, 0.057777587, 0.040751096) * inp_3_0_1; + result3 += M4(0.03844488, 0.018994762, 0.016261842, 0.51800346, -0.06746922, 0.32197532, 0.020198246, -0.1261948, -0.047454923, 0.19068927, -0.058833476, 0.17420405, -0.035010174, -0.24515375, -0.049961384, 0.42633954) * inp_3_1_1; + result3 += M4(-0.10035564, 0.013695476, 0.05426191, -0.014002882, -0.0910872, -0.24419665, -0.034756966, -0.2550853, 0.13050632, 0.048386525, 0.08481854, -0.015868377, -0.7629353, 0.07594038, 0.058023147, -0.25982517) * inp_3_2_1; + result3 += M4(0.053038094, 0.3456283, -0.028815135, -0.021221591, -0.030001303, 0.26908705, -0.03715217, -0.093417, -0.0061158077, 0.46648175, 0.06069643, 0.042290237, -0.022208512, -0.022681322, 0.011513289, 0.07366402) * inp_3_0_2; + result3 += M4(-0.023000399, 1.1273052, -0.004522217, 0.22401826, 0.00028205267, -0.82191133, -0.08815093, -0.10096036, 0.052339103, -0.494361, 0.014254294, 0.05702493, -0.053227764, -1.9380327, 0.044443835, 0.10758067) * inp_3_1_2; + result3 += M4(0.052999526, 0.40421763, -0.012616779, 0.002641059, 0.12748745, 0.37926105, 0.022284118, -0.1623692, -0.021195088, -0.23581114, 0.013012999, 0.055029694, -0.064298704, -2.3030765, 0.092065066, 0.03497193) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC 
ArtCNN C4F16 (Conv2D-3-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_2 +//!SAVE conv2d_3 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.014308364, -0.031445663, -0.01849288, -0.004246903); + V4 result1 = V4(-0.021231862, 0.018275987, 0.004760984, 0.033462685); + V4 result2 = V4(0.0017615217, 0.012336949, -0.022513494, 0.009208594); + V4 result3 = V4(-0.0013368673, 0.0046511, 0.021403618, 0.012234549); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = 
inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.025315678, -0.40740538, 0.37080577, 0.17917906, 0.1517135, 0.09999762, 0.03209811, -0.025414864, -0.0072085187, -0.044233754, -0.14142239, 0.021514736, 0.074731536, 0.06694275, 0.08969647, 0.01626352) * inp_0_0_0; + result0 += M4(-0.4784662, -0.44962025, 0.16025928, -0.112756014, 0.098072365, -0.16340493, -0.10911931, -0.057525925, -0.07066941, 0.04618561, -0.3869227, 0.07643021, 0.002182261, -0.29465193, 0.12064611, -0.15072991) * inp_0_1_0; + result0 += M4(-0.3007937, 0.0072757923, -0.07775808, 0.075630665, 0.07475434, -0.030880397, 0.017956393, 0.030480307, -0.07537768, -0.0060714884, -0.10579664, -0.041868184, -0.029362228, 0.0019552058, 0.0033949236, -0.042928576) * inp_0_2_0; + result0 += M4(-0.055378314, 0.11835048, -0.21005718, -0.067133605, 0.037751865, 0.111293666, -0.2152327, 0.35863844, 0.09041399, -0.13204306, -0.023983477, 0.035911985, -0.1136856, -0.101052254, -0.026796436, 0.17415252) * inp_0_0_1; + result0 += M4(-0.19136935, 0.25973448, -0.35633188, -0.13955162, -0.022144493, -0.12332462, 0.12980436, -0.06716298, -0.226214, -0.017355867, 0.31573844, -0.07952507, 0.06953637, 0.3504291, 0.3310475, -0.4188637) * inp_0_1_1; + result0 += M4(0.07861268, -0.011944142, -0.06872131, 0.06526956, -0.23126051, -0.0787915, 0.3074996, -0.1560054, -0.0515472, -0.15933825, 0.008892285, -0.032828208, -0.04228462, 0.19568804, -0.056245092, 0.2529376) * inp_0_2_1; + result0 += M4(0.0092896065, -0.0029096454, -0.23034982, 0.011114423, -0.1106547, -0.15602478, 0.2677796, 0.19269039, -0.031739205, -0.03228303, 0.011086476, -0.05332459, -0.22346567, 0.08080637, -0.020646531, 0.08239571) * inp_0_0_2; + result0 += M4(-0.15126343, 0.022163287, -0.15783563, -0.025882605, 0.15493815, 0.1494604, -0.034188353, 0.047689065, 0.14822488, 
-0.010189335, 0.18554454, 0.030036429, 0.024229797, 0.06672721, -0.27624926, -0.0014910502) * inp_0_1_2; + result0 += M4(-0.11723486, -0.024278458, -0.0918668, -0.05912352, 0.0804538, 0.22284164, 0.082265265, -0.086509205, 0.077792905, 0.06799491, 0.10968278, 0.07208801, -0.10925173, -0.19539174, -0.20790318, -0.08770796) * inp_0_2_2; + result1 += M4(0.3236074, -0.016813854, -0.05796897, -0.07314582, -0.06281415, 0.012611842, 0.016730722, 0.11916892, 0.054947067, -0.024866354, -0.007610447, -0.11161885, 0.04581396, 0.009688132, 0.021315157, -0.08097858) * inp_0_0_0; + result1 += M4(0.1599916, -0.031528797, 0.0126992585, 0.016889824, 0.11132726, -0.06296075, 0.00051726383, -0.3424913, -0.004174934, -6.6618624e-05, -0.012995042, 0.005965193, -0.06023162, 0.003182649, 0.021039585, -0.11947315) * inp_0_1_0; + result1 += M4(0.027892213, -0.00062689267, -0.01636723, -2.2716187e-05, 0.25023237, -0.007830497, 0.021714738, -0.56807584, -0.053948745, -0.024804676, 0.045291945, -0.13231511, 0.07675576, 0.06605667, -0.032000583, 0.10833098) * inp_0_2_0; + result1 += M4(-0.36363825, 0.021935955, -0.18368474, 0.028652018, 0.14966221, 0.027848009, 0.072001524, 0.3989147, -0.060279924, 0.025458539, -0.0016928725, 0.060513448, -0.030946735, 0.116279155, -0.027582984, 0.07756251) * inp_0_0_1; + result1 += M4(-0.23284562, 0.14024308, 0.062349986, -0.12310892, -0.19432355, -0.08142183, -0.061544392, -0.45819297, -0.037947427, 0.39792922, 0.07392991, -0.088718906, 0.15805514, 0.30931425, -0.1016847, -0.078503326) * inp_0_1_1; + result1 += M4(0.02309257, -0.024762606, 0.008150015, 0.023823071, -0.15807371, 0.03965886, -0.016814513, -0.07145885, -0.20561801, 0.02365692, 0.0007521815, 0.1441513, 0.14683372, -0.046197027, -0.008067438, -0.36100286) * inp_0_2_1; + result1 += M4(-0.1421229, -0.099885836, -0.09427238, 0.1337728, -0.0066758767, -0.009484399, 0.06744897, 0.30264565, -0.03263222, 0.03592801, 0.10090736, 0.028849022, -0.041092165, -0.05571495, -0.117078304, -0.2493043) * 
inp_0_0_2; + result1 += M4(0.030493004, 0.013943649, 0.008176111, -0.048232153, -0.029120184, 0.0832065, 0.012535422, -0.06679524, 0.072213255, 0.047026567, 0.0739274, 0.021540673, -0.10233502, 0.04503862, -0.16855547, 0.19900726) * inp_0_1_2; + result1 += M4(-0.10335507, 0.03536097, 0.0033068694, 0.0032172517, 0.049036283, 0.07101889, -0.10331261, 0.14447233, 0.05273494, -0.014971053, -0.08585235, 0.11687278, -0.077435136, 0.03600481, 0.15392411, -0.22504471) * inp_0_2_2; + result2 += M4(-0.19788808, 0.088607766, 0.03288371, 0.018204056, -0.024293097, -0.008095376, 0.03442426, -0.036480363, -0.008784721, 0.08859438, -0.10649091, 0.030977005, 0.016547365, -0.0022618754, 0.0324507, -0.017606767) * inp_0_0_0; + result2 += M4(-0.04685454, -0.21285146, -0.010454878, -0.057078585, 0.065119885, 0.10927382, -0.05321152, 0.060907405, 0.08013327, -0.0073412405, -0.20529112, -0.08758012, 0.09224284, -0.067262664, 0.1502062, 0.05410036) * inp_0_1_0; + result2 += M4(-0.041660745, 0.0048408103, 0.003651176, 0.071307175, 0.01425864, 0.09917961, -0.05065944, 0.04616355, -0.106611334, 0.08681873, -0.07359776, -0.09394259, 0.11695499, -0.1402854, 0.061297946, -0.045418613) * inp_0_2_0; + result2 += M4(-0.23553102, 0.5484784, -0.09534771, -0.02045959, 0.13755015, -0.11109039, -0.06437182, -0.2358323, 0.010125626, -0.11606748, -0.08721418, 0.07951246, 0.14079992, -0.080286875, 0.03190584, -0.11406279) * inp_0_0_1; + result2 += M4(-0.10584075, -0.2533913, 0.19931902, -0.06487168, -0.1717319, 0.030989863, 0.03765032, -0.23701997, 0.392678, -0.20434664, -0.011459706, -0.012392768, -0.19392636, -0.19896725, 0.5523695, 0.10076211) * inp_0_1_1; + result2 += M4(-0.07930697, 0.012467926, -0.018473605, 0.049829062, 0.041304592, -0.20307006, 0.061710116, -0.1607002, 0.05850921, -0.054579165, 0.05506371, 0.018534066, -0.05382266, 0.19656838, -0.14599052, 0.10722883) * inp_0_2_1; + result2 += M4(-0.14471711, -0.089903586, -0.024194038, -0.008216228, 0.21955849, -0.3950722, 0.05865401, 
-0.15680425, 0.0034217027, 0.09524851, -0.014997871, -0.01323649, 0.0042688143, 0.033086605, -0.03602252, 0.14105399) * inp_0_0_2; + result2 += M4(0.020014875, -0.11133592, -0.023629094, -0.0709405, 0.07574613, 0.4842027, -0.016238315, -0.06935021, 0.048983708, -0.02455697, 0.023512363, 0.032327037, -0.12747441, -0.137746, -0.0041232975, -0.29301938) * inp_0_1_2; + result2 += M4(-0.04711032, -0.019662969, 0.020692779, 0.01689221, 0.030064257, -0.032970324, 0.093564175, -0.06074772, -0.0065473514, 0.10435069, -0.051301178, 0.07506068, -0.092831016, -0.0098741185, 0.092322186, -0.09218845) * inp_0_2_2; + result3 += M4(-0.109521486, -0.25843716, 0.051019795, 0.008796125, 0.006710635, -0.0049244356, -0.028464736, -0.020576421, 0.018126301, -0.03288581, -0.059816107, 0.012544033, 0.019033715, 0.036934555, 0.03997806, 0.011696228) * inp_0_0_0; + result3 += M4(0.15896165, -0.40192378, 0.020870406, -0.040908355, -0.06158074, 0.04799475, 0.02708582, 0.025623411, 0.031087726, 0.15594003, 0.061994012, -0.055818196, 0.009436111, 0.04553281, -0.009773234, 0.05364127) * inp_0_1_0; + result3 += M4(0.05062757, -0.34977517, -0.017327579, 0.029586911, -0.015337377, 0.1657842, -0.023074357, -0.48225418, -0.101821445, -0.07600293, -0.005563617, -0.5261255, 0.00761482, -0.058566544, 0.05186853, 0.04371315) * inp_0_2_0; + result3 += M4(-0.06422451, -0.6366767, -0.036370903, -0.0831035, 0.0374723, 0.38192326, 0.010392014, -0.08228988, 0.0633136, -0.048369046, 0.06295746, 0.0043660635, 0.037951868, -0.08372121, 0.055318434, -0.05734989) * inp_0_0_1; + result3 += M4(0.18938878, -0.58693033, 0.11619453, -0.045211863, -0.081650935, 0.30361742, -0.12818241, -0.10964245, -0.21211484, -0.2671186, 0.14642583, 0.10737925, 0.0061715045, -0.38273, -0.22397554, -0.04302644) * inp_0_1_1; + result3 += M4(-0.016349845, -0.21763504, -0.0010806874, -0.0011352341, -0.1379133, 0.19977011, -0.019010192, 0.15351702, -0.049592014, -0.015350318, 0.075927876, 0.17186968, 0.12509024, 0.02728859, -0.037378654, 
-0.32351947) * inp_0_2_1; + result3 += M4(-0.019764764, -0.31119177, -0.06767115, -0.014068403, 0.03635759, 0.14193599, 0.0015609096, -0.0077975956, 0.009449523, -0.01775413, 0.062425796, 0.026602777, -0.025830995, -0.10380951, -0.02119342, 0.0054662493) * inp_0_0_2; + result3 += M4(0.046277538, -0.45933232, 0.06593023, -0.03638144, -0.07667149, 0.29901657, -0.0016867243, 0.11688226, 0.031845666, -0.027253512, 0.07584758, 0.08993896, -0.060812075, -0.04589073, -0.21525094, -0.047655407) * inp_0_1_2; + result3 += M4(0.008118003, -0.31232572, -0.01947948, -0.028818972, 0.01954803, 0.14400195, 0.07366684, 0.08039247, -0.039747268, -0.07018961, -0.006076149, 0.010897608, 0.0013431206, -0.038716212, 0.033262603, -0.06467397) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.034586944, 0.051405124, 0.024543753, 0.09663699, 0.21466514, -0.14363779, 0.091029935, 0.06438413, -0.07787725, 0.02310036, -0.08526669, -0.06898668, -0.07615313, 0.1859357, 0.051052812, 0.03592223) * inp_1_0_0; + result0 += M4(0.14242817, -0.12330711, 0.26888746, 0.027858777, -0.19174838, -0.3025271, 0.21068037, -0.22111407, 0.039243873, 0.32096145, -0.19555481, 0.041925013, -0.081656374, 0.042261768, 0.4310771, -0.17600678) * inp_1_1_0; + result0 += M4(0.07237473, -0.019333057, 0.01465501, 0.0103286505, -0.0033088874, 0.0049798666, 0.005620796, 0.050308306, 0.095135905, 0.11874092, -0.089677125, 0.06639713, 0.008767325, 0.020067416, -0.054253392, -0.02636066) 
* inp_1_2_0; + result0 += M4(0.12108157, -0.08878159, 0.20186365, -0.013874086, -0.41484395, -0.14844953, 0.0738829, -0.045337558, 0.042086396, 0.059161253, -0.012553872, -0.23520784, -0.12646332, 0.26784688, -0.20803319, -0.03942921) * inp_1_0_1; + result0 += M4(-0.23782037, -0.4498384, -0.2894948, -0.11137584, -0.41319975, -0.17482656, -0.117727414, 0.04227422, 0.44053125, -0.040965743, -0.07687903, 0.1572281, -0.14606549, 0.5611193, -0.017074287, -0.26588884) * inp_1_1_1; + result0 += M4(0.13518186, -0.1952343, -0.033405837, 0.15649372, 0.014096296, -0.1471687, 0.022654844, -0.16781017, 0.1897826, 0.05537809, 0.011526008, 0.16989169, 0.25440302, 0.02105957, 0.07173544, 0.13849147) * inp_1_2_1; + result0 += M4(0.12111377, 0.06486296, -0.054877255, 0.013369709, -0.26179752, 0.008404512, -0.291739, 0.09870817, 0.30430415, -0.02468248, 0.09765464, -0.073647045, 0.003215954, -0.17846975, 0.11312282, 0.061767615) * inp_1_0_2; + result0 += M4(-0.0767532, 0.46677387, -0.17212266, -0.03160566, -0.3810842, 0.056070074, -0.25618377, -0.100580625, -0.12561269, -0.016203389, 0.3710484, 0.00074308756, 0.10880074, -0.21513747, -0.21955177, -0.10800783) * inp_1_1_2; + result0 += M4(0.07202282, 0.08571014, 0.04075649, 0.024679877, 0.11339893, 0.10422508, -0.014214932, -0.19761975, 0.05781747, -0.18774833, 0.14175606, 0.12277776, -0.14729902, 0.0993602, 0.03688781, -0.06296111) * inp_1_2_2; + result1 += M4(0.061538264, 0.060805965, 0.017201789, 0.22006647, -0.01602865, 0.035268907, -0.00068671186, -0.18142733, -0.0058686594, 0.04291206, 0.0014080717, 0.13177212, -0.0016620886, 0.09081882, -0.031675898, -0.29883888) * inp_1_0_0; + result1 += M4(-0.15646641, 0.0058149397, -0.034551397, -0.087699234, -0.0009914644, -1.4757978e-05, 0.00055921706, 0.23698746, -0.15453093, 0.06698371, -0.014193776, 0.055897992, -0.19766432, 0.046747115, 0.03361082, -0.63573986) * inp_1_1_0; + result1 += M4(0.07094494, 0.00023815216, 0.006596921, -0.05585263, 0.07675021, -0.06228464, 0.014950143, 
-0.0021290332, -0.12428363, 0.016943645, -0.0096276365, -0.022048702, -0.06971582, -0.029114002, 0.049153633, -0.39115208) * inp_1_2_0; + result1 += M4(0.049078394, 0.06519899, 0.041337896, 0.18306711, 0.06364234, -0.036350865, -0.082766965, -0.04908475, -0.03600516, 0.13349976, 0.075641125, 0.09301542, 0.098319165, -0.111341886, -0.11690513, -0.30515233) * inp_1_0_1; + result1 += M4(-0.047191925, 0.122746356, -0.0033969765, 0.08131301, 0.1518897, 0.02669907, 0.033575322, -0.511831, -0.18935362, 0.09478832, 0.018412145, 0.27864313, 0.4335526, 0.38276324, 0.056418765, 0.092538744) * inp_1_1_1; + result1 += M4(0.06391543, -0.032844223, -0.0015351484, 0.08773329, 0.0818433, -0.00886031, 0.006732896, -0.004721323, -0.0030527106, 0.0014216377, -0.04981653, 0.17145506, 0.003415348, 0.04492702, 0.032660168, -2.0050154) * inp_1_2_1; + result1 += M4(-0.08958046, 0.10260106, 0.11284484, 0.19449843, -0.15825003, -0.022389483, -0.1325153, -0.16857241, 0.16755177, 0.031064708, 0.1567697, 0.16521265, -0.065289006, -0.022755811, 0.03485217, 0.09884881) * inp_1_0_2; + result1 += M4(-0.109482475, 0.013460136, -0.04917644, -0.15271996, -0.2583299, 0.060626, -0.041091472, -0.15900281, 0.47309366, -0.03839146, -0.0045616627, 0.0008328471, 0.0082431855, -0.21283317, -0.18913719, 0.2243721) * inp_1_1_2; + result1 += M4(-0.030455546, -0.020884665, 0.06928861, -0.02054186, -0.051363032, -0.028426047, 0.032410964, 0.27805674, 0.09577153, 0.0018001996, -0.009598458, 0.24205303, 0.06581605, 0.032396894, 0.15634531, -0.062486712) * inp_1_2_2; + result2 += M4(0.04517026, -0.015449355, 0.030736623, -0.064001635, 0.10251629, -0.010003219, 0.00246948, -0.041401625, -0.07452645, 0.055657007, 0.017119868, 0.00057093386, 0.076428145, -0.13702212, 0.041210357, -0.097048655) * inp_1_0_0; + result2 += M4(-0.11847643, 0.07740604, 0.04646375, -0.006719404, 0.078692794, 0.018933047, -0.03411219, 0.005511014, -0.12282886, 0.0056976853, -0.0050732824, -0.020660818, -0.031830277, 0.030043423, 0.056548044, 
-0.090381294) * inp_1_1_0; + result2 += M4(-0.033105094, -0.0078620855, -0.022709917, 0.019003244, 0.024807753, 0.052204266, -0.071791224, 0.011485747, -0.07369586, 0.0137782805, 0.003582809, 0.035403106, -0.01405195, 0.07256009, 0.011241367, -0.06909385) * inp_1_2_0; + result2 += M4(0.026971996, 0.006361849, 0.14840193, 0.11840187, -0.23391397, 0.19595902, 0.021233503, -0.11863109, -0.02861322, -0.0805317, 0.19878447, 0.04877218, -0.03260752, 0.47443804, -0.0007973998, -0.083458565) * inp_1_0_1; + result2 += M4(0.10141363, 0.056519937, 0.09495047, -0.083211236, -0.33066672, 0.31982478, 0.06656332, -0.5255531, 0.39907596, -0.04551523, 0.076361425, 0.515442, 0.2894429, -0.026761035, 0.15433668, -0.22964536) * inp_1_1_1; + result2 += M4(-0.052999362, 0.052562866, -0.035938874, 0.032367133, -0.081125945, -0.008548732, -0.02534536, 0.09177157, -0.015444048, 0.12723202, -0.07120179, -0.0022531084, -0.018742096, 0.042202547, 0.030112537, 0.16257262) * inp_1_2_1; + result2 += M4(0.007041716, 0.018217154, 0.08307236, -0.04520616, -0.31561956, 0.23123385, -0.067681044, -0.12643862, 0.010874087, -0.10742594, 0.030002201, -0.14344977, 0.10406159, -0.20533821, -0.030862322, -0.10753616) * inp_1_0_2; + result2 += M4(0.11211696, -0.11703306, -0.029693123, 0.07388003, -0.2088053, 0.15857096, 0.047811363, -0.19972345, 0.03004797, -7.211207e-05, 0.011323185, 0.053247977, -0.11488151, -0.21737544, -0.09646544, -0.32760012) * inp_1_1_2; + result2 += M4(0.023682857, 0.028017636, 3.7979324e-05, 0.044192187, 0.06769071, 0.062285192, -0.00054911565, 0.044016127, -0.054126956, 0.073501885, 0.0038514957, 0.14338864, 0.07184208, 0.021787634, 0.008975992, -0.038967796) * inp_1_2_2; + result3 += M4(0.0076448624, 0.073063046, -0.018112276, 0.044603255, -0.028443448, 0.042257074, 0.033456415, 0.10408893, 0.013544821, -0.10530665, -0.013452262, 0.024509164, -0.032966062, 0.2765319, 0.06838193, -0.008048515) * inp_1_0_0; + result3 += M4(0.01256106, 0.0046958136, 0.03241983, 0.055210363, 
0.07731245, -0.07009144, -0.048668608, 0.05429069, 0.07470501, 0.039248727, 0.03182757, -0.06734372, 0.1485473, -0.09281201, -0.054269433, 0.03705732) * inp_1_1_0; + result3 += M4(0.016695606, 0.058716543, -0.022234729, 0.010488249, 0.019232022, -0.044709843, -0.032776598, 0.12039033, -0.017063448, -0.09488618, -0.00074972864, -0.18022363, 0.035581883, -0.12771232, 0.037610672, -0.02314014) * inp_1_2_0; + result3 += M4(0.033441305, -0.17919269, 0.071414076, -0.040231004, -0.051545292, 0.3152309, 0.032920167, -0.050826155, 0.030751579, -0.043526605, 0.101936825, 0.10663154, -0.010965119, 0.23196171, -0.03446115, 0.012430032) * inp_1_0_1; + result3 += M4(-0.039667293, 0.28457764, 0.13565247, 0.021205531, 0.05632608, -0.18567143, 0.16571477, -0.23085211, 0.076178744, -0.04070206, 0.11625753, 0.11961359, 0.09332873, 0.061907627, 0.30030668, 0.10909142) * inp_1_1_1; + result3 += M4(0.108230695, 0.15231377, -0.0005546767, -0.19747706, 0.06423663, -0.031372365, -0.037357267, 0.15446967, 0.01659812, 0.0051198537, -0.027291223, -0.022681922, 0.057102717, 0.13700908, -0.032580305, -0.11682838) * inp_1_2_1; + result3 += M4(-0.0029815636, 0.13884383, 0.04761928, 0.059312716, -0.008409305, -0.9101977, -0.03828398, -0.07224407, -0.0005499478, 0.22700396, -0.007955575, 0.014039278, 0.00048419705, 0.14805353, 0.01756024, 0.08449175) * inp_1_0_2; + result3 += M4(-0.0013124654, 0.08395497, -0.044070862, 0.08525564, -0.0057046493, 0.1908161, -0.045428224, 0.05620147, 0.03192862, 0.23222342, 0.07045153, 0.059786994, -0.017609006, 0.22580697, -0.095051855, -0.06213206) * inp_1_1_2; + result3 += M4(-0.032118272, -0.05992314, 0.0014346216, -0.0144403465, -0.0040735975, -0.07336036, -0.019177906, -0.033247244, 0.036743563, 0.05132299, 0.023929443, 0.0894065, -0.02746859, -0.0016096028, 0.023279605, -0.03991766) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y 
+ 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.0715746, -0.09631244, 0.050157297, -0.08048454, -0.0025352512, 0.16482176, -0.106414065, 0.083849244, 0.12749393, 0.20426564, 0.29415998, -0.037008047, -0.26012027, -0.14854887, 0.20277677, 0.31178087) * inp_2_0_0; + result0 += M4(-0.05076258, -0.13740575, 0.15595411, -0.053362656, -0.066203654, -0.16828513, 0.081790805, -0.017918047, -0.41374892, -0.52676713, -1.0831323, 0.22619742, 0.12750734, -0.14390856, -0.22360946, -0.5096736) * inp_2_1_0; + result0 += M4(-0.10955963, -0.24669066, 0.15493616, -0.11090137, -0.027859153, 0.03351683, 0.09520772, -0.107278876, -0.45327467, 0.0021158315, -0.11707372, -0.28413826, -0.15181288, -0.030790092, 0.18309823, -0.26073602) * inp_2_2_0; + result0 += M4(-0.0028697196, 0.06061011, -0.056756634, -0.036915377, -0.28824973, 0.012138959, -0.12313946, 0.10299592, 0.23378398, 0.049730666, -0.07091768, -0.01715781, -0.018962007, 0.16162728, 0.027316753, -0.008936573) * inp_2_0_1; + result0 += M4(0.025687302, 0.059557397, -0.20743646, 0.18490358, -0.3239818, 0.17850724, -0.08651508, 0.14011745, -0.66113037, 0.11846311, -0.061496705, 0.13422967, -0.005783129, -0.15430583, -0.26381627, 0.054521244) * inp_2_1_1; + result0 += M4(-0.015021453, -0.19950967, -0.27221996, -0.28598326, 0.110668495, 0.10796349, 0.05700929, -0.09480617, 0.055270392, 0.12745835, 0.116460495, -0.17917821, 0.12730812, -0.0012037748, 0.32492042, 0.08095944) * inp_2_2_1; + result0 += M4(0.06407335, 0.030303145, -0.08825665, -0.0035974658, 0.08393234, -0.009050897, 0.21445066, 0.043095548, 0.1661051, -0.0459125, 0.10902106, 0.039837647, -0.061346497, 
-0.009559113, -0.02383936, 0.0028487262) * inp_2_0_2; + result0 += M4(-0.1500397, 0.025134781, -0.10852966, -0.11559518, -0.18731914, 0.06851372, -0.066781044, -0.10385313, 0.17443936, -0.021997442, -0.13519152, -0.014186667, -0.18113253, 0.07363012, 0.12357896, 0.11021419) * inp_2_1_2; + result0 += M4(-0.005192235, 0.044567242, -0.011068163, -0.018504843, -0.04650239, -0.009309463, -0.07613297, -0.099593356, -0.029223667, -0.09067077, -0.029125804, -0.08720748, -0.004944248, 0.20919052, -0.051089592, -0.086393625) * inp_2_2_2; + result1 += M4(-0.079497606, 0.033001993, -0.0433299, -0.49341437, 0.06402561, 0.027012901, -0.017186008, -0.026205903, 0.20847131, -0.17379077, -0.1460187, -0.3422193, -0.028837888, 0.14444311, 0.017298697, 0.16118568) * inp_2_0_0; + result1 += M4(0.1362322, 0.0049404167, -0.0545727, 0.036812954, 0.029849706, -0.041181613, -0.011156492, -0.10626014, 0.4812216, -0.1561386, 0.13164558, -0.38440028, 0.09642372, -0.07784491, 0.004167074, -0.54048723) * inp_2_1_0; + result1 += M4(0.22648239, -0.0008470028, 0.017957706, -0.018039277, -0.015313996, 0.014065825, 0.015366776, 0.10012267, 0.014650181, 0.018891001, -0.008666813, 0.10578885, -0.24156433, -0.06182133, -0.0048173345, 0.50967747) * inp_2_2_0; + result1 += M4(0.04990316, 0.077742726, -0.07985242, -0.23526481, 0.010774825, -0.018184526, -0.032785896, -0.1857747, -0.23976691, -0.052705243, -0.35834587, 0.13117231, 0.01347248, -0.043906253, 0.032065123, -0.27442545) * inp_2_0_1; + result1 += M4(-0.199354, -0.053708132, -0.076112315, -0.13419336, -0.08698115, -0.1992096, -0.0026194518, -0.49119824, -0.50951654, 0.10993369, 0.17314698, -0.43758488, -0.2935566, -0.011501036, -0.10976056, 0.4501387) * inp_2_1_1; + result1 += M4(-0.21165654, 0.025460485, 0.055044506, -0.18715349, 0.26253015, 0.015346683, -0.0065055043, -0.1598433, -0.065605536, -0.025775231, -0.016590733, 0.31189066, 0.08281263, -0.0045969966, -0.13699894, -0.097940974) * inp_2_2_1; + result1 += M4(-0.088196106, 0.03208788, 
-0.06850063, -0.18676445, 0.13442639, 0.06030712, -0.062297534, -0.12515818, 0.051921774, -0.071406096, -0.14802997, 0.037173603, -0.06478699, -0.04161509, -0.07285825, -0.009940458) * inp_2_0_2; + result1 += M4(-0.13968326, -0.06019821, -0.0882567, -0.2698704, -0.09788051, -0.1485394, -0.085379414, 0.0072728456, 0.03298984, -0.074674346, -0.030420514, 0.17290293, 0.04263921, -0.11421748, -0.019576881, 0.2684657) * inp_2_1_2; + result1 += M4(-0.1025962, -0.011311065, 0.01694238, -0.13532774, 0.0062958077, -0.058460772, 0.09474729, -0.17248796, 0.06978807, -0.030376935, 0.0025259845, 0.27620357, -0.04003609, 0.0008251506, 0.09974402, -0.19953759) * inp_2_2_2; + result2 += M4(-0.0274369, -0.02785617, 0.111271836, -0.04777609, 0.022969048, -0.0103979325, -0.029450497, 0.071567275, -0.17947961, 0.3219096, -0.19316356, 0.06724893, 0.16150929, -0.17940994, 0.13669962, 0.0322664) * inp_2_0_0; + result2 += M4(-0.063206606, -0.004748452, -0.047064275, -0.10338681, -0.03555205, 0.06408232, -0.11194569, 0.024295783, -0.5038483, 0.5358632, -0.025267152, -0.43657935, -0.11281369, 0.21069881, -0.0877243, 0.23032966) * inp_2_1_0; + result2 += M4(0.09157177, -0.101289205, -0.0045268014, 0.007126031, 0.076024644, -0.011473527, -0.0014426362, -0.0772565, -0.066013575, 0.0573791, -0.057972565, -0.050329443, 0.13471925, -0.18278362, -0.124123216, -0.24296595) * inp_2_2_0; + result2 += M4(0.0018280116, 0.017851619, 0.06933558, 0.2027289, 0.14181142, -0.0031327193, 0.10318157, 0.06581663, 0.1528262, 0.07430443, -0.02498459, -0.03398527, -0.121124454, 0.0130372215, -0.04157365, 0.13387349) * inp_2_0_1; + result2 += M4(-0.2677744, -0.029308412, -0.07962408, -0.12204546, -0.29457334, 0.030129738, -0.26925707, -0.22190627, 0.110479586, 0.3287684, -0.14959732, 0.17304076, -0.04718754, -0.08847532, -0.1267441, -0.26355487) * inp_2_1_1; + result2 += M4(-0.09800573, -0.14139035, 0.04140986, -0.18992579, 0.028541153, -0.0329216, 0.0016428916, 0.041346528, 0.009479444, 0.1538949, -0.016167583, 
0.14781687, -0.20410268, -0.08003033, 0.058599915, 0.011661855) * inp_2_2_1; + result2 += M4(-0.08390431, -0.015559658, 0.018878765, -0.12197927, 0.054793455, -0.03990255, -0.011211109, 0.036316004, -0.00909181, 0.01052049, -0.07726077, 0.0054688193, -0.058225293, 0.025337262, -0.054769665, 0.0038822803) * inp_2_0_2; + result2 += M4(-0.042446077, -0.077310875, -0.015256182, 0.06345937, 0.073480725, 0.09065197, -0.0731339, 0.0723991, -0.0973175, -0.004725554, 0.00842376, -0.0057924674, 0.16431709, -0.041569393, -0.0024132037, 0.09127265) * inp_2_1_2; + result2 += M4(0.103879355, -0.114007644, -0.036526263, -0.09562801, 0.026349826, -0.077657074, -0.0014605734, 0.020703465, 0.00056508253, -0.034128983, 0.00072431617, 0.0124235535, 0.119479515, 0.027588964, -0.040412117, -0.0019401097) * inp_2_2_2; + result3 += M4(-0.0054999315, 0.054679673, -0.0046336288, 0.017204197, 0.01873656, 0.053969342, 0.0022390555, -0.079477236, -0.056740683, 0.061366238, -0.14898393, -0.009038732, 0.08329993, -0.08009324, 0.089084126, -0.052381206) * inp_2_0_0; + result3 += M4(-0.07229899, -0.23929752, 0.045575928, -0.08491341, -0.037206728, -0.066858895, -0.009566649, -0.16403022, 0.070830956, 0.24849686, 0.022231523, -0.60494363, -0.12693338, 0.09039926, -0.061455548, 0.029116308) * inp_2_1_0; + result3 += M4(0.14467773, 0.011604675, -0.011593841, 0.3062551, 0.014567709, 0.07741014, -0.012507825, 0.10407626, 0.06588569, 0.2327419, -0.021636222, 0.32575372, 0.0069890674, -0.019714063, -0.039952785, -0.15029353) * inp_2_2_0; + result3 += M4(-0.016747722, -0.057078633, 0.032135896, 0.03921812, 0.01964165, -0.041367184, 0.034990914, 0.03307513, -0.008712541, 0.36230156, -0.009524529, -0.013199496, -0.06960267, 0.11308598, -0.025458774, -0.016773175) * inp_2_0_1; + result3 += M4(0.10539831, 0.06910462, 0.10081203, -0.25462282, -0.051628787, 0.26734698, -0.09425403, -0.10206043, 0.0900536, 0.18957601, 0.024502385, 0.017249644, 0.013259816, 0.3805416, 0.09170492, -0.11961444) * inp_2_1_1; + 
result3 += M4(0.03674796, -0.20332646, -0.0019113279, -0.049671765, 0.12674725, 0.016929649, -0.019033445, -0.12554397, 0.057757977, 0.0079718605, -0.03455191, 0.012654533, 0.10924967, 0.13866869, -0.06353784, -0.15997352) * inp_2_2_1; + result3 += M4(-0.032977168, -0.008423808, 0.0131768845, -0.017573318, 0.0020663647, 0.05378569, -0.009707578, 0.01458635, -0.039570022, 0.26450455, -0.09522793, -0.0082146, 0.03125363, -0.0039754794, 0.0103347115, -0.018126415) * inp_2_0_2; + result3 += M4(0.053846017, -0.2637847, 0.034869306, -0.031385496, -0.049894933, 0.11334788, -0.050957955, -0.07865399, 0.0110876765, 0.19674455, 0.02882469, -0.008416688, 0.0094687035, -0.20319644, -0.11101057, -0.08230348) * inp_2_1_2; + result3 += M4(0.0044784476, 0.023611512, -0.042547744, 0.0007483636, 0.05025809, 0.14764841, 0.00044558995, 0.04103793, 0.048046812, 0.062373303, -0.014592626, 0.07766575, -0.0020092498, -0.0069300635, 0.03421132, -0.16338684) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.0020083024, -0.59463024, 0.13003162, 0.27622712, 0.51078737, -0.19404446, 0.12455177, 0.27357444, -0.00015589895, 0.08237507, 0.060955554, -0.013423829, -0.13043714, -0.26090437, -0.0061712246, 0.057619814) * inp_3_0_0; + result0 += M4(0.22813018, -0.16819888, 0.12644678, -0.06749888, 0.6929881, 0.06584952, 0.2152027, -0.0030935707, 0.03527825, 0.07355563, 0.20881042, -0.1287684, 0.006924962, -0.3719862, -0.036988992, 0.20827514) * inp_3_1_0; + 
result0 += M4(0.049787976, -0.1781383, 0.054748017, 0.003178183, 0.44286513, -0.21408647, 0.2594575, -0.7740605, 0.033387452, 0.021950949, -0.022106573, -0.0067378515, 0.13417983, -0.11796911, -0.031810988, 0.1171123) * inp_3_2_0; + result0 += M4(-0.18528815, 0.35193694, 0.11649766, -0.39793167, 0.08550548, -0.007938471, 0.20756447, -0.0918376, -0.1510857, -0.023432646, -0.12200965, 0.07017334, 0.26202187, 0.2199531, 0.21588492, -0.1368237) * inp_3_0_1; + result0 += M4(-0.44707954, 0.19176868, 0.17061797, 0.18040551, -0.13039091, -0.10258424, -0.16008896, 0.037404172, 0.117038585, -0.17250147, -0.1328998, 0.052930426, -0.44167283, -0.13420883, -0.23059113, 0.054577902) * inp_3_1_1; + result0 += M4(-0.12896018, 0.0633688, 0.034150008, -0.12148736, -0.004690631, 0.04905833, 0.27947712, 0.060562916, -0.03636501, 0.10707534, 0.055300053, -0.08954744, 0.051630456, 0.00094299554, 0.061553795, -0.0014282514) * inp_3_2_1; + result0 += M4(-0.14921282, -0.45711362, -0.957326, 0.26230615, 0.037424088, -0.033945464, 0.114703685, -0.0057828487, -0.08853224, 0.034291565, 0.032943837, -0.005019218, 0.005135216, -0.12015115, -0.18748857, -0.05337296) * inp_3_0_2; + result0 += M4(0.087564476, -0.1250068, -0.3363717, 0.18351421, 0.05174429, 0.049167316, -0.049760886, 0.007353514, -0.037329644, -0.016148722, -0.12699443, 0.014485368, 0.105171196, -0.31134298, -0.37899444, 0.07498702) * inp_3_1_2; + result0 += M4(-0.020149319, 0.124999724, -0.12147029, -0.00096658675, 0.0832416, -0.08173243, 0.05076248, 0.052645613, -0.0073318128, 0.077881485, 0.11520081, -0.0016521994, -0.0037119072, 0.09793644, 0.061810687, 0.029145136) * inp_3_2_2; + result1 += M4(-0.12472872, 0.07407384, -0.07791997, -0.7134498, 0.3457181, 0.018778412, -0.064711064, -2.43281, -0.054541327, 0.04039896, -0.008637337, 0.002681813, -0.0026259732, -0.11904751, 0.019719794, 0.19572537) * inp_3_0_0; + result1 += M4(0.18888874, 0.020963661, -0.018200552, -0.032447737, -0.15910539, 0.47710067, -0.49904862, -1.4134532, 
-0.084259026, 0.08839054, 0.028906915, 0.104726486, 0.29923728, -0.08374105, 0.01574318, -0.13314894) * inp_3_1_0; + result1 += M4(0.00032150888, -0.022052694, -0.015426221, 0.08341028, -0.21296762, 0.26484624, -0.1642875, -1.1250306, -0.085825145, 0.020342987, -0.004617357, 0.10114876, -0.013172022, -0.07820508, -0.004570691, 0.04852303) * inp_3_2_0; + result1 += M4(-0.51067257, -0.017741462, -0.30039522, -1.2571963, -0.02236554, 0.025866626, 0.35474715, -0.11294425, 0.015856761, -0.15779603, 0.004964842, -0.10562984, -0.092869416, -0.09270884, 0.023389773, -0.1594219) * inp_3_0_1; + result1 += M4(0.109542504, 0.13075843, -0.053791624, -0.2583805, -0.0003216644, 0.09596493, 0.57191336, 0.1930133, 0.36178964, -0.32451582, 0.076985724, -0.122095495, -0.3093755, -0.013410467, 0.11794235, -0.37326223) * inp_3_1_1; + result1 += M4(0.09745649, 0.110358074, 0.026718691, -0.20241807, -0.03151634, 0.046703037, 0.13132267, 0.13586995, 0.0039782166, 0.023424538, -0.06189003, 0.09849016, 0.021251155, -0.027039757, -0.001076575, 0.1751954) * inp_3_2_1; + result1 += M4(-0.9915245, -0.42759714, -0.6206918, 0.44665846, 0.07352433, -0.08387705, -0.03350734, 0.22847399, 0.026893489, -0.0028833593, -0.07794939, -0.1306795, -0.039633114, -0.055868, -0.061232213, 0.15494743) * inp_3_0_2; + result1 += M4(-0.36546615, -0.16674288, 0.036561977, 0.16032474, 0.025758734, 0.07587018, 0.14069304, -0.0019422671, -0.22332664, 0.109017774, 0.10702005, 0.007700021, -0.42372864, -0.049412824, 0.15198228, -0.11751534) * inp_3_1_2; + result1 += M4(-0.076892026, -0.10194194, 0.023829062, -0.0664451, 0.033672974, -0.024957536, -0.049628306, 0.05266212, 0.14750876, 0.012939363, -0.06411259, -0.03776985, -0.01884732, 0.03957383, -0.021288283, -0.044852577) * inp_3_2_2; + result2 += M4(0.00025199563, 0.096507885, 0.035680834, 0.06834127, 0.31596154, 0.5993435, -0.13442408, -1.0987302, 0.033409167, -0.028566176, 0.06360105, -0.016831838, 0.07198026, 0.0160935, -0.09025124, 0.039986104) * inp_3_0_0; + 
result2 += M4(0.27852255, -0.1456235, 0.026425557, -0.03960402, 0.99083656, -0.24289148, 0.255672, -0.7740539, 0.005261177, -0.058641613, 0.33040568, -0.09337607, 0.05810956, 0.07106933, -0.115775965, 0.17179202) * inp_3_1_0; + result2 += M4(0.05257131, -0.021596745, 0.0068275137, 0.046166256, 0.7031302, 0.034376085, -0.13304152, -0.29976267, 0.08550005, -0.0020981333, 0.09808359, 0.07445061, 0.061775465, 0.04428485, -0.06592481, 0.054875463) * inp_3_2_0; + result2 += M4(-0.64612305, 1.2113901, 0.009581094, -0.8400584, 0.046426214, -0.09642886, -0.06831416, -0.07444592, -0.019154096, 0.065491885, -0.028710717, -0.069172874, -0.14328499, 0.17614238, -0.14039895, 0.049561076) * inp_3_0_1; + result2 += M4(-0.27135545, 0.26022336, 0.008533434, -0.13182087, 0.06728565, 0.22086637, 0.06302549, 0.13521333, -0.3080801, -0.38079894, 0.20361297, -0.11221058, -0.20414463, 0.050636705, -0.022766195, -0.38828018) * inp_3_1_1; + result2 += M4(-0.15456447, -0.03646629, 0.10671977, 0.040676594, 0.10400211, 0.026499726, -0.100129865, 0.012024702, 0.13864364, 0.08457329, -0.02822368, -0.022809839, -0.032735273, 0.05287141, 0.031021947, 0.050165605) * inp_3_2_1; + result2 += M4(-0.5396394, 0.59668887, -0.14847545, -0.11262023, -0.01689237, -0.05919283, -0.009492103, -0.014342331, -0.019490363, -0.00014506304, 0.028579397, 0.00881577, -0.02950097, 0.020590046, -0.04593803, -0.06230642) * inp_3_0_2; + result2 += M4(-0.13129808, -0.032387625, -0.11815697, -0.035777994, -0.031615224, 0.03932641, 0.033151463, -0.0030484225, 0.078017905, 0.038734343, 0.0287011, 0.08592658, -0.10403654, 0.19592181, 0.020191323, 0.038593575) * inp_3_1_2; + result2 += M4(0.13677305, -0.027477767, -0.08110967, -0.13846825, 0.03510477, 0.06813107, -0.0028038565, 0.074799486, 0.048010178, -0.0062584206, -0.025137382, -0.03969312, 0.020384584, 0.020166244, -0.003604738, 0.0026067435) * inp_3_2_2; + result3 += M4(-0.07958163, 0.226626, 0.010839079, -0.15146959, -0.46411514, -0.9746635, -0.16067171, 0.26086998, 
-0.008847108, 0.1492069, 0.08893505, -0.009487972, -0.06220731, 0.06247489, -0.061906796, 0.024931276) * inp_3_0_0; + result3 += M4(0.1605299, -0.050733022, -0.009947459, 0.12511593, -0.070824474, -0.056747224, 0.05806642, 0.42568368, -0.07097865, -0.09931744, -0.037423436, 0.060617164, 0.0150114, -0.08423409, -0.05806379, 0.092213616) * inp_3_1_0; + result3 += M4(-0.0023733436, -0.071667895, -0.026429838, 0.17737049, -0.2254883, -0.45036575, -0.02305606, 0.37234473, -0.024518099, -0.07007941, 0.09261846, 0.24610615, -0.008102975, 0.094132714, -0.04586088, 0.11520861) * inp_3_2_0; + result3 += M4(0.04834176, -0.45825547, 0.15551898, -0.6823625, 0.077481635, -0.3181704, 0.1819974, 0.007107567, -0.07662808, -0.0008196648, -0.10875353, 0.0067090136, -0.04190695, 0.03827345, -0.14126761, -0.051619746) * inp_3_0_1; + result3 += M4(0.37930316, -0.04407946, -0.01238782, 0.23310061, 0.40887487, -0.719703, 0.48665968, 0.07135413, 0.24413355, 0.18634869, 0.3390411, -0.035839304, -0.07502038, -0.67640567, 0.0016627117, -0.02085262) * inp_3_1_1; + result3 += M4(0.035987593, 0.07719589, 0.096374325, -0.16219136, 0.32538247, -0.87211215, -0.07418743, 0.062578045, -0.16020074, -0.15909803, -0.05066982, -0.017460218, -0.04726886, 0.039209247, -0.014914555, -0.052938584) * inp_3_2_1; + result3 += M4(-0.012261669, -0.32118237, -0.022893699, -0.45062086, 0.046327095, 0.058009263, -0.065376736, 0.0055734706, -0.008084718, -0.17385426, -0.010035008, -0.006593194, -0.004550724, 0.09920785, -0.049575035, -0.013862305) * inp_3_0_2; + result3 += M4(0.17086881, 0.014676094, -0.014210215, -0.076593995, -0.017158492, 0.046289034, 0.07802933, 0.012850987, 0.036605753, -0.02279402, 0.10354422, -0.033762064, -0.029116895, 0.07669946, -0.054344196, -0.096501894) * inp_3_1_2; + result3 += M4(-0.023615815, 0.07025445, -0.08641296, 0.023666015, -0.018913722, 0.12914129, -0.025764482, 0.023226101, -0.030333309, 0.09175346, -0.037754275, 0.013420556, -0.051498346, -0.06312313, 0.008825869, 
-0.030032167) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 (Conv2D-4-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_3 +//!SAVE conv2d_4 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(-0.0040135784, 0.0032267163, 0.0077154385, -0.0131194005); + V4 result1 = V4(0.00494108, 0.012729458, -0.007542627, 0.009159574); + V4 result2 = V4(-0.0029531752, -0.08500148, -0.007686109, 
-0.0058430806); + V4 result3 = V4(-0.0036268765, 0.012139913, -0.005200553, -0.008799173); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.022446819, -0.09229735, -0.0010310403, -0.02886567, -0.00047958214, 0.018106725, 0.03281179, -0.03424525, -0.024050377, 0.093056306, 0.062247727, -0.09075345, 0.017732942, 0.20980102, 0.055907458, -0.032751247) * inp_0_0_0; + result0 += M4(-0.021193886, 0.031856388, -0.030064065, 0.08287286, 0.006676548, 0.1282676, 0.045911342, -0.060882766, 0.031217102, 0.027770746, -0.0755595, 0.1300494, -0.01657229, -0.04097931, -0.043443713, 0.02746677) * inp_0_1_0; + result0 += M4(0.020963114, -0.018738257, -0.0023086926, 0.03609221, -0.005606688, 0.0063512777, 0.0068921973, 0.002232806, -0.014810783, 0.011125607, 0.0073286225, 0.022102851, 0.0022564398, 0.016772412, 0.022617707, -0.012849541) * inp_0_2_0; + result0 += M4(-0.01166327, 0.00764596, -0.1432118, 0.11700769, 0.007080215, -0.20993969, -0.09295115, 0.048322495, 0.0017307845, -0.38891366, -0.037892267, 0.037722066, 0.068878174, 0.41997644, -0.039344516, -0.020811452) * inp_0_0_1; + result0 += M4(-0.00054955384, 0.014067522, 0.29207587, -0.16043621, -0.01351949, -0.08538314, -0.18636976, 0.19134319, 0.05039821, -0.093454875, 0.23129071, -0.29693934, -0.013584321, 0.08959259, -0.2683566, 0.21759026) * inp_0_1_1; + result0 += M4(0.012457035, 0.018976199, -0.10622637, 0.08818159, 0.011355054, 0.005865674, -0.018169943, -0.0063354126, -0.020067457, 
-0.032704737, -0.04071966, -0.021879561, 0.0071899095, 0.018855078, 0.12129616, -0.098034054) * inp_0_2_1; + result0 += M4(0.0065247775, -0.08215552, -0.012008458, 0.01703386, -0.09267752, -0.05647333, 0.020818327, -0.028593764, -0.014271322, -0.03788656, -0.020144267, 0.057078477, -0.008407014, 0.26333922, 0.019777702, -0.039687045) * inp_0_0_2; + result0 += M4(-0.064684056, 0.0026886077, -0.076331764, 0.09625828, 0.1110674, -0.045051012, 0.09687265, -0.05024201, -0.11028242, -0.07762572, -0.07028817, 0.036931906, 0.006109739, -0.08666, 0.017680138, 0.013017057) * inp_0_1_2; + result0 += M4(-0.00059720327, -0.03823437, 0.018477794, -0.052589536, -0.07530563, 0.043434873, -0.010242496, -0.009225539, 0.009707166, 0.0665768, -0.0029107493, 0.025805281, -0.017479628, 0.037734512, 0.028485654, -0.06030078) * inp_0_2_2; + result1 += M4(-0.0040805386, -0.04037355, -0.016298028, -0.10901159, 0.0075836866, 0.068849795, -0.0015867921, 0.08682354, -0.023941765, 0.09033158, 0.005955157, 0.07716451, -0.00027787118, -0.0027789993, 0.02263391, 0.03503209) * inp_0_0_0; + result1 += M4(-0.07058509, -0.08898672, -0.010795215, -0.24106635, 0.060452018, 0.027231239, 0.010219462, 0.12779248, -0.018958434, 0.009836416, -0.0048490902, -0.04708482, -0.0052001905, 0.0869615, -0.0153578855, 0.21318588) * inp_0_1_0; + result1 += M4(0.0018951882, 0.029790182, -0.018424176, 0.093001716, 0.021929987, 0.033413723, -0.0014516768, 0.028860403, -0.029973764, -0.038182214, -0.014042475, -0.113934435, -0.05061862, 0.018797146, 0.0062874416, 0.00840364) * inp_0_2_0; + result1 += M4(0.09108281, 0.12842284, -0.018321656, 0.101437524, 0.027001908, -0.1170763, -0.02120495, 0.011102345, 0.01890289, 0.050531536, -0.0261549, 0.11677346, -0.09126036, 0.018427776, 0.019214539, -0.12438176) * inp_0_0_1; + result1 += M4(0.015747905, 0.089796506, 0.070704944, 0.14218248, -0.25985935, 0.06523569, -0.074167654, -0.2468187, 0.052781288, 0.16311482, 0.011219645, 0.23202926, 0.29769585, -0.14658746, -0.011744472, 
-0.1010643) * inp_0_1_1; + result1 += M4(0.019483117, -0.081753485, -0.04673089, 0.004953991, -0.01471788, -0.057692084, -0.014760175, 0.004616836, 0.0422738, 0.07234505, 0.016358959, 0.10570093, -0.10613088, 0.0013665945, 0.056043588, 0.033560395) * inp_0_2_1; + result1 += M4(-0.032377638, -0.036992475, -0.11856061, -0.06043218, -6.167084e-05, 0.071027756, -0.0020108805, 0.18424764, -0.019465916, 0.02570314, -0.063401304, 0.005627003, 0.013067235, -0.08386608, 0.046325788, -0.07629352) * inp_0_0_2; + result1 += M4(-0.03403502, -0.21124011, 0.128395, -0.118983746, 0.11138527, 0.18360862, 0.15476844, 0.20760833, -0.069354326, -0.32101798, -0.17294091, 0.0053785504, -0.007118223, 0.13378446, -0.22533989, -0.1316874) * inp_0_1_2; + result1 += M4(-0.0032518269, 0.13455972, -0.047548614, 0.006280591, 0.014651311, 0.18860312, 0.012555325, 0.32387522, -0.00876885, 0.06728457, -0.03561065, -0.008271451, -0.027320381, -0.08463112, 0.123492375, -0.17134361) * inp_0_2_2; + result2 += M4(0.04966542, -0.014303865, 0.009559554, 0.050956815, 0.022178259, 0.051871855, 0.014207632, 0.019486817, -0.007377738, 0.063087024, 0.0013534816, 0.073808886, 0.097131714, -0.031721152, -0.0050633196, 0.0027983838) * inp_0_0_0; + result2 += M4(-0.071889535, -0.07981853, 0.029291, 0.0133744525, 0.02921235, -0.11562819, -0.038736906, 0.040879827, -0.05101825, 0.020087246, 0.027933752, -0.07056633, 0.024828767, 0.020775083, -0.03545826, 0.029901035) * inp_0_1_0; + result2 += M4(0.031110793, -0.106053896, -0.10874414, 0.06562912, 0.015990185, 0.07383382, 0.034378067, -0.043125585, 0.038731106, -0.021163106, -0.07850288, 0.048384033, -0.026847137, -0.09662953, -0.045504253, 0.08047158) * inp_0_2_0; + result2 += M4(-0.10335108, -0.01401889, 0.0038016094, -0.11588568, 0.036600247, 0.037577584, -0.007868014, -0.09576454, -0.018236142, -0.02697432, -0.025315316, 0.06763838, 0.17294714, 0.0654633, -0.02221289, 0.010515907) * inp_0_0_1; + result2 += M4(0.031055294, 0.0437143, -0.030369015, 0.25869074, 
-0.080643415, 0.05039154, 0.061441638, -0.14613687, -0.06329736, -0.04495888, -0.037863605, -0.06050588, -0.037237942, 0.04440609, 0.15861167, 0.059269182) * inp_0_1_1; + result2 += M4(0.0361052, -0.017285489, -0.15113652, 0.12752944, 0.001336428, -0.052559424, -0.19642851, 0.095575675, 0.065766186, -0.020980414, -0.1751973, -0.027264522, -0.16278692, -0.07947443, 0.041906893, -0.1923021) * inp_0_2_1; + result2 += M4(0.0058025694, -0.10522837, -0.003142448, 0.029614868, -0.12325673, -0.10741578, 0.0011671841, 0.008194599, 0.02683286, 0.05202333, -0.0081239175, 0.054529086, -0.0066502932, -0.01873842, 0.00828223, -0.008685434) * inp_0_0_2; + result2 += M4(0.011555687, 0.019120391, 0.0068035405, -0.033768255, -0.11139161, -0.07871454, 0.016408984, -0.08887099, -0.009325316, -0.014493788, -0.0042881635, -0.010129332, -0.028416067, -0.06053119, -0.028769666, -0.0074731703) * inp_0_1_2; + result2 += M4(-0.13009775, -0.04216335, 0.03589062, -0.05918483, 0.0063349833, 0.075580046, -0.06637416, -0.037039958, -0.11341202, 0.011516089, 0.03915498, 0.015401149, 0.09263449, -0.043401238, 0.035506167, 0.07418732) * inp_0_2_2; + result3 += M4(-0.055232104, -0.052181397, 0.09712439, 0.053068426, 0.008184627, 0.024033103, 0.0064768447, 0.01491977, -0.10160054, 0.056887053, -0.08783956, -0.15666912, 0.023039022, 0.10843832, -0.005499212, 0.07572511) * inp_0_0_0; + result3 += M4(0.01975557, 0.14321215, -0.119914174, 0.083147004, -0.075017564, 0.060033094, 0.02153906, -0.097562775, 0.14652961, 0.14147766, 0.12143339, 0.009040502, 0.029516807, 0.2184188, 0.13927828, 0.024003804) * inp_0_1_0; + result3 += M4(0.04161908, -0.12291186, 0.014007055, -0.0044366475, 0.065806784, 0.021362163, -0.03280152, 0.009637781, -0.0008115923, -0.11553343, -0.20894948, -0.039682742, -0.075024076, 0.094884165, 0.006231465, -0.021898488) * inp_0_2_0; + result3 += M4(0.07448278, -0.08064785, 0.1783025, 0.34271577, 0.028346969, -0.16897051, 0.031269226, -0.20038049, 0.032590013, -0.21115056, 0.0056216186, 
0.04599637, -0.15385234, 0.055903055, 0.14891788, -0.08639215) * inp_0_0_1; + result3 += M4(0.33081916, 0.18709011, 0.10239755, 0.14202496, 0.074805714, 0.094217606, 0.078011304, 0.13345073, 0.18732202, -0.10334045, -0.2688966, 0.016904162, -0.104053885, -0.25665408, 0.5058878, -0.12103951) * inp_0_1_1; + result3 += M4(-0.080311626, 0.0096476115, -0.018007856, 0.0033822898, -0.040847033, 0.00077008334, -0.06762089, -0.019284576, -0.046603885, 0.05875434, 0.020478599, -0.015789887, 0.15411441, 0.20997126, -0.055525854, 0.036925472) * inp_0_2_1; + result3 += M4(0.036129907, -0.21834287, 0.046575624, 0.09891928, -0.049099892, 0.0012149358, -0.0941673, 0.06713417, 0.005362152, -0.008132467, 0.029246638, -0.025881121, -0.021541959, 0.1865162, -0.056459565, 0.15184881) * inp_0_0_2; + result3 += M4(-0.099397436, 0.11888237, 0.02868581, 0.023543233, 0.08439208, -0.22925763, -0.072643846, -0.19373773, -0.03718246, -0.043030668, -0.0279274, -0.02950604, 0.014288387, 0.12906073, 0.027930567, -0.028679885) * inp_0_1_2; + result3 += M4(0.035180163, 0.0027005104, 0.0058912137, 0.0039001005, -0.013516835, -0.063876055, 0.068691954, 0.050706748, 0.02708764, 0.11582471, -0.04711184, -0.0068420544, -0.05498892, 0.094348386, -0.051397104, 0.0029429044) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.0128763085, 0.052068323, -0.011954824, 0.0021608714, 0.00030223568, 0.017587025, -0.01058941, 0.008313421, -0.01251023, 0.29738817, -0.17888871, 
0.17669652, 0.02183395, 0.11471337, 0.012121865, -0.056569528) * inp_1_0_0; + result0 += M4(0.013480782, -0.30869487, 0.12514831, -0.056587443, -0.06087438, -0.043470133, -0.12944093, 0.1333073, -0.033362042, 0.16611177, 0.26333383, -0.3493265, -0.012774537, 0.01958674, -0.025693916, -0.00576545) * inp_1_1_0; + result0 += M4(-0.0045791795, 0.057620887, 0.031712543, -0.021927495, 0.034111075, 0.04401428, -0.00932385, 0.02523834, -0.05177421, -0.037475258, -0.00818403, 0.18527389, 0.0073408224, 0.013466603, -0.018797964, -0.008819587) * inp_1_2_0; + result0 += M4(0.03511881, -0.31476012, -0.028296899, 0.014868918, -0.053283457, -0.11248065, -0.05588429, 0.052380826, 0.0022158825, -0.20020013, -0.013065737, 0.0059395954, -0.026061038, 0.009230161, 0.041668627, -0.04549138) * inp_1_0_1; + result0 += M4(-0.03102469, 0.048471652, -0.18547377, 0.11187585, -0.03838462, 0.062065408, -0.25089842, 0.27000895, 0.15203376, 0.1822979, 0.024691727, -0.05018225, 0.11352361, -0.13844427, -0.08078384, 0.16746117) * inp_1_1_1; + result0 += M4(0.05993513, 0.0053647747, -0.051664807, -0.009675976, -0.034741007, -0.016219925, -0.06747187, 0.08026824, 0.13252358, 0.2971501, 0.024876906, 0.021718679, -0.031329714, -0.0050613126, 0.085378274, -0.09904521) * inp_1_2_1; + result0 += M4(-0.057906702, -0.11236472, 0.023313101, -0.02293448, -0.03768937, -0.2251109, -0.016215017, -0.00950604, 0.068863146, 0.30394804, -0.012602742, 0.013618551, -0.014835617, 0.28404757, -0.0015931885, -0.02047274) * inp_1_0_2; + result0 += M4(0.10332839, 0.14611422, 0.05431722, -0.060723606, 0.09322961, 0.15063441, 0.03119704, 0.022710817, 0.01185925, 0.044084266, 0.05836641, -0.04914897, -0.11924304, -0.10219539, -0.023038983, -0.003801836) * inp_1_1_2; + result0 += M4(-0.08029915, -0.046139803, 0.008697404, -0.01117896, -0.043575782, -0.09271846, -0.0020342334, -0.014879644, -0.06671466, -0.02011031, 0.023232145, -0.06101047, 0.0013811433, 0.077171504, 0.034526013, -0.060139507) * inp_1_2_2; + result1 += 
M4(-0.019680703, -0.006418717, -0.004702196, 0.21885663, -0.019759674, 0.0102063, -0.002012741, 0.02891873, 0.08375299, 0.04083115, -0.008229031, -0.070820324, -0.033556238, -0.009796709, 0.0035726011, 0.120267294) * inp_1_0_0; + result1 += M4(0.22270824, -0.05971591, 0.014297061, 0.16603453, -0.17384386, -0.082323544, -0.012659822, -0.26011658, -0.39758298, -0.27216193, -0.0003004569, 0.14809889, -0.017855754, -0.12187555, -0.0056101284, -0.36598822) * inp_1_1_0; + result1 += M4(-0.0053077796, 0.07974863, 0.0044853278, 0.17476735, -0.05587634, 0.000478736, 4.7219305e-06, 0.013212377, 0.17053604, -0.061615106, 0.034866598, -0.1701907, 0.037163932, 0.0093364, -0.0059611164, 0.031372953) * inp_1_2_0; + result1 += M4(-0.005903216, -0.047463845, -0.0034881225, 0.020824652, -0.009203731, 0.053911712, 0.04947658, 0.004140391, 0.102251, -0.1762965, -0.111852996, 0.0038294205, -0.062487774, -0.07207221, 0.050615903, -0.019346781) * inp_1_0_1; + result1 += M4(-0.22630687, 0.045354478, -0.052379932, -0.3705097, -0.29889983, -0.077089064, 0.19144304, -0.035254218, -0.09279178, -0.41239044, 0.23899618, -0.3868468, 0.18396308, 0.12465744, 0.020112954, 0.074541666) * inp_1_1_1; + result1 += M4(-0.016391076, 0.17111103, 0.005496715, 0.053091466, -0.07366343, -0.12970647, 0.030588876, -0.010529222, 0.014089911, -0.008137579, -0.07495139, 0.11865472, -0.1468576, -0.019079275, -0.032410286, -0.07259862) * inp_1_2_1; + result1 += M4(0.0151464455, 0.027335307, -0.028206328, -0.029740231, -0.0077183773, -0.017693141, -0.009017493, -0.04187936, 0.0021898046, 0.016073616, -0.053040896, 0.087421216, 0.011279699, 0.036217406, 0.06301923, -0.012236634) * inp_1_0_2; + result1 += M4(0.041095432, 0.2537466, 0.17225754, 0.11324849, 0.026644496, -0.08952341, 0.2803843, 0.030880537, 0.03209173, 0.28756225, 0.042938236, 0.14979622, -0.036367867, -0.30107048, -0.115396775, -0.23922656) * inp_1_1_2; + result1 += M4(0.008334098, 0.1433527, -0.014165843, 0.028277045, 0.013517422, -0.012090402, 
0.028212752, 0.016341574, -0.019476518, 0.08225366, 0.02954602, 0.056807607, -0.0013000853, -0.10133523, 0.10570841, 0.0040202886) * inp_1_2_2; + result2 += M4(0.00020585542, -0.10595579, -0.024075527, -0.043914355, 0.035975162, -0.110578425, 0.0005285829, 0.048812922, -0.122295074, 0.024852939, 0.00926203, -0.104586475, 0.006746198, 0.026529612, -0.005823842, -0.032530647) * inp_1_0_0; + result2 += M4(0.12146054, -0.02784996, -0.014604895, 0.15886171, -0.1691908, -0.10535379, -0.03362664, -0.24715196, -0.011940299, -0.028050655, -0.08629228, 0.08535456, 0.08652907, -0.0057366705, -0.013718489, -3.2006486e-05) * inp_1_1_0; + result2 += M4(-6.391767e-05, -0.03701326, 0.18519332, 0.004163531, -0.008389772, -0.04877323, -0.3238021, 0.11442726, 0.42126325, 0.07359092, -0.08448461, 0.2498309, 0.0030401861, 0.057449795, 0.0109812785, 0.04928388) * inp_1_2_0; + result2 += M4(-0.00012884365, -0.00072631775, -0.0041053053, 0.013112391, -0.09921218, -0.067468196, -0.014271074, -0.12439954, -0.035519533, -0.08444414, -0.017164286, 0.0024305168, 0.06430278, -0.008736951, 0.030803327, 0.08006712) * inp_1_0_1; + result2 += M4(0.12315418, -0.088640936, -0.050914943, -0.044375017, 0.13423163, -0.08564678, -0.102095746, 0.18636574, 0.15668021, 0.04321122, 0.057674617, 0.17986007, -0.017220415, -0.059452653, 0.047418516, -0.25613683) * inp_1_1_1; + result2 += M4(-0.065463364, -0.09421511, 0.16259682, 0.037939362, -0.1232132, -0.111910224, 0.22589701, -0.031586938, -0.15750502, 0.03500383, -0.02621489, -0.22954142, -0.13212022, 0.0063589057, -0.008052567, -0.092233874) * inp_1_2_1; + result2 += M4(-0.052525025, -0.03922068, 0.003195036, 0.025051178, -0.03326035, -0.08989328, -0.006789344, 0.0030992923, 0.034772567, -0.091194555, -0.009219043, 0.0696772, -0.047364756, 0.055251293, -0.006822553, -0.12333176) * inp_1_0_2; + result2 += M4(-0.017599246, -0.038083553, 0.023908038, -0.09640398, -0.013075659, -0.04444389, -0.006169872, 0.0292883, -0.046958275, -0.048682574, 0.012830524, 
-0.17958483, -0.024997052, 0.028825838, -0.03318397, -0.0043117087) * inp_1_1_2; + result2 += M4(0.024646105, -0.10364469, -0.021210829, 0.028682416, 0.0731311, 0.02400633, 0.0031529882, -0.012837452, -0.13710135, -0.018319733, -0.015243259, -0.031686984, 0.059482705, 0.042210914, -0.09135384, -0.095729634) * inp_1_2_2; + result3 += M4(0.0034101333, 0.05535736, 0.024105577, 0.021848775, -0.018094912, -0.054792136, 0.035593905, -0.107914925, 0.079538144, -0.15841089, 0.28956112, 0.2037883, -0.026085768, 0.19641061, -0.17448546, 0.02818008) * inp_1_0_0; + result3 += M4(0.013099687, -0.25685248, -0.21123523, -0.058896057, 0.13408852, -0.06408254, -0.038902212, 0.148966, -0.36242187, 0.9573575, -0.38538298, 0.20866586, -0.0135457115, -0.17544252, 0.21034725, -0.01854412) * inp_1_1_0; + result3 += M4(0.015325741, 0.109892145, -0.029220585, 0.0414602, -0.08171769, 0.0672044, -0.09715838, -0.024387505, -0.110984795, 0.87591684, 0.36287174, 0.02873156, -0.045318272, 0.03970228, 0.044567477, 0.019652335) * inp_1_2_0; + result3 += M4(0.048121918, 0.08487519, -0.0110788485, -0.10335771, 0.053024076, -0.019237788, 0.115838595, 0.27692616, -0.038947303, -0.07734193, 0.08789802, -0.13361062, -0.084543034, -0.063710235, -0.039903134, -0.082545) * inp_1_0_1; + result3 += M4(-0.111958675, -0.12849922, -0.042949416, -0.007649164, -0.09928454, -0.22055286, -0.1844109, -0.15226477, 0.06964548, 0.29758227, 0.2469849, 0.07742351, -0.094236195, 0.034951027, 0.13522738, 0.0133545175) * inp_1_1_1; + result3 += M4(-0.050296642, -0.28410354, 0.015063976, -0.006128918, -0.0470889, 0.008160088, 0.0020720777, 0.039283343, 0.10286344, 0.28448346, 0.02644191, 0.0026204113, 0.01836578, 0.084340185, -0.08349685, 0.013048368) * inp_1_2_1; + result3 += M4(-0.010066227, 0.015333275, 0.040386546, 0.0027275602, -0.048058737, -0.13380641, 0.047336664, -0.03337915, 0.0035930146, -0.06406163, 0.033675723, 0.12354965, 0.06876556, 0.020875918, 0.018492095, -0.09037671) * inp_1_0_2; + result3 += 
M4(-0.011871062, -0.002620799, 0.004697188, 0.011113553, 0.0071302364, 0.16026612, -0.037049957, 0.044946592, 0.015945464, 0.122067764, -0.0033488947, 0.018354658, -0.022900213, 0.02081817, 0.024235805, 0.041325647) * inp_1_1_2; + result3 += M4(0.00051608094, -0.111439236, 0.049050186, -0.0017189587, -0.012687636, -0.18043011, 0.032639593, -0.011066172, 0.003809168, 0.10372078, -0.00017059076, -0.0061963093, 0.010642897, 0.21251322, 0.01499975, -0.00060482975) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.018767586, 0.37946993, 0.03240346, -0.074103445, 0.013256744, -0.73405415, 0.025663486, 0.0037305616, 0.014623672, 0.007632366, 0.013873153, -0.015707593, -0.0046343533, -0.20099154, -0.038023286, 0.022481618) * inp_2_0_0; + result0 += M4(0.037362464, -0.029853325, 0.11825507, -0.1266219, -0.035908747, -0.027179906, -0.09394578, -0.107248306, 0.000541979, -0.061200544, -0.024837013, 0.0053975997, 0.017814586, -0.05382926, 0.0922865, -0.15499015) * inp_2_1_0; + result0 += M4(-0.026803698, -0.03689163, 0.024773858, -0.024776613, 0.023835085, 0.103969544, -0.01580862, -0.014334969, -0.002205302, -0.0065507595, 0.058469918, -0.05255904, -0.016154546, -0.026679695, -0.0022297816, -0.014502392) * inp_2_2_0; + result0 += M4(0.028078122, 0.2794735, 0.02043743, -0.013269822, -0.0069112084, -0.2905295, 0.0067768595, 0.0008341885, -0.05023395, 0.10181315, 0.07705284, -0.054124117, 0.06520775, -0.04132514, -0.11068868, 0.052190818) * 
inp_2_0_1; + result0 += M4(-0.10037066, -0.15912087, 0.055432197, 0.3000064, -0.014009785, -0.20990136, -0.09185901, -0.18783937, 0.011323513, 0.06145226, 0.26730964, -0.38835666, 0.08074848, 0.11648274, 0.107400686, 0.13202316) * inp_2_1_1; + result0 += M4(0.054533374, -0.030651595, 0.064748436, -0.11521519, -0.082970746, -0.16089259, -0.07056045, -0.0122828195, -0.008300171, 0.030350173, 0.2764626, -0.24443032, 0.027398918, -0.060851287, -0.050053008, 0.06686099) * inp_2_2_1; + result0 += M4(-0.030806756, 0.28152052, 0.016293688, 0.00019218923, 0.06385456, -0.768716, -0.008862266, -0.0013578102, 0.09297159, 0.17276277, 0.015002878, -0.011491623, 0.039086744, 0.12742285, -0.037600823, -0.028224783) * inp_2_0_2; + result0 += M4(-0.113680325, -0.090142876, 0.009299604, -0.042315293, -0.23041852, 0.10187753, -0.02534172, 0.015198311, -0.19454521, -0.03534942, 0.09299287, -0.05797667, 0.35324952, -0.034904387, 0.06753692, -0.06613343) * inp_2_1_2; + result0 += M4(-0.0041130786, 0.07705423, 0.029097408, -0.021241808, -0.14221656, 0.071248285, 0.0027881418, 0.02272239, 0.013451467, 0.0041271113, 0.04043472, -0.049031157, 0.05890192, 0.00071542076, -0.030902434, -0.01806016) * inp_2_2_2; + result1 += M4(-0.0100553315, 0.1445101, 0.025206093, 0.16367912, -0.0077398536, 0.057262916, -0.0018721124, 0.009491158, -0.019690538, -0.00050403655, -0.0022982846, 0.0064275805, 0.03182664, 0.08586602, 0.005296856, 0.11086229) * inp_2_0_0; + result1 += M4(0.100263774, 0.032224674, 0.007614719, 0.3077328, -0.11689845, 0.045522682, 0.005368042, -0.6640451, 0.05671755, 0.06947968, 0.0059584933, 0.12661453, 0.114836976, 0.0078067435, 0.012673742, 0.14992271) * inp_2_1_0; + result1 += M4(-0.014965994, -0.03613807, 0.017843746, 0.057888564, 0.0016416174, 0.039073598, 0.004485906, 0.01314407, -0.07619885, -0.013138787, 0.01482138, -0.014854271, 0.02104871, 0.058661107, 0.00537317, 0.059871946) * inp_2_2_0; + result1 += M4(-0.019947665, -0.02337146, -0.05745076, 0.06390522, 0.0061994577, 
-0.03513352, 0.0039894506, -0.1870658, 0.07621767, -0.041756485, 0.0042083175, -0.09015903, 0.050684888, -0.032862004, -0.0383148, -0.06806279) * inp_2_0_1; + result1 += M4(0.11575761, -0.03566747, -0.1419168, 0.07686426, -0.11935506, -0.5449443, -0.019731725, -0.4439198, 0.15448299, 0.06354772, -0.050596375, -0.17802976, -0.039333005, -0.1836554, -0.10640459, -0.024331508) * inp_2_1_1; + result1 += M4(-0.06137397, -0.028483927, -0.01319596, 0.029112315, 0.02215432, -0.47851038, -0.013122113, -0.37099057, -0.064374104, 0.12437201, 0.09441625, 0.0964911, 0.061800938, -0.020516852, -0.024200046, -0.080888055) * inp_2_2_1; + result1 += M4(-0.02180753, 0.2914682, 0.07562381, -0.046386164, 0.010121207, 0.020429429, 0.013896352, 0.010339173, -0.008270475, -0.0005158645, -0.0496025, 0.018030144, -0.0029540863, 0.053199697, -0.12489866, 0.07791219) * inp_2_0_2; + result1 += M4(0.03735715, 0.30508387, 0.15844251, -0.1175811, -0.03410126, -0.7469112, -0.13593495, 0.020091493, 0.0056048105, -0.1562087, -0.20568803, 0.007995341, 0.045260154, 0.37609518, 0.27776894, 0.14643498) * inp_2_1_2; + result1 += M4(-0.010797698, 0.18568471, 0.05050696, -0.03671986, -0.01899938, -0.3269143, -0.05808486, -0.057467256, -0.01960092, -0.17659442, 0.12925349, -0.14431082, -0.018930312, 0.18480995, -0.07412044, 0.15717995) * inp_2_2_2; + result2 += M4(-0.046204865, -0.103821956, -0.010860188, 0.037352648, 0.045176484, -0.11509887, 0.0032391804, 0.05722828, -0.014318247, -0.020388361, -0.006871636, 0.012856181, 0.0663493, -0.014491342, -0.00056829635, -0.018839898) * inp_2_0_0; + result2 += M4(0.015519363, -0.04379356, -0.048258897, 0.0092985695, -0.12677082, -0.0840051, -0.03845116, -0.44977376, 0.024705162, -0.08450324, -0.007273154, 0.003961096, 0.1205917, -0.06583735, 0.09004664, 0.056332048) * inp_2_1_0; + result2 += M4(-0.045568097, -0.03407655, 0.13666867, -3.1876676e-05, 0.019434048, -0.0877716, -0.32850698, -0.2531008, -0.06927688, -0.05049396, 0.07952079, 0.016784674, 0.037036795, 
0.06620619, 0.044526313, -0.14102459) * inp_2_2_0; + result2 += M4(0.10563744, -0.054532535, -0.02444866, -0.04438278, 0.0056826673, -0.10505247, -0.0025805442, -0.011387135, -0.0163086, -0.0750018, 0.0057180603, 0.017566675, 0.020842876, -0.069835514, -0.025404071, -0.06463173) * inp_2_0_1; + result2 += M4(-0.09687428, -0.013830805, -0.0043008714, 0.19830416, -0.3254863, 0.07027251, 0.090760596, -0.42412746, -0.026216919, -0.042083472, 0.08191527, 0.08890029, 0.32130423, -0.10276524, -0.046229154, -0.09222065) * inp_2_1_1; + result2 += M4(-0.028740982, 0.05833635, -0.074025534, -0.11106386, -0.12051663, -0.016884184, -0.8760091, -0.21653624, -0.023070619, -0.086227246, -0.3356709, -0.10698863, 0.19418916, -0.06019335, 0.55395144, 0.04142959) * inp_2_2_1; + result2 += M4(-0.10068316, -0.055732206, 0.0039255223, 0.03194576, 0.0169547, -0.11442009, 0.0066540116, -0.06813424, 0.098051235, -0.104861155, 0.00054658856, 0.035421174, 0.078026086, -0.013412237, -0.0028990135, 0.050640628) * inp_2_0_2; + result2 += M4(-0.11782882, -0.123334214, -0.0017048669, -0.09074227, -0.012847767, -0.104540326, -0.024515854, 0.017064922, -0.12106071, 0.01742032, 0.024233157, -0.12282968, 0.1479409, 0.010675117, 0.03142114, -0.08293813) * inp_2_1_2; + result2 += M4(0.08341529, -0.093824685, -0.0050690966, 0.016659621, -0.1323844, -0.08899898, 0.011605324, 0.009853149, 0.1091089, -0.0008812067, 0.03615029, -0.014381648, 0.035703827, -0.0058702324, -0.01723073, -0.09445252) * inp_2_2_2; + result3 += M4(-0.0033674666, 0.27479184, -0.14520442, 0.056195375, 0.021564325, 0.120622255, 0.0747343, -0.06224032, -0.0316305, 0.08231498, -0.07389498, 0.02856619, -0.045992043, -0.35338366, 0.029923819, 0.039241537) * inp_2_0_0; + result3 += M4(-0.08923331, 0.017857159, 0.35180876, -0.07138678, 0.04999131, -0.57993644, -0.33715415, -0.06651225, 0.05477934, -0.14006998, 0.039397564, -0.043427624, -0.06581547, 0.23676425, 0.17026886, -0.17200765) * inp_2_1_0; + result3 += M4(0.10055006, 0.033518847, 
-0.050471883, -0.021379095, -0.13827854, -0.2650917, -0.06516931, 0.02099619, -0.07549386, 0.044028837, -0.0010062923, 0.00819925, 0.020101171, -0.03921381, 0.023089815, 0.02456863) * inp_2_2_0; + result3 += M4(0.03165244, -0.07129725, -0.23964712, -0.23844421, -0.037724618, -0.17837454, 0.016393203, -0.25098523, 0.06200857, 0.086369134, -0.027192384, -0.18964183, 0.039954573, -0.17039742, 0.13961609, 0.23892525) * inp_2_0_1; + result3 += M4(0.071400404, -0.015791003, 0.18592079, -0.10519635, -0.27906966, -0.4978389, -0.18447538, -0.12677093, -0.3329094, -0.0574575, 0.0017264464, -0.07430323, -0.031537917, 0.42141986, -0.11500433, -0.09284232) * inp_2_1_1; + result3 += M4(-0.01741798, 0.052760378, -0.06376725, -0.053840555, 0.12993482, -0.33029583, -0.043332346, -0.0067290626, 0.20229244, 0.1036244, -0.05800761, -0.013660656, -0.09456258, -0.32976916, -0.068030186, -0.0017372206) * inp_2_2_1; + result3 += M4(0.061151385, 0.28756905, -0.1282007, 0.072775304, 0.015067437, 0.06658751, -0.0007233735, 0.049608916, -0.025705693, 0.09252448, -0.081732415, -0.00092824135, -0.10873655, -0.07075192, 0.013692618, -0.10097195) * inp_2_0_2; + result3 += M4(0.019418621, -0.14067507, 0.12894523, -0.08513426, -0.017363464, 0.044414137, 0.06420442, 0.0006786324, 0.1281164, 0.056295928, -0.007402897, -0.017317312, -0.006835481, 0.11457798, -0.0066917334, -0.13481094) * inp_2_1_2; + result3 += M4(0.0070297364, 0.19065014, -0.017244624, 0.014097578, 0.02551897, 0.013782661, -0.00926291, -0.00593344, -0.004784505, 0.16583267, -0.021029223, -0.020769436, -0.035404734, -0.09736763, 0.00019690121, -0.01409137) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x 
+ 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.02849564, 0.20801629, 0.07789714, -0.08591794, -0.013138032, -0.12500729, -0.05955897, -0.009347837, -0.0026199075, -0.18090871, 0.04996966, -0.024295611, 0.023241067, 0.2989913, -0.022329632, -0.01068407) * inp_3_0_0; + result0 += M4(0.006488096, 0.16587855, -0.023761768, 0.008591953, 0.017688885, 0.03924619, 0.037046492, 0.017823525, -0.032084648, -0.04694791, -0.038628716, 0.06675431, -0.05275973, -0.27945307, -0.10931105, 0.0933604) * inp_3_1_0; + result0 += M4(-0.0011106502, -0.09068102, -0.008446835, 0.0063396683, -0.0095890695, 0.080751486, 0.03700392, -0.010667634, 0.010742994, 0.020316003, -0.09261909, 0.07645715, 0.04386066, 0.20862317, 0.011739568, -0.019822497) * inp_3_2_0; + result0 += M4(0.092012346, -0.99243253, 0.08192624, -0.01996185, -0.12249764, -0.23786958, 0.02590213, 0.061792508, 0.024931097, -0.19624819, 0.020123413, -0.015653277, -0.1624149, -0.09031144, 0.036892284, -0.07276322) * inp_3_0_1; + result0 += M4(0.04910099, -0.05648109, 0.23602869, -0.32097897, -0.1457341, -0.16602312, -0.13416448, -0.12093756, 0.2184975, -0.059735287, -0.27835158, 0.3410014, 0.22202568, 0.010500871, 0.07437828, 0.13752706) * inp_3_1_1; + result0 += M4(-0.005880409, 0.055422354, -0.022551373, -0.0059791715, 0.018647302, 0.029757852, 0.019998867, 0.049658902, -0.04080723, -0.08332848, -0.15499778, 0.14148471, -0.17509991, -0.040453184, 0.09497388, -0.07449588) * inp_3_2_1; + result0 += M4(0.08568281, -0.29432014, -0.029305942, 0.053156, 0.06250727, 0.063061155, 0.0035598758, 0.003287929, -0.025394496, -0.06501153, 0.00040421658, 0.0016468758, -0.27703464, 0.046435226, 0.012366997, -0.08402375) * inp_3_0_2; + result0 += M4(0.032805514, 0.037855648, 0.056718554, -0.031252827, -0.19035767, -0.008683348, 0.040429004, 0.024449537, -0.2014328, -0.021833923, 
-0.08468981, 0.04139073, -0.37713024, -0.023530802, -0.08192364, 0.059064213) * inp_3_1_2; + result0 += M4(0.010253931, -0.09591305, -0.05260071, 0.07549732, -0.09035534, 0.055765323, 0.0043522757, -0.02160955, 0.06055933, 0.02745642, 0.0030234493, -0.013425673, 0.12574619, 0.080521055, 0.0094557395, -0.003933899) * inp_3_2_2; + result1 += M4(-0.012831924, -0.0132940365, 0.014013292, -0.038607925, -0.04236358, -0.0040199724, 0.00038156085, -0.06882647, 0.0035105674, -0.05997285, -0.019546315, -0.0690018, -0.05382405, -0.18697755, -0.016889963, -0.5278594) * inp_3_0_0; + result1 += M4(0.074903056, 0.030982196, -0.009691815, 0.021653235, -0.08748461, -0.12714823, -0.0073664947, -0.2103852, 0.27545306, -0.172489, -0.0138034215, -0.29320762, 0.01954728, -0.02743053, -0.023833975, -0.19926408) * inp_3_1_0; + result1 += M4(0.013739132, -0.112030625, 0.002236266, -0.11029386, 0.08357734, 0.029980266, -0.034573138, 0.19402589, 0.10511627, 0.018066818, -0.022175178, -0.06294438, -0.053210363, 0.02821048, 0.019673957, -0.048769414) * inp_3_2_0; + result1 += M4(-0.055812005, -0.124672994, -0.0028307915, 0.058708996, 0.0993413, 0.11292148, 0.0051302207, 0.09086054, -0.08655739, 0.018395796, 0.02877268, 0.05893856, -0.020206036, 0.2676144, 0.046343397, 0.2983221) * inp_3_0_1; + result1 += M4(-0.34456164, 0.16105084, -0.014667792, -0.11443499, -0.15428352, 0.019309709, 0.098831594, -0.22864045, 0.2626861, 0.15095614, -0.23578995, 0.29990196, 0.18960963, 0.21112593, 0.093182735, 0.47255817) * inp_3_1_1; + result1 += M4(0.059633996, 0.09617087, -0.044195272, 0.10701252, -0.0113297105, -0.19980581, -0.06557026, -0.35609877, 0.19168015, -0.17455539, -0.13791767, -0.080850326, -0.01642995, 0.2259445, 0.03632761, 0.34964672) * inp_3_2_1; + result1 += M4(-0.021547923, -0.033423975, 0.12387771, -0.15235455, -0.064095765, -0.22966129, -0.053911634, 0.009297953, 0.016425744, -0.031667043, 0.050109, -0.041998934, -0.0255521, -0.6661454, 0.0064874776, -0.06525574) * inp_3_0_2; + result1 += 
M4(-0.00955878, -0.18819161, 0.20119229, 0.067589976, 0.059636027, -0.21445525, -0.15586011, 0.12951705, -0.023852644, -0.17125781, -0.22089507, -0.15525785, 0.021554073, -0.24427617, -0.11932995, -0.11995491) * inp_3_1_2; + result1 += M4(0.00027492762, -0.011149431, -0.04397851, -0.015187671, -0.018693645, 0.17604014, 0.036288437, 0.027685415, 0.02450683, 0.028729985, -0.18002404, -0.06767717, -0.018331988, -0.06327862, 0.06566395, -0.04259143) * inp_3_2_2; + result2 += M4(0.020330925, -0.07583019, 0.00040865978, 0.17905723, -0.12488742, -0.038913324, -0.013407421, -0.15406337, -0.029491287, -0.019691758, 0.0037197322, -0.03494804, -0.048548967, -0.10085025, -0.011280026, -0.08775244) * inp_3_0_0; + result2 += M4(0.009023494, -0.08019787, 0.042378664, -0.005744673, -0.14025515, 0.04256303, 0.001598648, 0.21287486, 0.19740039, 0.006873391, 0.02995404, -0.017945066, 0.082922794, 0.045110267, -0.021023361, -0.0863003) * inp_3_1_0; + result2 += M4(0.012322307, -0.07433875, 0.27594987, -0.014473471, -0.085696355, 0.0740318, -0.10467701, -0.03484768, 0.04685408, -0.017835882, 0.16549787, -0.01544419, -0.15037893, -0.03528296, -0.059958216, -0.039337374) * inp_3_2_0; + result2 += M4(0.13516413, -0.015549442, 0.04405686, -0.08380343, -0.112463795, -0.11393289, 0.010840805, 0.06926739, 0.06683571, -0.013422019, 0.009995389, 0.13865924, -0.11091083, -0.04586237, -0.024832733, -0.10614919) * inp_3_0_1; + result2 += M4(-0.18775412, -0.05149138, 0.26367128, 0.06821067, -0.60855925, 0.024774756, 0.021855973, -0.29352945, -0.06843421, 0.054736953, 0.05677782, -0.15776412, -0.23566322, 0.024886563, 0.18402183, -0.35429534) * inp_3_1_1; + result2 += M4(0.03283841, -0.07640909, -0.23255424, 0.010227406, -0.20778243, 0.00991061, -0.17909159, 0.12931508, 0.08077656, 0.046959363, -0.17226915, 0.052532163, 0.010613912, 0.061070718, -0.24095905, -0.18562591) * inp_3_2_1; + result2 += M4(0.0634982, -0.08347916, 0.03740913, -0.0013856665, 0.045188613, 0.07850495, -0.0029027993, 
0.034063198, -0.010978764, 0.02016892, -0.002155239, -0.061337594, -0.28043994, -0.0872294, -0.011892446, -0.35126853) * inp_3_0_2; + result2 += M4(0.3203884, -0.024319857, 0.09506602, 0.023610925, -0.27575597, -0.042449426, -0.017148286, 0.14666425, -0.13386834, 0.02054439, -0.05575814, 0.1107654, -0.16863112, 0.022383632, 0.08456575, 0.14868464) * inp_3_1_2; + result2 += M4(-0.016137088, 0.002761102, -0.0030788647, 0.09071825, -0.10555493, -0.11326085, 0.016684838, -0.06471668, -0.09259946, 0.0008187052, -0.074667886, 0.007401484, 0.16636859, 0.08404795, 0.1367621, 0.019132363) * inp_3_2_2; + result3 += M4(-0.084024556, -0.034183636, -0.11003828, 0.07596261, 0.009530936, -0.123412155, 0.062994644, -0.0016971333, 0.030774757, 0.06060111, -0.112204134, -0.015265249, 0.06952364, -0.12871222, -0.1793224, -0.082263656) * inp_3_0_0; + result3 += M4(0.035075944, -0.03648615, -0.03251158, -0.02360845, 0.09579168, -0.093637735, -0.12766589, 0.02200376, 0.05223472, -0.38457364, 0.2035677, -0.06779454, 0.075349145, 0.24952288, 0.2585974, -0.026620159) * inp_3_1_0; + result3 += M4(0.05988551, 0.024185207, 0.053580564, 0.00680627, -0.010874452, -0.118844636, 0.077303134, 0.0002133361, -0.002078051, -0.13200852, -0.059146896, -0.016534718, -0.0701598, 0.3903104, -0.044406667, 0.06022056) * inp_3_2_0; + result3 += M4(-0.0680266, 0.13831161, -0.099020086, 0.027603677, -0.012557745, -0.12612383, 0.009141904, 0.0027618592, -0.048944946, -0.04472969, -0.019392889, -0.050438944, -0.30377015, 0.09719155, -0.1927275, -0.21734476) * inp_3_0_1; + result3 += M4(-0.0345394, -0.087790735, -0.5650414, 0.06738396, -0.08137511, -0.33920997, -0.13534264, 0.13543794, 0.13309768, -0.15364899, 0.15392002, 0.051194873, 0.24646005, -0.035910964, 0.35060343, -0.029892717) * inp_3_1_1; + result3 += M4(-0.02596073, -0.3088059, -0.008306526, -0.0453417, 0.008620145, 0.13213503, -0.14677626, 0.0022890011, -0.1017914, -0.16327615, 0.15063281, 0.03946359, 0.028780328, 0.01931414, -0.08703548, 0.047522143) 
* inp_3_2_1; + result3 += M4(-0.028443659, -0.04586124, -0.079354525, -0.22521858, -0.0010945717, 0.18372962, -0.16510531, -0.11550843, 0.060972877, -0.0015049014, 0.011682705, -0.014153036, -0.18183236, -0.27702382, -0.13596578, -0.065135516) * inp_3_0_2; + result3 += M4(0.017811868, 0.15783854, -0.028239341, 0.059509262, 0.038688328, -0.36765572, 0.10929163, -0.010511875, -0.10294899, -0.1696231, 0.008989734, 0.07924746, -0.37400815, -0.12820886, -0.0072698053, -0.12196404) * inp_3_1_2; + result3 += M4(-0.0034627488, -0.07924724, 0.05619683, -0.012788033, 0.018114138, -0.024447763, -0.07260673, 0.005397169, 0.029772269, -0.095115826, -0.011049113, -0.026298985, -0.016546406, 0.17970195, -0.023208177, -0.0030759405) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 (Conv2D-5) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_4 +//!SAVE conv2d_5 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = 
local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(-0.0018953535, 0.0058265817, 0.018822813, -0.013862387); + V4 result1 = V4(-0.0010489298, 0.005604526, -0.00053814566, 0.0020017463); + V4 result2 = V4(0.010203275, 0.011347302, 0.0063539655, -0.00053525064); + V4 result3 = V4(-0.0053338343, 0.001321621, 0.036247738, -0.019181821); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.19293816, -0.24982975, -0.21115892, 0.023415579, 0.009774828, 0.06236626, 0.08222207, -0.0629858, 0.0619333, 0.012681148, -0.14015609, 0.07153636, -0.13429844, -0.05804902, 0.18437627, -0.058576047) * inp_0_0_0; + result0 += M4(-0.4484673, -0.96403027, -0.21804763, -0.33155116, 0.13409126, 0.11143466, 0.07317458, -0.034854446, 0.0052757114, -0.02699294, -0.0018612333, -0.010977338, -0.08321815, 0.047566846, 0.0144794155, 0.04763027) * inp_0_1_0; + result0 += M4(0.5540873, -0.32753128, -0.6608504, -0.2889768, 0.119986236, 0.08951169, 0.1222837, -0.1704321, -0.028143425, -0.08819469, -0.033623528, 
0.014351359, 0.008765508, 0.04452446, 0.020204451, -0.00047179594) * inp_0_2_0; + result0 += M4(0.0037529117, 0.080815926, 0.057914045, 0.10689451, 0.043663103, 0.12956528, 0.10605515, -0.008775666, -0.063651286, -0.08790763, -0.0064682956, -0.045193557, 0.035341766, 0.037771374, -0.10269953, 0.018227393) * inp_0_0_1; + result0 += M4(0.16825603, 0.12547831, 0.21248084, 0.2577808, 0.20802349, 0.13508378, 0.50583375, 0.16538978, 0.29226398, -0.73408896, 0.031909198, -0.14322773, -0.5266555, 0.68081826, -0.1012102, 0.02099461) * inp_0_1_1; + result0 += M4(0.17190212, -0.01142557, -0.1571053, 0.0655869, -0.057913907, 0.36778232, -0.15601146, -0.0419103, -0.1550589, -0.123147294, 0.06394219, 0.092019394, 0.21199438, 0.15671359, -0.046308175, -0.124025375) * inp_0_2_1; + result0 += M4(-0.0008404076, 0.004338585, 0.0019855557, 0.00018114936, -0.020474406, 0.06057655, 0.030161498, -0.06145807, -0.04435459, -0.08627908, 0.10944488, 0.01887649, -0.03103268, 0.03310187, -0.17767999, -0.019043589) * inp_0_0_2; + result0 += M4(0.12954727, -0.12922326, 0.2350974, 0.049719814, 0.13253595, 0.09160491, -0.21646306, -0.04050591, -0.036288727, -0.056381904, 0.0121351825, 0.04496311, -0.31566897, 0.11194864, -0.42841324, -0.016267655) * inp_0_1_2; + result0 += M4(-0.024690468, 0.014333521, -0.06532126, -0.0041400986, -0.10427263, 0.18187162, 0.01258527, -0.019371599, 0.1249462, 0.024022829, -0.031402778, 0.02241293, -0.26506376, 0.08613873, -0.12220515, -0.0029115404) * inp_0_2_2; + result1 += M4(0.31627145, 0.15249805, -0.08140558, 0.42994848, -0.09804992, -0.012594858, 0.0026646887, -0.0043445844, 0.043157805, 0.109746225, -0.026367161, 0.09464095, -0.015199039, -0.14187415, 0.12840094, -0.067172185) * inp_0_0_0; + result1 += M4(-0.1638916, -0.36235115, -0.1975086, 1.575765, -0.1965545, -0.08610196, -0.10926018, -0.00033870476, 0.040758844, -0.0061201644, -0.08756401, 0.04615102, 0.035327163, 0.044442933, 0.10312399, 0.036930207) * inp_0_1_0; + result1 += M4(-0.8492598, -0.33897942, 
0.72526574, 0.4631478, -0.17841868, -0.1410183, -0.16832137, -0.013158105, 0.033784576, -0.025566028, 0.0039394298, 0.0092234295, -0.02678299, -0.0073904945, -0.015628401, 0.02390855) * inp_0_2_0; + result1 += M4(0.08460976, -0.009893607, 0.061330132, 0.051070828, -0.16053094, 0.007680145, -0.0623621, -0.07080623, 0.09263616, -0.07130709, 0.094535634, -0.0007521465, -0.06824691, -0.017334202, -0.14649309, 0.05471789) * inp_0_0_1; + result1 += M4(0.21807747, -0.008780514, -0.23558716, -0.07192246, -0.11119064, -0.045066413, -0.01870417, 0.16801721, 0.45134255, 0.14678022, 0.013131626, -0.12167587, -0.34481934, -0.20810209, 0.008862433, 0.14668722) * inp_0_1_1; + result1 += M4(0.10040009, -0.23140623, 0.13991402, 0.13232943, -0.44653964, -0.22550936, 0.041132253, -0.030094247, 0.057539612, -0.09650221, -0.20644088, 0.07337908, -0.0066268765, 0.061737567, 0.22057678, 0.13231337) * inp_0_2_1; + result1 += M4(-0.0073576197, 0.019599516, 0.017028693, 0.00043496815, -0.098762505, -0.010775835, 0.034300815, -0.07583991, 0.042083025, 0.06400441, 0.08720754, -0.007852188, 0.0372069, -0.1406307, -0.076517396, -0.074295625) * inp_0_0_2; + result1 += M4(0.0059161535, 0.0372593, 0.13355313, 0.22900341, -0.16262229, -0.15288241, -0.3086904, -0.120383196, 0.021071693, -0.13865116, -0.007022702, -0.07665101, -0.024432838, -0.033629846, -0.012343005, -0.23553605) * inp_0_1_2; + result1 += M4(0.028445385, -0.009794425, -0.023792878, -0.075042315, -0.12081588, -0.055164486, 0.13519762, -0.108135365, -0.085314415, -0.031570014, 0.027543535, -0.044589665, 0.13610293, -0.018678987, -0.14013505, -0.15338679) * inp_0_2_2; + result2 += M4(0.21252534, -0.11910489, -0.45723984, -0.06417371, -0.021582598, 0.02339392, -0.018546809, -0.012605804, 0.032364845, -0.035078682, 0.058367588, -0.0005620972, 0.051605877, 0.0215126, -0.16632713, 0.026713151) * inp_0_0_0; + result2 += M4(-0.4662353, 0.36299333, -1.5159458, -0.50809747, -0.23438907, 0.030885411, 0.06186301, 0.06464797, 0.016437657, 
-0.0112345265, -0.114750154, -0.010771786, 0.00076314394, 0.031646077, 0.23297943, 0.08224971) * inp_0_1_0; + result2 += M4(-0.5306165, 0.022781476, -0.6611916, -0.13589059, -0.29746577, -0.03359175, 0.1488752, 0.08763788, 0.0734923, 0.016807996, -0.014261707, -0.009930438, -0.052407317, -0.011143981, -0.0003923795, 0.0061985618) * inp_0_2_0; + result2 += M4(0.07399199, 0.0057193898, 0.025029065, 0.037136503, -0.09694074, -0.015754705, 0.0858824, 0.02630069, 0.1436345, -0.024873883, -0.042757105, -0.0028142098, -0.13067973, 0.016069483, -0.07657447, 0.03459619) * inp_0_0_1; + result2 += M4(-0.024490986, -0.056364402, -0.12789075, -0.2377805, -0.35516652, -0.11532965, 0.096392564, 0.3001136, 0.50962794, -0.09597639, -0.13577257, 0.02288129, -0.62172246, 0.2233473, -0.027296012, 0.3107101) * inp_0_1_1; + result2 += M4(-0.1822321, -0.019152636, -0.03883703, 0.06758995, -0.32357153, 0.010696737, -0.20381221, -0.14015651, 0.04149892, 0.08667886, 0.052319348, -0.028778236, -0.08863007, -0.1016996, -0.026162509, 0.21760902) * inp_0_2_1; + result2 += M4(-0.019655038, 0.01048052, 0.014871437, 0.0047376687, -0.05845112, -0.027396418, 0.0135491295, -0.01598734, 0.010417036, -0.027401034, 0.041378684, 0.10007943, -0.0045745275, -0.03977022, -0.06537003, -0.05988692) * inp_0_0_2; + result2 += M4(0.051048204, 0.112982355, 0.030450165, -0.11833691, -0.22066031, -0.020368785, 0.07926755, -0.14934708, 0.1024632, 0.05717762, 0.07574149, 0.037296783, -0.108641684, -0.14161289, -0.18493624, -0.097702526) * inp_0_1_2; + result2 += M4(0.022333367, -0.035479385, -0.06719012, 0.072104804, -0.13920522, -0.06867922, 0.1834858, 0.09901816, -0.10181411, -0.011209808, -0.03838759, -0.079485156, 0.1112582, -0.04442816, -0.03244046, 0.17494577) * inp_0_2_2; + result3 += M4(-0.008458485, 0.559754, -0.1359481, -0.20492737, 0.010565355, 0.07826572, -0.04546082, -0.06438555, 0.044124458, 0.015091466, -0.039031394, 0.024674136, -0.015993683, -0.046678152, 0.038969137, 0.08587786) * inp_0_0_0; + 
result3 += M4(-0.12672317, 0.7919048, 0.09465808, -0.28959075, 0.17336527, 0.2023873, -0.07387402, -0.09773626, 0.21337758, -0.035826, -0.023157721, -0.026020411, -0.35271186, -0.004095575, -0.043581124, 0.092579946) * inp_0_1_0; + result3 += M4(-0.0762927, 0.6058523, 0.210049, -0.15095702, -0.12984839, 0.046832986, 0.003953526, -0.09747306, 0.07599791, 0.03548356, -0.052436605, 0.007820468, -0.013407755, 0.014487795, 0.04603643, 0.010825038) * inp_0_2_0; + result3 += M4(-0.039665997, -0.035092063, -0.06810712, 0.108950034, -0.000649656, 0.13788638, -0.015922725, -0.0054936605, 0.017050518, -0.23598951, -0.0052512363, 0.035469808, -0.026771294, 0.17689878, 0.026165131, 0.060948808) * inp_0_0_1; + result3 += M4(0.20632705, -0.16090605, -0.24408017, -0.053601943, -0.2055891, 0.5841354, -0.037936993, -0.042822365, 0.48433793, 0.15146664, -0.039210964, 0.2029982, -0.5239856, -0.14422977, 0.07044831, -0.02499571) * inp_0_1_1; + result3 += M4(-0.14769523, 0.030178303, 0.007047456, 0.10304811, 0.17505062, 0.3024603, 0.0046870145, -0.20263235, 0.09975853, 0.13236913, -0.11148928, 0.22456545, -0.2844659, -0.14753824, 0.21022335, -0.16320874) * inp_0_2_1; + result3 += M4(-0.021687089, 0.013914326, 0.005674425, -0.02157544, 0.06648613, 0.13842705, 0.010751784, -0.0279543, 0.09411157, 0.043079033, -0.0016886615, 0.053833924, -0.047202144, -0.04031651, -0.006346014, -0.06269334) * inp_0_0_2; + result3 += M4(0.010542784, -0.038660403, -0.027727835, 0.0442041, -0.058916762, 0.21794543, -0.0050698183, -0.03180731, 0.29513338, -0.21027178, -0.030230556, 0.12158278, -0.059518564, 0.16094229, 0.092587315, -0.17798163) * inp_0_1_2; + result3 += M4(-0.01876096, -0.033373438, 0.013868456, -0.06437974, 0.10535872, 0.2320939, -0.041797537, -0.03412653, 0.042804, -0.019821629, 0.017664902, 0.02014612, -0.008958272, -0.04446397, -0.04071955, -0.08878301) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; 
+ const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.01583359, 0.06754533, -0.01712357, -0.03930749, 0.019515904, 0.0476419, -0.04839703, 0.099027, -0.02762645, -0.07761426, -0.14227375, 0.005808833, 0.062241603, 0.032665376, -0.10276744, 0.0037447736) * inp_1_0_0; + result0 += M4(0.176867, 0.074107334, -0.16574392, -0.06600555, -0.17686988, 0.40425017, 0.5451527, 0.13584052, -0.17639911, -0.19718716, 0.2380433, 0.040593807, 0.10853866, 0.046141937, -0.2325924, 0.007987454) * inp_1_1_0; + result0 += M4(0.0772586, 0.12861234, 0.08976759, 0.03701837, 0.19125976, 0.10426821, -0.040152878, -0.07515106, -0.14654006, -0.20254305, -0.13209806, 0.07523701, 0.03458956, -0.012815592, -0.028856799, 0.029668355) * inp_1_2_0; + result0 += M4(0.019110488, 0.060465347, 0.12735324, 0.029926497, 0.020046815, 0.08939445, -0.010156248, -0.0047141416, 0.009727405, -0.030973857, -0.07694125, -0.0052544693, -0.0875518, -0.080452956, -0.05976568, -0.096559025) * inp_1_0_1; + result0 += M4(0.42901465, 0.2590428, 0.13991387, 0.07037277, 0.36930072, 0.10277632, 0.35448986, 0.0075549292, 0.3952787, -0.24613738, 0.39837205, -0.077002235, 0.63838506, -0.36808252, 0.0059239357, 0.23111042) * inp_1_1_1; + result0 += M4(0.02320368, 0.10004724, 0.0126293525, -0.090640485, -0.067141384, 0.019517098, -0.01910994, -0.08992004, -0.015479739, -0.039290965, 0.058866188, 0.023926063, -0.08454309, -0.10365931, 0.0992991, -0.01995878) * inp_1_2_1; + result0 += M4(0.017662264, 0.048447046, -0.009959364, -0.04590219, 0.015489817, 0.07478854, 0.0035829754, -0.044818107, -0.020652944, 1.7518421e-06, 
0.024685964, 0.012436587, -0.009526269, -0.0948704, 0.23454551, -0.00925439) * inp_1_0_2; + result0 += M4(0.10283008, -0.003436092, 0.12427426, 0.086562015, 0.204189, -0.042327147, 0.064794585, 0.015408602, 0.07648754, 0.08140967, 0.14045514, -0.025799247, -0.04064487, -0.2135315, 0.069888115, -0.020488435) * inp_1_1_2; + result0 += M4(0.062685005, -0.0087055005, -0.049382843, -0.014352606, 0.028499393, -0.027238736, 0.09515428, -0.023900118, -0.071811944, -0.03655884, -0.04257451, -0.010197308, 0.029228672, -0.005827241, -0.12256195, -0.029949382) * inp_1_2_2; + result1 += M4(-0.07721696, 0.019634021, -0.065468505, -0.0538411, 0.15386713, 0.105303764, -0.05682918, 0.014476583, 0.21499005, 0.09528613, -0.035307407, -0.0109019205, -0.017080473, 0.06655509, -0.14565326, 0.021859277) * inp_1_0_0; + result1 += M4(-0.08070917, 0.014726409, 0.07630219, -0.1974782, -0.045234982, -0.10786042, -0.20062084, 0.00798719, 0.2289415, 0.15024285, -0.24757579, -0.11945095, -0.06408308, 0.023932865, 0.13997374, -0.08553081) * inp_1_1_0; + result1 += M4(-0.103800066, -0.0119613, -0.0497909, -0.13598542, -0.090290286, 0.13484626, 0.29374337, -0.085325494, 0.13760795, 0.09128403, 0.10423313, -0.022034246, 0.0075501916, 0.033313587, 0.08877397, -0.06258862) * inp_1_2_0; + result1 += M4(-0.19667187, 0.07910811, 0.14975567, 0.11546245, -0.007856336, 0.05762079, -0.026586441, -0.047359627, 0.0952913, -0.0048787566, 0.009396981, 0.07306324, -0.05333312, -0.092696056, 0.1484569, -0.014510268) * inp_1_0_1; + result1 += M4(-0.4483713, -0.08914751, -0.06830535, 0.22022808, -0.02908167, 0.19700284, -0.23201343, 0.100948244, 0.10150403, 0.36964548, 0.3682474, 0.38162547, -0.07337941, 0.32787672, 0.22884098, -0.17473112) * inp_1_1_1; + result1 += M4(-0.11851422, -0.1997371, -0.09265734, -0.068350844, 0.027532142, 0.0598685, 0.20098667, 0.19505432, -0.0071426006, 0.122263566, 0.09087172, 0.14061768, -0.068963185, -0.22508137, -0.27521184, 0.05226415) * inp_1_2_1; + result1 += M4(-0.08752191, 
-0.035636704, -0.026970783, -0.0063899173, -0.06535668, -0.0097355945, 0.0016719002, -0.028427562, 0.04458897, -0.008972722, 0.0011736943, -0.040193666, 0.06178452, 0.09981747, 0.13165061, 0.066930525) * inp_1_0_2; + result1 += M4(-0.08367123, -0.05284521, 0.027751574, 0.05405288, -0.013956896, 0.13211827, 0.02718628, 0.04126972, 0.013591151, 0.05696284, 0.021740496, -0.06569428, -0.13156594, -0.2217979, 0.12002505, 0.081010014) * inp_1_1_2; + result1 += M4(-0.09057673, -0.065086775, 0.052175682, 0.040668074, -0.0011252841, 0.033768404, 0.055707283, 0.1775509, 0.024380935, -0.0029724136, 0.011439569, -0.036639195, -0.034154296, -0.040933546, -0.04963123, -0.27177313) * inp_1_2_2; + result2 += M4(-0.07619493, 0.015114808, 0.12194339, -0.05388546, 0.122937895, 0.06766423, 0.08985467, -0.0026659921, 0.16911712, -0.12348506, 0.10205851, 0.0040722685, -0.08778425, -0.04494511, 0.13364732, -0.05704994) * inp_1_0_0; + result2 += M4(0.067183, -0.08808697, 0.061798133, 0.026947606, -0.2520032, 0.27808714, -0.12131742, -0.073309034, 0.10515911, -0.05996287, -0.10040219, -0.3855947, 0.09427887, -0.040533386, -0.11460287, -0.11597825) * inp_1_1_0; + result2 += M4(-0.19422445, -0.044388153, 0.030549884, -0.022434473, -0.052113403, -0.03193732, 0.058239404, -0.095854744, 0.20687638, 0.091036074, 0.040095903, -0.12101788, 0.029437194, -0.009060895, -0.091376856, -0.08326711) * inp_1_2_0; + result2 += M4(-0.033702653, 0.062329434, 0.056782924, 0.1510267, 0.10268749, -0.0012141394, 0.028026294, 0.06589578, 0.07167968, 0.0382477, -0.036623612, -0.05445876, 0.061408594, -0.007828243, 0.08684674, 0.061775405) * inp_1_0_1; + result2 += M4(0.18673033, -0.010594418, 0.11519751, -0.015496185, -0.060910117, 0.17213313, 0.10663717, -0.23498611, -0.11552151, 0.12067305, -0.11170714, -0.006541151, 0.41895327, -0.13074741, -0.12857904, -0.28355864) * inp_1_1_1; + result2 += M4(-0.16524398, -0.055524822, -0.0810091, -0.029351775, 0.05192384, -0.032889236, 0.038031064, -0.058420878, 0.061196484, 
0.009064973, 0.0010509911, 0.03512171, -0.15589699, -0.004647887, 0.021679884, 0.044907816) * inp_1_2_1; + result2 += M4(-0.044117562, -0.019335665, 0.03378335, -0.027249482, -0.055734895, -0.007945039, -0.0096593145, -0.043825258, 0.00033283542, 0.00740868, -0.008989796, 0.011453801, -0.0032866534, -0.03677149, 0.08357763, 0.13552722) * inp_1_0_2; + result2 += M4(-0.056846637, 0.06251862, 0.10164459, -0.049285304, 0.013761074, 0.044591248, 0.08373373, 0.05985056, -0.08572338, -0.023269488, 0.038841605, -0.015587152, 0.021170331, 0.11302778, 0.11370839, -0.32551986) * inp_1_1_2; + result2 += M4(-0.05821609, 0.004350518, -0.047714118, -0.026734909, 0.010570952, 0.0018678942, -0.017686881, 0.03402182, 0.030670093, 0.0034491834, 0.046588063, 0.023750719, -0.018057328, 0.01436053, -0.016733939, -0.0806178) * inp_1_2_2; + result3 += M4(0.024148023, -0.056969013, -0.007182248, -0.06978146, -0.18521935, 0.049342513, -0.1059268, -0.010528267, -0.13987224, -0.046478126, 0.011630029, 0.03975061, 0.028102472, -0.015797462, 0.041665286, -0.052644428) * inp_1_0_0; + result3 += M4(0.23887786, -0.03063249, -0.0078508025, -0.110535435, -0.47775343, 0.31345952, 0.037840076, 0.1917282, -0.4675718, 0.18246669, -0.071136154, 0.07569014, 0.3363767, -0.05939815, 0.03330824, -0.1149139) * inp_1_1_0; + result3 += M4(-0.03199022, -0.027461693, -0.017600277, -0.01040416, -0.3335923, -0.16069661, -0.0011826943, -0.14604628, -0.10750828, -0.031318568, -0.11515191, 0.14961019, 0.01875921, -0.05859786, 0.0062334435, -0.026974274) * inp_1_2_0; + result3 += M4(0.16624868, 0.08622376, 0.013066398, -0.013561043, -0.14781322, 0.06166629, -0.01690182, 0.03240959, -0.19101089, -0.23269162, 0.023481557, 0.039373416, 0.10989115, -0.33205244, 0.06563763, -0.03763514) * inp_1_0_1; + result3 += M4(0.763446, -0.36806998, -0.054857958, -0.054847606, -0.6365203, 0.124305926, -0.11834348, 0.012177892, -0.41701862, -0.12154834, 0.19443808, 0.23409277, 0.74961615, -0.14717795, 0.08279371, 0.010061856) * 
inp_1_1_1; + result3 += M4(0.3890335, 0.11852343, 0.06878882, -0.106771834, 0.0013103477, 0.036700066, 0.061958365, -0.23648676, -0.13740712, -0.031022822, -0.005026855, -0.0040705674, 0.3481052, 0.21652177, 0.13818942, 0.14510764) * inp_1_2_1; + result3 += M4(0.024962775, -0.00930012, 0.016999796, -0.007042678, -0.049675427, 0.0561294, 0.010110364, -0.020104202, -0.027516196, 0.02439481, -0.018409938, -0.015501763, 0.07540284, 0.080506206, 0.0070816637, 0.019382445) * inp_1_0_2; + result3 += M4(0.18482067, 0.02875042, -0.028305996, 0.056233536, -0.25161085, -0.07676187, -0.030247726, 0.031174812, -0.16452968, 0.17400448, -0.05394027, -0.11061602, 0.5713144, -0.07015428, 0.0838255, 0.13299061) * inp_1_1_2; + result3 += M4(0.066211306, 0.086373925, 0.025565708, -0.018157946, 0.023741372, 0.08362605, 0.034379553, 0.005279233, -0.03009191, -0.006536514, -0.0043627736, -0.026205579, 0.032223664, -0.11968535, 0.0042308527, -0.02536624) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.020806601, 0.0011769276, -0.06854966, 0.06404834, 0.010257402, 0.09078626, -0.09029915, -0.038121767, -0.08009543, 0.024868483, 0.33892182, 0.02145583, 0.054771744, 0.049150817, -0.011070969, -0.028411673) * inp_2_0_0; + result0 += M4(-0.038379848, -0.008772784, 0.029454285, 0.043145403, -0.028629266, -0.008691371, -0.040970787, -0.06477745, -0.1791925, 0.003425941, -0.14729068, 0.16579328, 0.13128689, -0.002635605, -0.13834825, 0.05271074) * 
inp_2_1_0; + result0 += M4(-0.091530494, -0.014356574, 0.03452029, 0.058324084, -0.047370777, 0.042062152, 0.052640617, 0.08313879, 0.011118099, -0.019573802, -0.05845368, -0.027856722, 0.1666636, 0.10776295, -0.053498384, -0.035426028) * inp_2_2_0; + result0 += M4(-0.07106617, -0.12926805, 0.11532138, -0.025411379, -0.02660926, -0.011154649, -0.0171705, 0.013136738, -0.65104634, 0.24976598, 0.12305868, -0.6479581, 0.24736935, -0.21200751, 0.08362573, -0.07467725) * inp_2_0_1; + result0 += M4(-0.033144828, -0.2901839, 0.19474508, -0.018116087, -0.0337689, -0.0077542337, 0.022090381, 0.011201993, 0.0003965253, 0.10669989, -0.06420536, 0.21434414, -0.025104653, 0.25331414, -0.094278105, 0.015236804) * inp_2_1_1; + result0 += M4(0.054170903, -0.03878034, 0.023502445, -0.04763652, 0.0436261, 0.02125075, -0.07865895, 0.008801445, -0.03805679, 0.017889298, 0.08710609, 0.028471842, 0.1409927, 0.24610753, 0.18868911, -0.0038281744) * inp_2_2_1; + result0 += M4(-0.024401257, 0.029200602, -0.037531514, 0.020089343, 0.0031562252, -0.015761279, 0.08060079, 0.07492363, -0.75374854, 0.069819294, -0.6806557, -0.22842103, -0.01784711, -0.0015924854, -0.02660206, 0.06682451) * inp_2_0_2; + result0 += M4(-0.18408458, 0.04495705, -0.27017567, -0.04060905, -0.060091477, 0.04199921, 0.042240314, -0.05247994, 0.01244936, -0.11446392, 0.012699051, 0.19231313, 0.16377899, -0.0021420936, 0.20178908, 0.022177307) * inp_2_1_2; + result0 += M4(-0.076426975, 0.060788747, -0.12581491, -0.026730899, 0.078445174, 0.031476885, -0.018560112, -0.027070913, 0.032900266, -0.012133513, -0.06886763, 0.048137616, 0.32230917, -0.11296064, 0.15351215, -0.010818085) * inp_2_2_2; + result1 += M4(0.06736406, 0.075990364, 0.0043325764, 0.043084458, 0.066263326, 0.08283939, 0.01714942, -0.043197032, -0.034201793, -0.19740304, -0.028645728, -0.42067948, -0.17401718, -0.10356778, -0.21782434, -0.1368192) * inp_2_0_0; + result1 += M4(0.121906675, 0.040143315, -0.06954, 0.029039154, -0.064667046, 0.00652776, 
-0.016123066, -0.042725384, 0.076855555, 0.10874429, 0.057248183, 0.1804212, -0.024840739, -0.001273071, 0.20704693, -0.25340644) * inp_2_1_0; + result1 += M4(0.053181823, 0.010691048, -0.041441515, -0.020986209, 0.07976909, -0.08821121, -0.028313044, 0.08507492, -0.015487181, -0.010594703, 0.04398618, 0.10098527, -0.10889402, -0.0034516156, 0.08802651, 0.039294768) * inp_2_2_0; + result1 += M4(0.122033805, 0.02009872, 0.11733401, -0.01198582, 0.0035701713, 0.085737005, 0.0051125716, -0.08456334, 0.121365964, -0.4063034, -0.073627055, -0.8934959, 0.07101478, -0.0012460023, -0.13605523, 0.4156497) * inp_2_0_1; + result1 += M4(0.09683759, -0.22955927, 0.10484432, -0.26306942, -0.084963664, -0.054211535, 0.0077070566, -0.030115092, 0.05744336, 0.25544357, -0.22682056, -0.22863898, 0.034472905, 0.31963208, -0.19928747, 0.9492331) * inp_2_1_1; + result1 += M4(0.070213765, -0.0038610063, 0.0033997372, 0.06119504, -0.047582276, -0.09507793, -0.083675615, 0.08001755, 0.040334526, 0.037215024, -0.068379946, -0.018164538, -0.0459578, 0.09890098, -0.13228115, -0.16900617) * inp_2_2_1; + result1 += M4(-0.036349338, 0.03735424, -0.013125493, -0.04058556, 0.04095882, -0.011006372, -0.09501445, 0.009363677, -0.13656218, -0.39543343, -0.08865905, -1.3125815, 0.09805664, -0.108527824, -0.039054662, -0.06415699) * inp_2_0_2; + result1 += M4(0.13630877, -0.095158935, -0.10042646, -0.3309934, 0.010858195, -0.07095434, 0.045891337, -0.067784145, 0.009857397, 0.14819881, 0.054163657, 0.04177505, -0.15756398, 0.24096744, 0.013504479, 0.39090788) * inp_2_1_2; + result1 += M4(0.0065320977, -0.014341278, -0.023192916, -0.05885387, -0.046773493, -0.035404146, 0.0049495073, -0.04104518, -0.0531538, -0.012901377, 0.077806786, -0.05745816, -0.21440023, -0.019557446, 0.20342024, 0.27739877) * inp_2_2_2; + result2 += M4(0.057360508, 0.014503564, 0.059143994, 0.010198468, -0.02674482, 0.0022251438, 0.06575039, -0.008726433, -0.09188913, -0.12177862, 0.2584525, 0.1557489, -0.33377033, -0.037951965, 
0.1340623, -0.07428824) * inp_2_0_0; + result2 += M4(0.15755674, -0.027416268, 0.031757925, 0.030080441, -0.092128694, -0.05288516, 0.07390179, 0.070589304, 0.042379964, 0.05825198, 0.097974725, -0.07958051, 0.026712047, 0.021791503, -0.19539036, -0.13505116) * inp_2_1_0; + result2 += M4(0.06732846, 0.02477517, 0.047421448, -0.0350228, -0.026210636, -0.07957982, 0.06680819, 0.090554416, 0.003016353, 0.002736857, -0.06721213, 0.016317641, -0.1511062, -0.03932932, -0.0411404, 0.037391737) * inp_2_2_0; + result2 += M4(0.044398054, -0.0039024032, -0.039489146, 0.015305246, 0.085481696, -0.031782832, -0.048250176, -0.04576736, 0.056205854, -0.34265697, 0.3497672, 0.015577426, -0.053595997, -0.056706756, -0.110979, 0.0770339) * inp_2_0_1; + result2 += M4(-0.17363448, 0.109652765, 0.194541, -0.1697986, 0.0554414, 0.027986523, 0.09817557, 0.08573731, -0.13382511, -0.059311867, -0.3453238, 0.2896559, 0.62732804, 0.21806855, -0.0051348326, -0.074557506) * inp_2_1_1; + result2 += M4(-0.0042801355, -0.0034563097, -0.012686132, 0.13073713, -0.033048425, 0.08372879, -0.091064066, -0.085343346, 0.033698123, 0.0035512336, -0.015234775, 0.026158987, -0.022497516, -0.04325933, -0.08212852, -0.010965832) * inp_2_2_1; + result2 += M4(0.01627358, 0.0012432971, 0.03353438, 0.020683315, 0.025408963, -0.059527367, 0.0027960425, 0.027919134, -0.09517613, -0.38686842, 0.17250046, 0.2563248, -0.031954054, -0.032314193, -0.073108226, 0.002805501) * inp_2_0_2; + result2 += M4(0.11107625, 0.0020363845, -0.060272653, 0.17112932, -0.060560506, 0.08849239, -0.042447433, 0.04453629, -0.19810289, -0.030767849, 0.054445386, -0.36024103, -0.043574344, -0.0359943, 0.08719419, 0.11635041) * inp_2_1_2; + result2 += M4(0.01508289, -0.03601694, -0.04689985, 0.06605909, 0.08663423, -0.019983027, 0.04276954, -0.05810252, -0.049331795, -0.011382104, 0.047108665, -0.035963446, -0.15027761, 0.04916842, 0.046085328, -0.3091649) * inp_2_2_2; + result3 += M4(-0.01954963, -0.05955776, 0.0366114, 0.03241877, 
0.0811955, -0.08231828, -0.017435858, -0.08624713, -0.19084726, -0.00130446, -0.0041784286, 0.36175868, 0.07715551, -0.020533009, 0.027846111, -0.05263875) * inp_2_0_0; + result3 += M4(0.038249742, 0.05213642, 0.022535365, 0.07490527, 0.08845503, -0.0865709, -0.06229371, 0.043499216, -0.034865715, 0.00839816, -0.10632363, 0.15028821, 0.22725908, -0.21485256, 0.059532907, -0.100963406) * inp_2_1_0; + result3 += M4(0.036063094, 0.0029133533, -0.030805418, 0.07174674, -0.02426538, -0.051893298, 0.10046242, 0.05046725, 0.021173801, 0.032548554, 0.035410833, -0.017246148, -0.047212694, -0.0019793957, 0.05575738, -0.07261234) * inp_2_2_0; + result3 += M4(-0.01674299, -0.008884916, 0.010768661, -0.01639755, -0.08142729, -0.0053191427, -0.036633592, 0.07607754, -0.7825981, -0.43916854, 0.038573936, 0.37393776, -0.08752398, 0.12226086, -0.0039705704, -0.10482764) * inp_2_0_1; + result3 += M4(-0.16088066, -0.121415704, 0.07007931, 0.1544625, -0.08467529, 0.018081093, 0.049794823, 0.04264284, 0.16043149, -0.032744974, -0.23247649, 0.19149105, 0.22916554, 0.4088795, -0.22852364, 0.07474784) * inp_2_1_1; + result3 += M4(-0.09823339, -0.04523368, 0.13438235, 0.05503274, 0.094729334, 0.025204461, -0.010783659, 0.040687785, -0.0020735054, -0.035414696, -0.028707825, 0.009774318, 0.13749972, -0.007978513, -0.10437224, -0.16205452) * inp_2_2_1; + result3 += M4(0.03452105, -0.0019801871, -0.008515022, 0.042908445, 0.023343097, -0.039268777, -0.05582678, -0.01785084, 0.1909139, 0.30671456, -0.09177103, -0.18535422, 0.03572424, 0.096279085, -0.052728545, -0.0008020096) * inp_2_0_2; + result3 += M4(0.04167784, -0.09262971, -0.034826137, -0.04459923, -0.034247838, -0.087677866, -0.077725075, -0.059959635, -0.083735585, -0.08568067, 0.0026664583, 0.38268802, -0.21485022, -0.18185435, 0.031202722, 0.118082285) * inp_2_1_2; + result3 += M4(-0.01308469, -0.039964344, 0.02419818, -0.051316794, -0.045073602, -0.07852878, -0.0641165, 0.10274802, -0.03722715, 0.016585138, -0.01557483, 
0.054411575, 0.058821086, 0.17634773, 0.09275543, 0.16511928) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.16157526, 0.0708418, -0.17742826, 0.037568346, 0.1363335, -0.039198983, -0.12991804, 0.12523568, -0.0315292, 0.066681534, 0.019297564, -0.045476478, 0.050666958, 0.0070537156, -0.0741803, 0.043249052) * inp_3_0_0; + result0 += M4(-0.09018603, -0.049359206, 0.18229158, -0.014263066, -0.26950583, -0.22213577, 0.18419883, 0.07491064, 0.107961394, 0.21241283, -0.011421013, 0.004667217, -0.136152, -0.13793777, 0.17264098, -0.025761813) * inp_3_1_0; + result0 += M4(0.010441085, 0.034229126, 0.10410884, 0.0007140697, -0.035234306, -0.20281972, -0.08954763, -0.04823551, -0.024772387, 0.11774257, 0.08591761, 0.03018245, -0.08788433, 0.018554667, -0.034182277, 0.059270818) * inp_3_2_0; + result0 += M4(-0.046677265, 0.17860901, 0.226423, -0.004706376, 0.19468129, -0.20464435, 0.2005496, -0.08843481, -0.17709897, 0.21608044, -0.09500188, -0.0014078907, -0.0823845, -0.008207487, 0.11033482, 0.039437946) * inp_3_0_1; + result0 += M4(0.39077276, -0.63461953, 0.1270757, -0.0005488689, -0.35906503, -0.65365374, -0.42657968, -0.28447995, 0.3077801, 0.5133355, 0.31003663, 0.22172691, -0.3231345, -0.11029882, -0.25303665, 0.17490047) * inp_3_1_1; + result0 += M4(-0.2731292, 0.000310414, -0.15897174, 0.058956403, -0.09936814, -0.07022474, 0.08290902, 0.07600689, 0.17877856, 0.10775786, -0.04695605, -0.03202572, -0.23459665, -0.69781375, 
-0.27533895, -0.15403226) * inp_3_2_1; + result0 += M4(-0.042978965, -0.054180793, 0.1954828, -0.08684577, -0.13747977, -0.20742784, 0.18355459, 0.11388488, 0.11764892, 0.069994465, -0.21684092, -0.051016156, 0.033618942, -0.036646932, -0.1297882, 0.023407396) * inp_3_0_2; + result0 += M4(0.20020427, -0.22712614, 0.10650477, -0.005730161, -0.24823771, -0.1734196, -0.27462947, -0.0036915976, 0.17370144, 0.11744064, 0.21179977, -0.044981353, -0.0793401, 0.08837848, 0.09162515, 0.030376406) * inp_3_1_2; + result0 += M4(-0.1309085, 0.015177464, 0.017351935, -0.006943054, 0.20613031, -0.07015381, 0.12872961, 0.055942796, -0.010101874, 0.054767746, 0.073140666, -0.003368886, -0.03311943, 0.018623969, -0.1904025, -0.07601106) * inp_3_2_2; + result1 += M4(0.09109263, 0.24044237, -0.07368503, 0.09128383, 0.08638873, 0.066008195, 0.017524574, 0.14434199, -0.05134559, 0.016527405, 0.028160872, -0.009478669, -0.021720985, -0.0031434142, 0.055661436, 0.011320767) * inp_3_0_0; + result1 += M4(0.03140381, -0.12361954, -0.2105949, -0.05841093, 0.20608658, -0.0043003242, -0.32436752, 0.108572416, 0.0137622375, 0.123948485, 0.08976507, -0.0005934278, 0.19517872, -0.09666256, 0.27647632, 0.10041602) * inp_3_1_0; + result1 += M4(-0.00084548816, -0.029597878, -0.069973126, -0.15951297, 0.09769574, -0.059322637, -0.034474894, 0.05295799, 0.035118338, 0.07830424, -0.010667201, -0.04336969, 0.12945734, 0.1678381, 0.23533249, 0.19315714) * inp_3_2_0; + result1 += M4(0.09013079, 0.15298937, 0.009327142, -0.33564213, 0.37823164, 0.02959889, -0.20432287, 0.045236036, -0.2741461, -0.046541527, 0.20261943, -0.10205416, 0.14046308, -0.0027450805, 0.21283917, 0.06460282) * inp_3_0_1; + result1 += M4(-0.18491924, -0.21789634, 0.15175304, -0.887086, 0.71517575, 0.22929609, 0.1805253, 0.11580503, -0.68914616, -0.1291275, -0.012994776, -0.47681156, 0.4985886, 0.004125866, 0.11798174, -0.68233013) * inp_3_1_1; + result1 += M4(0.07321497, -0.14313735, -0.105816804, -0.080761194, -0.06267719, 
0.044976983, -0.042560253, -0.074202426, -0.112595245, -0.0060367524, 0.06645215, 0.022692902, 0.45074677, -0.31013855, 0.018929806, -0.080830745) * inp_3_2_1; + result1 += M4(-0.1182609, 0.15505335, 0.14059931, -0.010010356, 0.2792563, 0.021148562, 0.21544349, -0.09246091, -0.19237362, -0.019413901, -0.19110642, 0.15954247, -0.03959726, 0.038067605, -0.06587343, 0.10105769) * inp_3_0_2; + result1 += M4(0.086048566, -0.03875393, -0.010399113, -0.087426275, 0.06872017, -0.06801751, -0.1554103, -0.046588384, -0.072060585, 0.17145237, 0.16459806, 0.2941966, 0.24843049, 0.10976179, 0.0616643, 0.028753892) * inp_3_1_2; + result1 += M4(0.14644687, 0.19136189, -0.012354268, -0.053453315, -0.118824765, 0.007956001, 0.14581923, 0.120377615, 0.08550302, 0.10488886, -0.049412593, 0.04564864, 0.041706, -0.22091928, -0.18077254, -0.07200271) * inp_3_2_2; + result2 += M4(0.12742214, -0.019949354, 0.22852126, 0.009229048, 0.07179215, -0.035888027, -0.06847325, 0.075466916, 0.05451231, 0.04447139, -0.007379507, -0.038457163, 0.0069804247, -0.022739582, 0.015290603, 0.058539122) * inp_3_0_0; + result2 += M4(0.033414926, 0.0688454, -0.01154317, 0.04373435, 0.02220928, 0.07399258, -0.018638128, -0.09049976, 0.14270648, -0.04456102, 0.09852033, 0.095695525, 0.048654117, 0.03194091, -0.2506061, 0.22547816) * inp_3_1_0; + result2 += M4(-0.029927028, -0.018085415, 0.19878025, 0.0600148, 0.15179572, 0.043493457, -0.08094291, 0.05803879, -0.010909439, -0.014285486, 0.15604655, 0.008313019, 0.19220084, -0.024658643, -0.12223889, -0.044626527) * inp_3_2_0; + result2 += M4(0.002232593, -0.117187135, 0.271499, -0.1504283, -0.12024035, -0.15202788, 0.07508506, -0.069154665, 0.14663363, 0.10095183, -0.079744, -0.027517907, 0.12171369, 0.04201386, -0.18390292, -0.08800392) * inp_3_0_1; + result2 += M4(-0.39752677, -0.106147856, 0.31427163, -0.6602043, 0.36713195, 0.1565504, 0.659634, 0.054854617, -0.38186052, -0.14849813, -0.40023437, -0.28087738, -0.28679487, 0.10423841, 0.03607786, -0.32230294) 
* inp_3_1_1; + result2 += M4(0.075212725, 0.05711698, 0.07420369, -0.15664868, 0.1286679, 0.12669285, 0.25749606, -0.3583118, -0.10613531, -0.07323004, -0.27757177, 0.08621346, 0.1296691, -0.031802166, 0.07022488, 0.22773924) * inp_3_2_1; + result2 += M4(-0.068505526, -0.026667738, 0.12101492, 0.070010714, 0.039327346, -0.05554568, -0.10054333, 0.18232317, 0.09161801, 0.073988214, 0.07982679, -0.101606384, 0.1132725, 0.05208842, 0.033680618, 0.0011496624) * inp_3_0_2; + result2 += M4(0.077517726, 0.10946592, 0.118573286, -0.19028679, 0.09755006, -0.044249807, -0.15750827, 0.061594304, -0.034222055, 0.0128054945, -0.03952524, -0.102706864, 0.25461313, 0.10715616, -0.14800839, 0.18352498) * inp_3_1_2; + result2 += M4(0.112083696, -0.026794339, 0.0014270544, 0.2073605, -0.11959005, 0.03181029, 0.07840882, -0.18645816, 0.03743027, -0.03183679, -0.043347996, 0.13866818, 0.12204855, 0.03666218, -0.121538706, 0.057100873) * inp_3_2_2; + result3 += M4(-0.10662995, 0.05697544, -0.10548284, -0.11210752, 0.047840722, 0.123951785, 0.009479878, 0.078141965, 0.011802129, -0.0045969826, -0.022849994, -0.067880586, 0.042395536, -0.0083619, -0.008202702, 0.06660749) * inp_3_0_0; + result3 += M4(0.19675933, 0.052384473, 0.013265036, 0.098756306, -0.018376395, -0.07318726, 0.06631346, 0.10931116, -0.07211753, 0.08561086, -0.058432173, -0.018883526, -0.2426171, -0.10608711, -7.214139e-05, 0.07174066) * inp_3_1_0; + result3 += M4(-0.10734781, -0.029677497, -0.0359158, 0.019730724, 0.12103277, 0.050042972, 0.047522116, 0.037930418, -0.12674676, -0.085192285, -0.10322901, -0.028011028, -0.23943996, -0.08027147, 0.035006125, -0.05514018) * inp_3_2_0; + result3 += M4(-0.19616649, 0.15140127, -0.09350769, -0.12153282, -0.2692576, 0.17027298, -0.09067922, -0.099699005, 0.23312636, -0.08758269, 0.0017002, 0.01240649, 0.011466379, -0.07665326, -0.009166553, 0.1272778) * inp_3_0_1; + result3 += M4(-0.10554337, -0.28817138, 0.039271317, 0.041808035, -0.44556034, 0.76822776, -0.30355525, 
0.2162305, 0.33683625, -0.52597344, 0.24986169, -0.14621596, 0.18584943, -0.18752898, 0.1542312, -0.032974835) * inp_3_1_1; + result3 += M4(0.16487968, 0.07279231, 0.03802793, 0.10356195, -0.07914432, 0.060889, -0.23647681, 0.08861426, 0.14644763, 0.039211847, 0.08409845, -0.13739991, 0.021675752, -0.1462796, 0.20126085, 0.04228552) * inp_3_2_1; + result3 += M4(0.04344281, 0.1361205, 0.043024268, 0.022378847, 0.14772795, 0.25472307, -0.06886387, 0.036575425, -0.10773756, -0.46079612, 0.0655881, 0.045242745, -0.011777071, -0.31816006, 0.03709428, 0.083959974) * inp_3_0_2; + result3 += M4(-0.105607435, 0.0121534355, -0.076223634, 0.15062469, 0.010016192, -0.03524558, 0.045847397, 0.061889775, 0.016607437, -0.05810039, 0.09952769, -0.03271708, 0.10818878, -0.1336954, 0.0047579217, -0.118375205) * inp_3_1_2; + result3 += M4(-0.14107881, -0.1570039, -0.0175814, -0.0017515017, 0.029902417, 0.11668936, 0.00097337883, 0.14668427, -0.11713396, -0.12998298, -0.0028004094, -0.07370321, 0.014416133, -0.06064584, -0.014360191, -0.18469594) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(0, 1), result2); + imageStore(out_image, output_base + ivec2(1, 1), result3); +} + +//!DESC ArtCNN C4F16 (Conv2D-6) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d +//!BIND conv2d_5 +//!SAVE conv2d_6 +//!WIDTH LUMA.w 1.0 * +//!HEIGHT LUMA.h 1.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); 
+const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.08412104, 0.07971554, 0.08434169, 0.076244); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.079171985, -0.0069937697, -0.0210708, -0.033105504, -0.023817735, -0.011238646, -0.043035787, -0.02440147, 0.016872514, 0.03719572, -0.0036019788, 0.012509292, 0.1484504, 0.10084735, 0.06727001, 0.09289472) * inp_0_0_0; + result0 += M4(-0.090545304, -0.16164127, 0.019691145, 0.045617487, 0.0029133197, 
-0.011457896, -0.1087185, -0.022287082, 0.007693777, -0.1557534, 0.119432844, 0.048796117, 0.01886607, 0.13466214, 0.055788144, 0.011069647) * inp_0_1_0; + result0 += M4(0.019721841, -0.04018983, -0.010603011, -0.041139323, -0.013923174, -0.0069041494, -0.03181753, -0.07459869, -0.032918666, 0.004894833, -0.01307685, 0.038587816, 0.092926815, 0.04549454, 0.06285106, 0.03428836) * inp_0_2_0; + result0 += M4(0.1622716, -0.07768257, -0.013204322, 0.026763849, 0.0012736389, -0.09754597, 0.13953719, -0.07492267, 0.016014466, 0.055583894, 0.07073988, 0.007828915, 0.17086188, 0.109315015, 0.16700633, 0.119697236) * inp_0_0_1; + result0 += M4(0.079182394, 0.2656691, -0.13238232, -0.17505214, -0.23513712, 0.16317949, -0.18635502, 0.3353578, -0.10498728, 0.011073413, -0.10075553, -0.17032194, 0.19368632, 0.19305302, 0.15070842, 0.23248452) * inp_0_1_1; + result0 += M4(-0.002185805, 0.11091493, 0.051263936, 0.041181523, 0.062277913, -0.062091295, 0.03607194, -0.10375673, -0.010489046, -0.01102331, -0.041805126, 0.065893725, 0.15395595, 0.18233144, 0.15172338, 0.21679255) * inp_0_2_1; + result0 += M4(-0.030508783, -0.004990037, 0.0329664, 0.010637486, 0.005623188, -0.003358061, 0.0080712475, 0.00046784236, 0.040540207, 0.004353267, 0.0534382, -0.010169058, 0.10396432, 0.025561178, 0.18441953, 0.004519026) * inp_0_0_2; + result0 += M4(-0.04412904, -0.07338797, 0.06732339, 0.061310094, 0.08977347, 0.04197968, 0.10037899, -0.03313243, 0.029916203, 0.021829529, -0.08954633, 0.08445129, 0.035676997, 0.06716942, 0.06353302, 0.1767009) * inp_0_1_2; + result0 += M4(-0.016475134, -0.01597473, -0.006870764, 0.07254226, 0.052580874, 0.030486876, 0.078329995, 0.02920045, 0.024402283, 0.02916857, 0.008138189, -0.07570842, 0.061067346, 0.12795751, 0.07376389, 0.10487863) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 
= inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.10219679, -0.0016633151, -0.08416798, -0.06091891, -0.023262773, -0.126822, 0.0497739, -0.001825667, -0.03078599, 0.04718741, 0.0043902365, -0.0053807287, 0.032797694, 0.06849138, -0.02102451, 0.0029395863) * inp_1_0_0; + result0 += M4(0.029171623, -0.119060196, -0.15731424, -0.010288389, 0.044039175, 0.03523954, 0.19108313, 0.0034680488, 0.022408625, -0.100109026, 0.013178398, 0.021233274, 0.02033905, -0.1076448, 0.05507044, 0.042807907) * inp_1_1_0; + result0 += M4(-0.058946244, 0.07518282, -0.0218126, -0.008712151, -0.076766334, 0.05434428, -0.022394644, 0.11280125, -0.07020608, 0.064211406, -0.01466337, 0.04543824, 0.04098286, -0.05094307, 0.017451143, -0.015480388) * inp_1_2_0; + result0 += M4(-0.050165318, -0.11767163, 0.037600912, -0.0783747, -0.04539349, -0.031150874, -0.08755638, -0.14933577, 0.07179043, -0.00836788, -0.08889254, 0.024585087, -0.08558388, 0.006760057, 0.05268061, 0.03279828) * inp_1_0_1; + result0 += M4(0.194146, 0.026081745, 0.22553095, 0.055226117, 0.09558362, 0.056916, -0.14006428, 0.009533805, -0.048172764, 0.06694457, 0.016996864, 0.010374402, 0.1303292, -0.0043800916, -0.06218835, 0.15707439) * inp_1_1_1; + result0 += M4(0.035268318, 0.11117023, -0.0024920474, 0.053387403, 0.0001125205, 0.03284727, -0.041436322, -0.11381764, 0.036874335, -0.05483726, 0.01669829, 0.047346413, 0.01582249, 0.024571301, 0.03841291, 0.0001531784) * inp_1_2_1; + result0 += M4(-0.039766025, -0.013582949, -0.047067195, 0.019274479, -0.0064281444, -0.028889643, -0.03691507, -0.025142971, -0.009235927, -0.014399523, 0.0068894643, 0.018320393, -0.009533652, 0.0047507705, -0.051280286, 
-0.006059686) * inp_1_0_2; + result0 += M4(-0.008069688, 0.06869032, 0.06720618, -0.039600242, 0.01939327, -0.04401731, 0.16278408, 0.050619956, -0.011940157, -9.242871e-06, -0.005613433, -0.06478905, -0.04764991, -0.00894034, -0.023979772, -0.14476714) * inp_1_1_2; + result0 += M4(0.034411438, -0.023818584, 0.036871288, 0.0619627, -0.02687395, -0.024658777, -0.009806786, 0.098166026, 0.04545056, -0.0035166715, 0.04391233, -0.09520481, -0.022824388, -0.02932159, -0.019960575, -0.013126476) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.042513143, 0.036193915, 0.009267334, 0.02318279, -0.08882127, -0.06790481, -0.025598435, -0.055786755, 0.003923015, 0.08367141, -0.02124261, -0.0036895827, 0.0665154, -0.061491456, -0.010962831, 0.016966973) * inp_2_0_0; + result0 += M4(-0.08984092, 0.014150137, 0.0010094845, -0.0013944331, -0.05288092, 0.014116327, 0.035593804, 0.020797336, 0.04860784, -0.100140445, 0.043347888, 0.03942333, -0.06728835, 0.14273663, 0.026525293, -0.07449118) * inp_2_1_0; + result0 += M4(0.037428003, -0.08130763, -0.010963262, -0.066873446, 0.05335851, 0.13654499, 0.032492008, 0.045801986, 0.009653935, 0.021689994, 0.025831793, 0.03277937, -0.025519112, 0.043301772, -0.0030657381, 0.046498533) * inp_2_2_0; + result0 += M4(0.0417986, 0.08424531, 0.04000319, 0.09104747, -0.16142552, -0.021476395, -0.19967215, -0.037973598, -0.048555277, 0.032703213, -0.033633802, 0.10496307, 0.057205033, -0.055697214, 
0.097497426, -0.08111985) * inp_2_0_1; + result0 += M4(-0.061038256, -0.24523515, -0.3324259, -0.2994336, -0.41386676, -0.3934725, -0.2869577, -0.27902487, -0.053344678, -0.14278612, -0.15018024, -0.20823519, -0.034474645, -0.116564386, -0.0512445, 0.043638732) * inp_2_1_1; + result0 += M4(-0.11793706, -0.024524925, -0.07900098, -0.06977263, 0.4436866, 0.095661, 0.44399175, 0.16541167, 0.017248677, 0.017089522, 0.0531066, 0.044330012, 0.0172881, 0.015262031, 0.06628099, 0.11591024) * inp_2_2_1; + result0 += M4(0.034315176, 0.012758982, 0.098702334, 0.017511975, -0.06429503, 0.010301114, -0.1138796, 0.018430594, -0.011578993, 0.0050334428, 0.022777617, 0.036444314, -0.021219404, 0.022264466, -0.036809668, -0.015400894) * inp_2_0_2; + result0 += M4(0.018624214, -0.04151733, 0.14313662, 0.023933941, 0.12591304, 0.046684355, -0.065231994, -0.067107506, 0.017609427, 0.10223146, 0.07743975, -0.12169869, 0.009158939, -0.025597682, -0.08834877, -0.079456866) * inp_2_1_2; + result0 += M4(-0.0021108948, 0.014920775, 0.00642783, -0.022019196, 0.12250748, 0.1506987, 0.16710696, 0.15760566, -0.01257941, 0.0050026863, -0.00019434035, 0.066300645, -0.00047425524, 0.03707401, 0.001639517, 0.026377758) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.03845043, 0.008121379, -0.04463431, -0.021435143, -0.0154112475, 0.008068699, 0.005275401, -0.008412226, 0.011113799, -0.0042059543, 0.021885974, 0.0046847453, -0.097053245, -0.07207643, 
-0.016230254, -0.057805564) * inp_3_0_0; + result0 += M4(0.020068355, -0.059013963, 0.042093556, 0.007965266, 0.006641936, 0.0053823865, -0.04869122, -0.023604743, -0.05277748, -0.08194451, -0.059982788, -0.052345853, -0.033831976, -0.07052958, 0.027305871, 0.022747202) * inp_3_1_0; + result0 += M4(-0.03663662, 0.027668301, -0.005128969, 0.04180462, -0.07902732, 0.07694945, -0.037715025, 0.025260974, 0.017048629, 0.05412875, 0.029637456, 0.04848225, -0.055232473, -0.090560995, -0.052049804, -0.053691596) * inp_3_2_0; + result0 += M4(-0.041993283, -0.06591007, 0.06993194, -0.014823973, -0.029537756, 0.02038244, -0.05351582, 0.07256843, 0.01772454, -0.04179623, 0.019432299, 0.023107331, -0.03684704, 0.012458426, -0.06536513, 0.03873883) * inp_3_0_1; + result0 += M4(0.19751841, 0.2748706, -0.24543872, -0.079816476, 0.11848018, -0.26794544, 0.11034708, -0.16498065, -0.51390487, -0.41391793, -0.39137235, -0.3589357, 0.37141094, 0.3205968, 0.35281453, 0.25800362) * inp_3_1_1; + result0 += M4(0.03477724, 0.005542787, 0.0653558, -0.0044532754, -0.06219415, 0.13614522, -0.113096826, 0.04641227, 0.047544006, -0.011667869, 0.0035703634, 0.006406095, -0.10998655, -0.14912339, -0.102509305, -0.1656886) * inp_3_2_1; + result0 += M4(-0.015407814, -0.016495913, -0.036472354, -0.009568684, -0.0074188295, 0.021021923, 0.011698857, 0.019404247, 0.09597954, 0.059281915, 0.2022051, 0.05709749, -0.034792032, 0.014734844, -0.041519232, 0.02060852) * inp_3_0_2; + result0 += M4(-0.026737554, -0.05625069, 0.069094196, 0.013394634, 0.06341689, -0.005378102, 0.101725005, -0.05227663, 0.18010192, 0.17765583, 0.042139824, 0.15793523, 0.14893357, 0.057833694, 0.09549699, -0.004848631) * inp_3_1_2; + result0 += M4(-0.015824724, -0.022639401, -0.011159335, -0.0022217152, 0.0025551994, 0.0073573054, 0.011508081, 0.09528377, 0.09761966, 0.17366165, 0.11282759, 0.1593583, -0.014511227, -0.007068555, -0.021812135, -0.03897337) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * 
ivec2(1, 1); + imageStore(out_image, output_base + ivec2(0, 0), result0); +} + +//!DESC ArtCNN C4F16 (Depth-To-Space) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d_6 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +void hook() { + vec4 result = vec4(0.0, 0.0, 0.0, 1.0); + vec2 f0 = fract(conv2d_6_pos * conv2d_6_size); + ivec2 i0 = ivec2(f0 * vec2(2.0)); + result.x = conv2d_6_tex((vec2(0.5) - f0) * conv2d_6_pt + conv2d_6_pos)[i0.y * 2 + i0.x]; + imageStore(out_image, ivec2(gl_GlobalInvocationID), clamp(result, 0.0, 1.0)); +} diff --git a/shaders/ArtCNN_C4F16_DS.glsl b/shaders/ArtCNN_C4F16_DS.glsl new file mode 100644 index 0000000..98d51c0 --- /dev/null +++ b/shaders/ArtCNN_C4F16_DS.glsl @@ -0,0 +1,1407 @@ +// MIT License + +// Copyright (c) 2024 Joao Chrisostomo, Kacper Michajłow + +// Permission is hereby granted, free of charge, to any person obtaining a copy +// of this software and associated documentation files (the "Software"), to deal +// in the Software without restriction, including without limitation the rights +// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +// copies of the Software, and to permit persons to whom the Software is +// furnished to do so, subject to the following conditions: + +// The above copyright notice and this permission notice shall be included in all +// copies or substantial portions of the Software. + +// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE +// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +// SOFTWARE. + +//!DESC ArtCNN C4F16 DS (Conv2D) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND LUMA +//!SAVE conv2d +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared F inp[1][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(1, 1); + inp[0][y][x] = F(LUMA_mul * texelFetch(LUMA_raw, input_base + ivec2(0, 0), 0).x); + } + } + + barrier(); + V4 result0 = V4(-0.0049340418, -0.012793901, -0.01654616, -0.04911682); + V4 result1 = V4(-0.029540002, -0.0068046413, -0.00023085524, -0.00035294317); + V4 result2 = V4(0.029907363, -0.004545475, -0.0008227237, -0.00086534343); + V4 result3 = V4(-0.002919027, 0.002460784, 0.012082119, -0.063332476); + const F inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const F inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const F inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const F inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const F inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const F inp_0_2_1 = 
inp[0][local_xy.y + 1][local_xy.x + 2]; + const F inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const F inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const F inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += V4(-0.028834578, -0.14101993, 0.007882108, 0.03927023) * inp_0_0_0; + result0 += V4(0.0381181, 0.15082009, 0.1299179, 0.124353915) * inp_0_1_0; + result0 += V4(-0.0026651656, 0.10701949, -0.10302223, 0.06252015) * inp_0_2_0; + result0 += V4(-0.017014246, 0.056569446, 0.013070459, 0.1673612) * inp_0_0_1; + result0 += V4(-0.039012846, -0.083705, -0.3763227, 0.27351955) * inp_0_1_1; + result0 += V4(-0.21789941, -0.13512278, 0.107165866, 0.11088684) * inp_0_2_1; + result0 += V4(0.026416743, 0.15055776, -0.026394987, 0.09503178) * inp_0_0_2; + result0 += V4(0.11317181, -0.09849969, 0.24554619, -0.006209404) * inp_0_1_2; + result0 += V4(0.18810558, 0.015041951, 0.01617648, 0.09057816) * inp_0_2_2; + result1 += V4(0.078574546, -0.07280724, -0.09120986, 0.019795248) * inp_0_0_0; + result1 += V4(-0.067474775, -0.019562894, -0.0067152088, -0.18367955) * inp_0_1_0; + result1 += V4(0.05455347, 0.11168705, 0.07079753, 0.14639775) * inp_0_2_0; + result1 += V4(-0.05000137, 0.09589531, 0.09779115, -0.038142927) * inp_0_0_1; + result1 += V4(0.104602836, -0.16130356, 0.14888051, 0.17604049) * inp_0_1_1; + result1 += V4(-0.11296293, 0.26848587, -0.21014185, -0.13524422) * inp_0_2_1; + result1 += V4(0.06099483, -0.023948722, 0.022344239, 0.013350393) * inp_0_0_2; + result1 += V4(0.09386803, -0.23937507, -0.13151713, 0.025719114) * inp_0_1_2; + result1 += V4(-0.05785345, 0.062087506, 0.10226412, -0.022276009) * inp_0_2_2; + result2 += V4(-0.06026112, 0.10904248, -0.11761055, -0.06018391) * inp_0_0_0; + result2 += V4(0.085813195, -0.03787966, 0.16202296, 0.0041552093) * inp_0_1_0; + result2 += V4(0.060139276, -0.005811277, 0.0070230174, -0.0069510895) * inp_0_2_0; + result2 += V4(-0.17221731, 0.28638083, 0.34320375, 0.17658837) * inp_0_0_1; + result2 
+= V4(-0.27984276, -0.7016683, -0.30903038, -0.08029049) * inp_0_1_1; + result2 += V4(0.13250893, 0.124444515, -0.059002075, -0.04446707) * inp_0_2_1; + result2 += V4(0.03323799, 0.12117096, -0.14812368, -0.036965195) * inp_0_0_2; + result2 += V4(0.1977777, 0.06994207, 0.10603352, 0.16904502) * inp_0_1_2; + result2 += V4(-0.1536847, -0.004283535, 0.009282772, -0.12100757) * inp_0_2_2; + result3 += V4(0.059486274, -0.11239365, 0.21015224, -0.090100385) * inp_0_0_0; + result3 += V4(-0.15950659, 0.18551329, 0.34821057, 0.16747488) * inp_0_1_0; + result3 += V4(0.010258027, -0.029954039, 0.05202862, 0.056675363) * inp_0_2_0; + result3 += V4(0.036862228, -0.003042499, 0.028995909, -0.18852086) * inp_0_0_1; + result3 += V4(0.017469667, -0.1588153, -0.38980985, -0.008847585) * inp_0_1_1; + result3 += V4(0.042114146, 0.12621936, -0.17563884, 0.20885424) * inp_0_2_1; + result3 += V4(-0.06928606, 0.10595441, -0.058485802, -0.073390864) * inp_0_0_2; + result3 += V4(0.090648934, -0.04735434, -0.15482384, 0.026818749) * inp_0_1_2; + result3 += V4(-0.013016346, -0.06682891, -0.024198746, 0.16552028) * inp_0_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(0, 1), result2); + imageStore(out_image, output_base + ivec2(1, 1), result3); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-1-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d +//!SAVE conv2d_1 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; 
+const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.011309091, 0.011720209, 0.07717452, 0.012043687); + V4 result1 = V4(0.04592391, -0.009706806, -0.011586145, 0.014143103); + V4 result2 = V4(0.012079102, 0.02975359, 0.008218081, 0.01839072); + V4 result3 = V4(0.0058121867, -0.0034202328, 0.0009524132, -0.02947478); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.09877198, 0.38928044, -0.09383465, 0.079032965, 0.107005835, 0.1136302, 0.041581154, -0.052157145, -0.35730338, 0.27816653, -0.06807881, -0.067746386, -0.006262232, -0.06413886, -0.12926531, 0.028121412) * inp_0_0_0; + result0 += M4(-0.2730201, 0.12183424, -0.000594066, 0.06456225, 0.63564765, 0.16603222, -0.011430876, 
0.10374776, -0.5786755, -0.52282465, -0.15073062, 0.017066224, -0.36250365, 0.09160107, 0.039119765, 0.10774151) * inp_0_1_0; + result0 += M4(0.30126116, -0.1014905, 0.08349073, 0.0063151238, 0.120676085, -0.17403236, 0.18270256, -0.057362948, -0.28110328, 0.106739074, -0.035695158, 0.06990916, -0.09574672, -0.018324012, -0.09960064, -0.057645217) * inp_0_2_0; + result0 += M4(-0.17198816, -0.093343705, -0.006382152, -0.18036872, -0.2148838, -0.17424193, 0.22078043, -0.1732282, 0.26076397, 0.1474919, -0.01922907, 0.010837412, 0.028024467, 0.07845438, -0.015646966, 0.027136652) * inp_0_0_1; + result0 += M4(-0.043947384, -0.15946668, -0.046214677, -0.11894077, -0.4706527, 0.20794135, 0.07293495, -0.035387393, -0.46785754, 0.65764594, 0.039504908, -0.4142682, 0.034218732, 0.032816306, 0.106478676, 0.12423036) * inp_0_1_1; + result0 += M4(-0.3440009, 0.024391247, -0.0644611, -0.07619978, -0.4256126, -0.10989194, -0.057316273, -0.05037822, 0.2577093, 0.07522628, 0.060620584, -0.13478145, -0.046803165, 0.06498437, 0.05821759, 0.040200662) * inp_0_2_1; + result0 += M4(0.079720534, 0.049182344, -0.01734871, 0.2098411, -0.06080854, -0.10493844, -0.0061250627, 0.23049541, 0.27885517, -0.18456793, 0.04471378, -0.1519946, -0.047879137, -0.05675035, -0.11165134, -0.020727035) * inp_0_0_2; + result0 += M4(0.05443745, 0.012744339, -0.051926363, 0.12922677, 0.08167649, 0.09113499, -0.06406348, 0.45999956, 0.25078163, -0.18583958, -0.27785185, 0.8986888, 0.0048544668, -0.040135045, -0.060791086, 0.022054149) * inp_0_1_2; + result0 += M4(-0.15824191, -0.063602105, 0.024466638, 0.018670492, 0.18217057, -0.2717177, -0.16882227, -0.17058909, 0.119718775, -0.08420973, 0.12789485, -0.10119966, 0.043762792, -0.070947856, 0.04055627, -0.07537116) * inp_0_2_2; + result1 += M4(-0.07460643, -0.054178257, 0.00027177262, 0.184799, -0.046359397, 0.059696186, 0.033557095, 0.07526354, 0.07089547, -0.07476439, -0.035536528, 0.024276823, 0.07413596, -0.06979502, -0.06169341, -0.12059578) * inp_0_0_0; 
+ result1 += M4(0.14608821, -0.07439824, 0.03865178, -0.086880915, -0.11553095, 0.11800374, 0.13214925, 0.046812996, -0.037123796, -0.018989379, -0.05062097, 0.0021832588, 0.13339424, -0.055192936, -0.11149385, -0.04801339) * inp_0_1_0; + result1 += M4(0.10018024, 0.0015277287, 0.024594266, -0.10473088, -0.10727858, 0.2637988, 0.0025090645, -0.027918315, 0.08310345, 0.11183597, -0.11561776, 0.10297722, -0.112052426, -0.0393831, -0.06215935, 0.14460996) * inp_0_2_0; + result1 += M4(-0.045010846, 0.2596987, -0.061746594, 0.3915752, -0.1178524, -0.040817495, 0.15932876, 0.18028739, -0.060169153, 0.28849506, -0.059507165, 0.07859005, 0.058386788, -0.060939044, -0.03840868, -0.10951335) * inp_0_0_1; + result1 += M4(0.11402059, -0.18600419, 0.20650828, -0.040762946, 0.20945579, -0.22200839, -0.07005221, -0.11765, -0.20845462, 0.18816432, 0.9522476, -0.036692392, 0.16586697, 0.068688564, -0.11158684, -0.08792759) * inp_0_1_1; + result1 += M4(0.05377238, -0.15907322, -0.07312733, -0.10462031, -0.08407747, -0.14599952, 0.20981629, -0.044482782, 0.400037, -0.1437334, 0.0788931, 0.042104036, -0.20607647, 0.08861181, -0.032842077, 0.023695804) * inp_0_2_1; + result1 += M4(0.04181302, -0.060805034, -0.101417646, -0.17794839, 0.168702, -0.51052046, -0.095897056, -0.013912092, 0.038582865, 0.05309609, -0.06728378, 0.341196, -0.017040616, -0.06550378, 0.11086736, -0.042624153) * inp_0_0_2; + result1 += M4(0.11940134, -0.12056612, -0.13654755, -0.026973963, 0.15465894, 0.029888792, -0.49261746, -0.22650442, 0.015893001, -0.44998038, -0.7092512, -0.24032496, 0.07558687, 0.03830741, 0.078829594, 0.06326567) * inp_0_1_2; + result1 += M4(0.18127115, -0.065435536, -0.07445673, -0.0049071168, 0.01085999, -0.0077388254, -0.064653255, -0.09067383, 0.026689146, -0.08541669, -0.060653634, -0.08493797, -0.14466925, -0.11301376, 0.058424987, 0.09166556) * inp_0_2_2; + result2 += M4(-0.13080364, -0.08167301, -0.463303, -0.70742375, 0.077425644, -0.021687286, 0.035808627, -0.39734727, 
-0.1559171, -0.21604316, 0.39925998, -0.3012099, 0.016638095, -0.08232811, 0.03377222, 0.031966764) * inp_0_0_0; + result2 += M4(0.14442822, 0.12295271, 0.029818185, 0.0359594, 0.04060354, 0.015188929, -0.0029900323, -0.23532009, 0.2359964, 0.14970055, 0.017785046, -0.52034444, 0.059353128, 0.10592766, -0.05263293, -0.10214093) * inp_0_1_0; + result2 += M4(0.122345954, 0.32518455, -0.13197717, -0.2253006, 0.06691174, 0.052411076, 0.100197494, -0.26456442, -0.030602941, 0.2827907, -0.31574076, -0.14921468, -0.05038948, -0.16915296, -0.10316771, -0.02792467) * inp_0_2_0; + result2 += M4(-0.08198538, -0.10204986, 0.5690069, -0.09734485, -0.028890003, -0.15102413, 0.44935277, -0.024167726, -0.015774969, -0.0887488, -0.51489425, 0.43573058, 0.07211464, 0.086417206, -0.029778117, 0.0897787) * inp_0_0_1; + result2 += M4(-0.11789364, 0.06326017, 0.13353379, 0.14045511, -0.097247526, 0.13069586, 0.18198517, 0.07585104, -0.46691963, -0.12969762, 0.12990327, 0.10933748, 0.22077899, 0.08396143, 0.11584505, 0.06981046) * inp_0_1_1; + result2 += M4(-0.15274513, -0.019888762, 0.21179429, -0.08906937, -0.048165828, 0.2743937, -0.05530385, 0.08738966, -0.077265665, 0.31894842, -0.05136382, 0.12788285, 0.09329922, -0.047389865, 0.08291986, 0.1473245) * inp_0_2_1; + result2 += M4(-0.108804405, -0.023400303, -0.2225971, 0.101814784, 0.048623733, -0.14735846, -0.38235044, 0.2508335, 0.0006776365, 0.05468187, 0.56234205, -0.09719959, -0.05784428, -0.015568528, 0.0027001353, -0.08191959) * inp_0_0_2; + result2 += M4(0.0972354, -0.06312126, 0.022070305, 0.120524995, 0.50088096, 0.090986624, -0.05814756, 0.20085476, 0.560176, -0.016112555, -0.08229239, 0.012685615, -0.18278423, 0.109280005, -0.022708299, -0.14846179) * inp_0_1_2; + result2 += M4(0.03168514, 0.09864207, -0.09442118, -0.024364354, -0.10918896, 0.06662421, -0.091709755, 0.05298994, -0.036009606, -0.15768065, -0.10558869, -0.05636757, -0.062536, -0.09078685, -0.03775271, -0.05907822) * inp_0_2_2; + result3 += M4(0.16951673, 
0.13079187, 0.15705979, -0.15498151, 0.07683223, -0.06972948, 0.1610643, 0.017183576, 0.017889338, -0.123466015, -0.18230678, 0.020653097, -0.028243298, -0.0455674, -0.0099932505, 0.15229751) * inp_0_0_0; + result3 += M4(-0.14118189, -0.07251147, -0.124787614, -0.031930055, 0.0014606286, 0.061471842, 0.12428364, 0.09564553, 0.08472746, -0.054346558, -0.3817292, 0.018670253, -0.0053583533, 0.057495654, -0.006340129, -0.04558433) * inp_0_1_0; + result3 += M4(-0.22084264, 0.072441526, 0.016335221, 0.061928593, -0.034427874, -0.052877698, 0.031620156, 0.02055477, -0.24549209, -0.28623292, 0.11228471, 0.10617587, 0.0035924714, 0.057636518, -0.0062976037, -0.09103348) * inp_0_2_0; + result3 += M4(0.22203928, 0.0001094966, -0.28109252, 0.14876871, 0.20899206, -0.13489018, 0.15935789, 0.13730305, 0.067521155, -0.17813672, 0.073929176, -0.47425798, -0.14579837, -0.12225127, 0.026552638, 0.09890729) * inp_0_0_1; + result3 += M4(-0.08939892, -0.038700964, -0.023869948, -0.025948375, -0.28878126, 0.06866243, -0.17241889, 0.16191031, 0.48571798, 0.0033233624, 0.5171774, 0.27048627, -0.024863949, 0.10009337, -0.054171123, 0.021327967) * inp_0_1_1; + result3 += M4(-0.0026751498, 0.01677554, -0.114878856, 0.07205768, -0.33671686, -0.20127785, -0.269759, 0.013932504, -0.38406572, -0.3358019, 0.015354786, 0.020901006, 0.13394894, -0.11160113, -0.09172442, -0.02606201) * inp_0_2_1; + result3 += M4(0.02983239, 0.065238595, -0.08852208, 0.041396923, 0.03438514, 0.52203476, 0.09024649, 0.08568877, -0.11356743, -0.06145079, 0.16605784, -0.0046695387, -0.07753392, -0.04085484, -0.04211701, 0.042229425) * inp_0_0_2; + result3 += M4(-0.0152936075, -0.30379444, -0.03498485, -0.059613615, 0.0010579604, 0.03850498, -0.5338625, -0.18131024, -0.010662432, 0.95364696, -0.3127961, 0.10594221, 0.013022731, 0.1168128, 0.0039640763, -0.008202392) * inp_0_1_2; + result3 += M4(-0.04573058, 0.12372858, -0.22841553, 0.07078649, 0.13948447, 0.034082845, 0.19417766, -0.12902696, -0.027753403, 0.1267231, 
-0.397033, 0.011799876, 0.03935273, -0.0021190709, -0.011170245, -0.010836182) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.8353019, -0.03079682, -0.048795003, 0.035018213, -0.23654273, 0.07702494, 0.2094514, -0.03364075, -0.7785589, 0.48244116, -0.15566188, -0.02168974, -0.2537349, 0.55893207, -0.11559338, 0.056175552) * inp_1_0_0; + result0 += M4(-0.36740738, 0.11978992, 0.0896231, 0.026315548, 0.61221665, -0.37786412, -0.011924415, -0.25350574, 0.7978943, -0.051793884, 0.12227405, -0.11176683, -0.33257982, -0.033167973, -0.080166414, 0.0071900175) * inp_1_1_0; + result0 += M4(0.30219695, 0.19819108, -0.051961806, 0.032858204, 0.13871473, 0.04834231, 0.0116140265, 0.023473512, -0.3913116, -0.5835288, 0.09242092, 0.13168785, 0.06345958, -0.2336482, -0.2062129, 0.07203379) * inp_1_2_0; + result0 += M4(-0.36866486, -0.06509952, 0.106615335, -0.10289987, -0.10938692, -0.016172621, -0.16599819, 0.039859798, -0.05009089, -0.3045099, 0.016047738, 0.14461611, -0.32650867, 0.4984813, 0.22866598, 0.15623319) * inp_1_0_1; + result0 += M4(0.1897873, -0.39516336, 0.09100719, 0.08683436, -0.13866301, 0.26886114, 0.02321497, 0.09762188, 0.015329164, 0.2783753, 0.08462078, 0.041773602, 0.87116414, -0.77580714, -0.25930312, 0.2847646) * inp_1_1_1; + result0 += M4(-0.16257232, 0.08016403, -0.11788802, -0.1697364, -0.22687338, -0.0767716, -0.13487695, 0.12317228, -0.14794314, 0.378525, -0.07111922, -0.14637247, 0.3404566, 0.6845142, 
-0.06920808, 0.13534123) * inp_1_2_1; + result0 += M4(0.019833196, 0.14731897, -0.025829142, 0.102971524, 0.09881936, -0.14266418, -0.055933498, 0.08291914, 0.31677926, 0.15038142, -0.1840297, 0.035697404, 0.0027101748, 0.07143232, -0.29017213, 0.32565188) * inp_1_0_2; + result0 += M4(0.08040377, -0.04806, 0.111961365, -0.18063085, 0.04080433, 0.03362372, 0.004829591, 0.19333047, 0.0032951036, 0.116119325, 0.15918833, 0.09558537, -0.107474156, -0.014522343, 0.35576323, -0.93175983) * inp_1_1_2; + result0 += M4(-0.11092724, 0.15114045, -0.28484997, 0.04351722, 0.14012209, -0.038325023, -0.024206607, -0.15268601, 0.20977294, -0.552664, 0.11712065, -0.08422484, -0.030889055, -0.48031336, -0.026412616, -0.06320308) * inp_1_2_2; + result1 += M4(-0.29958254, -0.109615885, 0.029395718, 0.016319282, 0.26873666, 0.3702847, 0.09765828, 0.14932635, 0.14159209, 0.095116585, 0.16584423, -0.09755582, 0.019258445, -0.060782902, -0.2806007, -0.1301911) * inp_1_0_0; + result1 += M4(0.10790642, 0.030600157, -0.038562354, -0.026029062, -0.2230801, 0.1270215, 0.18553448, -0.08388566, 0.09725127, -0.05428193, 0.16844873, 0.2568333, 0.12408434, -0.16046543, -0.0019557131, 0.016269071) * inp_1_1_0; + result1 += M4(0.13869679, 0.05662262, 0.10610408, -0.042847093, -0.07361296, -0.06860708, 0.11945361, -0.010420255, -0.26884106, 0.22707044, -0.107094064, 0.103328854, 0.17813848, -0.26080275, -0.095853835, -0.016011981) * inp_1_2_0; + result1 += M4(-0.025391787, -0.5703227, 0.06401796, -0.34907568, 0.10032994, 0.39301944, 0.016423864, 0.4536823, -0.11761743, -0.112939045, -0.024434509, 0.13416661, -0.24094307, -0.4419523, 0.00059161003, -0.46946138) * inp_1_0_1; + result1 += M4(0.35361376, 0.06384827, -0.16368373, 0.1610783, -0.2828763, 0.033816554, -0.13143909, -0.30080402, 0.16076425, -0.22998048, -0.47442713, -0.30463502, 0.3944553, 0.048345, -0.2522477, 0.11306068) * inp_1_1_1; + result1 += M4(0.24947502, 0.07821673, 0.14102261, 0.007180845, -0.11125239, 0.055846, 0.012407736, 
-0.11969543, -0.26606387, -0.18257982, 0.14033502, 0.1393476, 0.12760912, 0.095806316, -0.1708761, -0.09545417) * inp_1_2_1; + result1 += M4(-0.1447064, -0.4311559, -0.006957143, -0.23297, 0.29948533, 0.39930835, -0.14382444, 0.8876203, -0.15697467, -0.1968718, -0.11124502, -0.2506147, 0.18206203, 0.051802326, -0.09965735, 0.2832789) * inp_1_0_2; + result1 += M4(0.10724873, 0.016814586, 0.21944435, 0.23991458, -0.16073646, -0.015581932, -0.3656503, -0.19130723, 0.21842504, 0.3039945, 0.12558551, -0.22017072, -0.05429101, 0.67426455, 1.0007616, 0.28180587) * inp_1_1_2; + result1 += M4(0.22271243, -0.11349672, -0.21032788, -0.163929, -0.28222632, 0.13967724, -0.017861396, 0.06513735, -0.13312815, 0.1615168, 0.11318072, 0.09575312, -0.20077147, -0.16503984, 0.11308297, 0.025842024) * inp_1_2_2; + result2 += M4(-0.059448976, 0.014798713, 0.57572407, -0.4970689, 0.19702779, 0.13581169, -0.19225039, 0.6739382, -0.15882425, -0.051979855, -0.97899884, -0.22377504, -0.030026965, -0.113155484, 0.24761347, -0.719494) * inp_1_0_0; + result2 += M4(-0.03346012, 0.109789826, 0.20284073, -0.018877316, -0.13332081, -0.25938398, -0.014910783, -0.18132773, -0.20557809, 0.21696718, 0.106756255, 0.23250414, -0.27276435, -0.00024258936, 0.026531879, 0.14486963) * inp_1_1_0; + result2 += M4(-0.014871851, -0.03370725, 0.32739255, -0.056933377, 0.01230874, 0.028961578, 0.15074731, 0.13390249, 0.16060308, -0.28017068, -0.049378213, 0.15798374, 0.1049363, 0.021499243, -0.056283005, 0.5702396) * inp_1_2_0; + result2 += M4(-0.40781596, -0.068078905, -0.2608516, -0.36839285, 0.27331737, 0.06990319, 0.028166782, 0.47841585, -0.07101787, -0.07055015, 1.3041064, -0.08154195, -0.6420218, -0.16353844, 0.8393286, 0.14371522) * inp_1_0_1; + result2 += M4(-0.036683656, 0.23350303, -0.3823271, -0.1895325, -0.042114716, -0.27834532, -0.011016889, 0.054359082, 0.52122265, 0.09595518, 0.29784077, -0.045716044, 0.26147208, 0.1535827, -0.3547086, -0.5459924) * inp_1_1_1; + result2 += M4(-0.08925608, 
-0.14973558, -0.17211129, 0.03096805, 0.11671369, 0.21920115, 0.06494186, -0.06473811, 0.13254163, 0.0064040422, 0.0197999, -0.029223228, -0.12759385, -0.038808268, -0.07336323, 0.4978441) * inp_1_2_1; + result2 += M4(-0.08437726, -0.20194645, 0.07599329, -0.21935628, 0.3217862, -0.027808418, -0.055483975, 0.48027533, -0.07248972, -0.10917602, -1.1656119, 0.25192067, 0.726754, -0.4072386, -0.84861493, -0.28209558) * inp_1_0_2; + result2 += M4(0.24826227, 0.03057961, -0.025810828, 0.15662467, 0.19474192, -0.20894553, -0.13577338, 0.22615886, -0.18568474, 0.03584874, 0.24559572, 0.13821158, -0.45080966, 0.32287788, 0.014510343, 0.0734196) * inp_1_1_2; + result2 += M4(-0.02822516, -0.023234604, -0.058450423, 0.15003574, -0.010218517, 0.0002537157, -0.05167111, -0.051569637, -0.120971926, 0.122743204, 0.14452058, 0.026441488, -0.17925249, 0.2772131, 0.017249027, 0.16620068) * inp_1_2_2; + result3 += M4(0.030601235, 0.1533475, 0.1354541, 0.17745161, -0.020671252, -0.10372984, -0.13732138, -0.23245959, -0.084360994, 0.22388554, 0.26257366, -0.08955721, 0.054022234, 0.0046199774, -0.40396032, 0.17547776) * inp_1_0_0; + result3 += M4(0.0950914, 0.13105528, -0.17804535, 0.036833197, 0.10695207, -0.12510276, 0.020602226, 0.15301901, 0.17476954, -0.02053389, 0.55537015, -0.09537796, 0.11434194, 0.020771341, -0.0027719524, -0.022421993) * inp_1_1_0; + result3 += M4(-0.09498485, 0.017095882, -0.13202192, 0.040244695, -0.19800507, -0.031560943, 0.04959914, 0.03567479, 0.24101183, -0.042635966, -0.18614642, -0.009154916, -0.00247375, -0.19376199, 0.26423156, 0.03759395) * inp_1_2_0; + result3 += M4(0.07953845, 0.39391887, 0.00727727, 0.35082912, 0.025060296, -0.2595865, 0.16177765, -0.7336906, 0.23894046, -0.070483424, -0.30498013, 0.56130445, -0.010698394, 0.021584244, -0.58075994, 0.68465334) * inp_1_0_1; + result3 += M4(-0.40409416, -0.0077395765, -0.3227979, -0.068225116, 0.5861685, 0.08172666, 0.13572781, 0.3026567, -0.57700115, 0.107233115, -0.2528313, -0.17424521, 
-0.84155977, -0.02813022, -0.5172479, -0.59169096) * inp_1_1_1; + result3 += M4(0.14502329, 0.06812947, 0.2185236, 0.0643197, -0.2091687, -0.09261454, -0.09526991, 0.040777106, 0.032173075, -0.11730932, -0.13217378, 0.0023497643, 0.44384873, -0.15709418, 0.6121635, -0.090208404) * inp_1_2_1; + result3 += M4(0.04270719, 0.21312836, -0.048879534, -0.11266838, -0.14382827, -0.2192215, 0.0068878373, -0.025609564, -0.09477325, 0.2191171, 0.096425086, -0.16293575, -0.051669516, 0.4190975, 0.12580837, -0.135226) * inp_1_0_2; + result3 += M4(-0.046412982, -0.12211086, 0.0077603217, -0.07431488, 0.17982213, 0.0438941, -0.196129, 0.06958203, 0.0024261524, -0.26292798, -0.097179495, -0.19446476, 0.29509872, -0.07991557, 0.74099654, 0.1677081) * inp_1_1_2; + result3 += M4(0.047113243, 0.058038574, 0.24930288, 0.06464759, -0.03720209, -0.051006317, -0.01912244, 0.011376446, 0.15856679, 0.103483565, 0.46561158, 0.030039294, -0.07310521, 0.45909077, 0.32737142, -0.009899002) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.056658532, -0.084393896, -0.08351355, 0.026212027, -0.16376431, 0.28912234, 0.027704367, -0.071667574, 0.22876024, 0.5063291, -0.034939148, -0.04414098, 0.80793244, 0.2117281, 0.04003154, -0.019289244) * inp_2_0_0; + result0 += M4(-0.6404585, -0.17796884, -0.14469966, 0.064434, -0.037456833, -0.43776658, -0.076254845, -0.016480407, 0.053084683, -0.4298736, 0.009404756, 0.083069295, -1.0547874, -0.20475821, 0.027985618, 
0.12540238) * inp_2_1_0; + result0 += M4(-0.28070635, 0.1289751, 0.1219496, 0.01570686, -0.19013144, 0.29028776, 0.012497347, -0.0010326781, -0.7109733, -0.095800534, -0.07843679, -0.017538793, 0.4179525, 0.13152626, 0.106455006, 0.01078675) * inp_2_2_0; + result0 += M4(0.081900895, 0.19029334, -0.073567726, -0.047557395, 0.19428933, -0.038285363, -0.11491762, -0.01837945, 0.07547317, -0.5344631, 0.1524544, -0.14964266, -0.19406794, -0.059020177, 0.19315392, -0.038649715) * inp_2_0_1; + result0 += M4(-0.16288629, 0.43891653, 0.08301114, -0.359797, -0.07925925, 0.157717, 0.23638429, -0.5961064, -0.20833725, 0.6921076, 0.18377437, -0.46835884, 0.23760724, 0.2279108, -0.18868038, -0.24260604) * inp_2_1_1; + result0 += M4(-0.13185735, 0.16606236, 0.07416285, -0.03832922, 0.17361966, -0.13698995, -0.08244967, -0.08690483, 0.023102188, -0.21447626, -0.15169983, 0.22278568, -0.030070322, 0.10786125, -0.09606021, -0.00094145857) * inp_2_2_1; + result0 += M4(0.19589414, 0.008045848, -0.26970163, 0.07926561, 0.0055276607, -0.034727324, 0.014047634, 0.01084498, 0.013823401, 0.045765556, -0.06885619, 0.11313184, -0.09608044, 0.11905903, -0.057270247, 0.17040935) * inp_2_0_2; + result0 += M4(-0.35795772, 0.052093923, -0.27925724, 0.7024668, -0.23307371, 0.15484054, 0.086788125, 0.40594432, 0.030013239, -0.012880656, -0.23584186, 0.6172303, 0.100337416, -0.2668913, 0.07190245, 0.045928806) * inp_2_1_2; + result0 += M4(0.08252405, -0.14609249, -0.064848445, -0.05421016, -0.08036742, 0.064709485, 0.0995519, 0.17094779, 0.19813484, -0.023966646, 0.06744239, -0.24773261, -0.08125354, -0.11565303, -0.004539193, 0.003593128) * inp_2_2_2; + result1 += M4(-0.05913632, -0.13035738, -0.2095817, -0.121928796, 0.24421848, 0.31298313, 0.06490786, 0.11518253, -0.12560591, -0.019254718, 0.10287586, 0.10359144, -0.18111609, 0.003691266, -0.16280791, 0.15910712) * inp_2_0_0; + result1 += M4(-0.09409358, 0.18263733, 0.044311643, 0.06420531, 0.09978127, 0.061665844, 0.19545491, -0.07039197, 
0.12624802, -0.034005325, -0.14515208, -0.078887306, 0.106090754, 0.16866021, -0.14042042, -0.046339422) * inp_2_1_0; + result1 += M4(0.07321761, -0.005795847, -0.13165809, 0.019000694, -0.09719375, 0.16906215, -0.08389258, -0.024464838, -0.20402004, -0.22585747, 0.19619657, 0.03625385, -0.056417644, -0.10498231, 0.15780598, -0.05896881) * inp_2_2_0; + result1 += M4(0.11133829, 0.15564004, -0.018679706, -0.20204216, 0.18958686, 0.27253, -0.06635486, -0.14202532, -0.12708612, 0.22483705, 0.028482271, 0.287388, 0.07226748, 0.16693592, 0.083715275, -0.43332836) * inp_2_0_1; + result1 += M4(-0.107852295, 0.4372522, 0.82334834, -0.010232122, -0.124953635, -0.1031519, 0.88873106, -0.066571906, 0.107724965, 0.14239775, 0.38775948, -0.3008945, 0.12835532, -0.004528145, 0.46319053, 0.37589112) * inp_2_1_1; + result1 += M4(0.36154172, -0.048908047, 0.01569887, 0.10236648, -0.3750691, -0.028939823, 0.13799433, -0.07261984, -0.19416392, 0.23474926, 0.16244835, 0.17886005, -0.08432286, -0.099077776, -0.16162856, 0.006568329) * inp_2_2_1; + result1 += M4(0.20400487, -0.11719335, -0.11616023, 0.5995642, 0.122836575, 0.4458128, -0.16099311, 0.699037, -0.21749511, -0.22285137, -0.13708612, 0.08973937, -0.033287726, -0.33511263, 0.01033256, 0.060349323) * inp_2_0_2; + result1 += M4(-0.13193716, -0.27737704, -0.442998, 0.02232665, 0.13035831, -0.17953672, -0.57704264, -0.19806914, 0.66499674, -0.057644695, -0.6075821, -0.7843484, 0.11177764, 0.3197587, -0.19009523, -0.35939646) * inp_2_1_2; + result1 += M4(0.30169463, -0.27423045, 0.030066399, 0.09561448, -0.35065278, -0.09054245, -0.13476075, 0.058679003, -0.240253, -0.25924155, -0.025114952, 0.1503409, -0.10358453, 0.06972844, 0.10086383, 0.1513331) * inp_2_2_2; + result2 += M4(-0.09140265, -0.043480042, 0.39341742, -0.16124645, 0.039826732, 0.0982359, 0.14812395, -0.29226306, -0.12270788, -0.056483883, 0.46743312, -0.12414679, -0.08598476, -0.020382252, 0.8526356, -0.6251697) * inp_2_0_0; + result2 += M4(0.19089483, -0.094089076, 
0.27113757, -0.89349926, 0.092731245, -0.052982565, 0.029999843, -0.27503353, 0.1723571, -0.14498913, -0.59834313, 0.38859525, 0.12832993, 0.06796332, -0.43113524, 0.2746368) * inp_2_1_0; + result2 += M4(0.101626456, 0.012754597, -0.25569427, -0.075960755, -0.04676257, 0.022405503, -0.08868581, 0.07564415, -0.1573639, 0.12833588, -0.31780383, -0.46218848, -0.027274387, -0.13945863, -0.110267706, -0.027970377) * inp_2_2_0; + result2 += M4(0.03608637, -0.09479316, -0.21446887, 0.56932735, -0.08810863, 0.06604438, -0.1869864, 0.6002932, -0.12353022, 0.0830962, 0.2746934, 0.16245197, -0.08361289, 0.0022464357, -0.2217645, -0.12708506) * inp_2_0_1; + result2 += M4(-0.3414478, -0.1966153, 0.055342548, -0.013102268, -0.47288916, -0.5555628, -0.14289796, -0.08635351, -0.41934514, -0.6622999, 0.22686398, -0.15859646, -0.16033597, -0.0053745653, 0.36677605, -0.23678315) * inp_2_1_1; + result2 += M4(-0.17615376, -0.046758268, 0.01108182, -0.07680903, 0.029766507, 0.6448251, 0.20447639, 0.056505933, 0.23630296, 1.0478128, 0.26991642, -0.055334356, 0.13279189, 0.026829982, -0.12233411, 0.16576806) * inp_2_2_1; + result2 += M4(0.15395284, -0.1248782, 0.31775445, 0.0008446973, 0.2462245, 0.050902765, 0.22869344, 0.31496996, 0.032222766, -0.19146186, 0.16774654, 0.4773935, 0.12845011, -0.0674604, -0.16974731, 0.6718414) * inp_2_0_2; + result2 += M4(0.19998777, -0.0046336846, -0.17863709, -0.022363333, 0.30268896, -0.21146934, -0.05744014, 0.16582312, 0.55801415, 0.09421628, -0.652831, 0.22474986, 0.052013434, -0.08298826, -0.20941404, 0.2198382) * inp_2_1_2; + result2 += M4(-0.05906059, -0.055516556, -0.15871921, -0.20876054, 0.056753717, -0.122805975, -0.10752009, 0.07214043, -0.2886711, -0.104196325, 0.13151167, -0.11443949, -0.29457253, 0.09404759, 0.0781491, 0.09187794) * inp_2_2_2; + result3 += M4(0.07131227, -0.17103189, -0.65701765, -0.08103885, 0.0114034135, -0.11564006, -0.3758374, -0.30220702, 0.10926563, 0.060695365, -0.13507707, 0.02752198, 0.15815619, -0.099520825, 
-0.12582445, 0.011142395) * inp_2_0_0; + result3 += M4(0.16390102, -0.043893002, -0.17439, 0.00196632, 0.23113947, -0.054559767, -0.22033226, 0.16813108, 0.07049406, -0.07914666, 0.44900405, -0.2244528, 0.035653476, 0.05198975, -0.16546313, -0.113693014) * inp_2_1_0; + result3 += M4(0.015167149, 0.080200985, 0.18556446, 0.044955164, -0.17171162, -0.055256296, -0.002402905, 0.082981795, -0.22192933, 0.03015825, -0.25711286, 0.011584354, -0.095374405, -0.1382058, -0.12054189, 0.10028561) * inp_2_2_0; + result3 += M4(0.004898744, -0.089915045, -0.095151104, -0.8470385, 0.037769705, -0.07265799, -0.13910796, -0.52633315, -0.07218728, -0.05430542, 0.37463775, -0.4195107, -0.11475595, 0.32739305, -0.06587419, 0.096468985) * inp_2_0_1; + result3 += M4(0.43917456, 0.026247881, 0.19216591, 0.11570986, 0.46347585, -0.39810273, 0.45491657, 0.7642445, 0.52890843, 0.058011733, 0.6879336, 1.197659, -0.17768478, -0.044728726, 0.0114222765, 0.15778284) * inp_2_1_1; + result3 += M4(-0.087177016, -0.10747335, -0.10010042, 0.115062304, -0.8122979, 0.06514974, -0.20169608, -0.10079475, -0.99654114, 0.3199778, -0.07893785, -0.12280641, -0.31013697, 0.34886715, 0.16507483, -0.1397757) * inp_2_2_1; + result3 += M4(-0.040510368, -0.19001658, 0.10233444, -0.21234024, 0.019421631, -0.2970453, 0.0011585673, -0.20484056, 0.07370205, -0.07258561, 0.26393914, 0.021444967, 0.17476425, -0.11027206, 0.45120278, -0.14630376) * inp_2_0_2; + result3 += M4(0.13665591, 0.4259041, 0.0023495876, 0.14909796, 0.19523306, 0.3640925, -0.26424402, 0.22802217, 0.083183356, 0.6097358, -0.7197997, -0.32168692, 0.2591536, 0.26636642, -0.1078281, -0.1142868) * inp_2_1_2; + result3 += M4(0.041843053, 0.021810856, -0.21729478, -0.08708366, -0.2119869, -0.15670185, -0.18791877, 0.05018508, 0.3888126, -0.37974566, -0.27909023, 0.053460464, 0.06214204, -0.44816417, 0.15038887, 0.16712622) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x 
+ 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.3472437, 0.013380894, 0.08867833, -0.03453232, 0.58152944, -0.43871528, 0.22380953, -0.04550669, 0.120581925, 0.004563894, 0.04559358, 0.0027206047, 0.017552061, 0.16171905, -0.037060566, -0.01708926) * inp_3_0_0; + result0 += M4(-0.34160993, -0.11255932, -0.058914144, 0.026892548, -0.31992993, 0.26869294, -0.09144462, 0.08680876, 0.26296964, -0.12034341, -0.045838475, -0.032575533, 0.07309527, -0.11566818, 0.018513981, -0.010388167) * inp_3_1_0; + result0 += M4(0.28056777, 0.07695634, -0.059898093, -0.061575457, 0.3669255, 0.028526982, 0.24511854, -0.09934631, -0.07288608, 0.050052203, -0.038593568, 0.008848001, 0.27569962, -0.037571654, 0.056816753, -0.0039305515) * inp_3_2_0; + result0 += M4(-0.028644724, 0.12271751, 0.026339592, 0.008865822, 0.2519346, -0.26284647, -0.1638227, -0.008493934, -0.28506994, 0.011916564, 0.019927721, -0.029855786, 0.0014189436, -0.047583543, -0.050952516, -0.083322175) * inp_3_0_1; + result0 += M4(0.20403737, -0.040827665, -0.0028530445, -0.017813073, -0.4706143, 0.42873096, 0.14829667, 0.046647582, -0.48000586, 0.37023175, 0.08343689, 0.0029796327, -0.23113053, 0.065826334, 0.074439414, 0.074652724) * inp_3_1_1; + result0 += M4(0.1586078, 0.0784932, -0.15297528, 0.09501966, -0.4055182, -0.30885902, -0.060376216, -0.15000467, -0.009729531, 0.07221125, -0.04001262, 0.12093661, -0.15710236, 0.09445375, 0.073956475, -0.019581962) * inp_3_2_1; + result0 += M4(-0.111901745, 0.02471801, -0.06651766, 0.095790766, -0.08006672, 0.19840515, 0.26936525, -0.13326232, -0.10196766, 
-0.19608083, -0.11811127, 0.22120981, -0.10520785, 0.095748596, -0.007844923, 0.11197408) * inp_3_0_2; + result0 += M4(0.043696456, 0.013067065, 0.07440999, -0.53549933, 0.073651895, -0.0088031795, -0.14840111, 0.44721222, 0.2975085, -0.023100551, -0.15204108, 1.3613566, -0.03796179, 0.07700565, -0.04039371, 0.39191732) * inp_3_1_2; + result0 += M4(-0.035744753, 0.008431576, -0.011160678, -0.089015596, 0.067718446, 0.045862436, -0.1271991, -0.052337117, -0.21953662, -0.021048736, -0.019922525, 0.16980134, -0.06376514, 0.020770412, -0.1292233, 0.19095159) * inp_3_2_2; + result1 += M4(0.04209156, -0.10028043, 0.045473978, 0.029526308, -0.1029502, 0.097725846, 0.11866024, 0.101209536, -0.103658065, 0.1303318, 0.10141563, 0.08520663, 0.056324724, 0.043090805, 0.061262637, -0.009563499) * inp_3_0_0; + result1 += M4(-0.11467653, -0.05272206, -0.12958023, -0.018456401, 0.023291504, 0.10627822, 0.046663657, 0.16016315, 0.049062163, -0.19274554, -0.076242104, -0.039942898, -0.25169963, -0.048676368, 0.0037137556, 0.053856958) * inp_3_1_0; + result1 += M4(-0.15907876, -0.11642729, 0.08522632, -0.012964159, -0.21032064, 0.18714333, 0.018133575, -0.12953383, 0.07832173, -0.07664562, -0.008530792, -0.030324288, 0.2171452, -0.052815564, -0.03799995, -0.07796586) * inp_3_2_0; + result1 += M4(0.014487541, 0.035919957, -0.043378692, -0.10243317, 0.29915744, -0.029785946, 0.08348936, -0.2593623, -0.28476247, 0.15268299, -0.009884593, 0.28988793, 0.18091768, 0.41806173, -0.0008945458, 0.43557742) * inp_3_0_1; + result1 += M4(-0.015301471, 0.028162321, 0.0628364, 0.12303836, -0.07908043, -0.05095927, 0.08793644, 0.109865434, 0.009046035, -0.014763819, -0.10699331, -0.1811893, -0.35765564, 0.015265002, -0.021379912, 0.054260004) * inp_3_1_1; + result1 += M4(-0.008764806, -0.047667857, -0.00043627238, -0.085696295, -0.071407646, -0.31469864, 0.09608359, 0.0036131532, 0.04063981, -0.02390764, 0.03337885, -0.08083824, 0.4892242, -0.030610098, 0.053893816, 0.0005124162) * inp_3_2_1; + 
result1 += M4(0.23028834, 0.27810562, -0.0005937561, 0.062948644, -0.06315908, 0.2782613, 0.054228317, 0.37353197, 0.04041054, -0.83467233, -0.20950946, 0.2553413, 0.13149354, 0.12652624, -0.108717784, 0.39738894) * inp_3_0_2; + result1 += M4(-0.056789584, 0.22073776, 0.43888393, 0.007940124, -0.17490996, -0.10502325, -0.49565843, -0.26163256, 0.5991587, -0.6067586, -0.9914189, -0.2210728, -0.3194455, -0.15456308, -0.13144505, -0.03552233) * inp_3_1_2; + result1 += M4(-0.32254165, 0.044227004, 0.13516445, 0.03845159, 0.009997396, 0.008264542, -0.06699806, -0.051496867, 0.11909525, -0.28769228, -0.18918002, -0.057668176, 0.23843196, -0.1769408, -0.076675124, -0.031703703) * inp_3_2_2; + result2 += M4(0.024601893, 0.047437504, 0.29823276, 0.09947944, 0.21934599, 0.11803661, 0.65973103, 0.26546025, 0.029531708, -0.0067652045, -0.17580013, 0.26997727, -0.030777141, 0.040013187, 0.024318442, 0.37423348) * inp_3_0_0; + result2 += M4(0.112576716, -0.13343264, 0.08077175, -0.048998382, -0.093169354, -0.04977975, 0.015730407, -0.73369396, -0.09483911, -0.06737101, 0.06244766, 0.07160388, -0.002243437, -0.12980196, -0.042938337, -0.026755292) * inp_3_1_0; + result2 += M4(0.062544756, 0.30026558, 0.17554766, 0.13842122, 0.04878832, -0.1402889, 0.1123605, -0.070087515, 0.016846227, 0.13830933, -0.003600853, -0.07052991, 0.08062244, 0.14440808, 0.037623156, -0.10593128) * inp_3_2_0; + result2 += M4(-0.022144489, 0.031163864, -0.35879242, -0.06148122, 0.18611787, 0.28179172, -0.65257895, 0.22794338, 0.075979315, -0.1493961, 0.022940412, -0.04455144, 0.013953682, 0.08925602, -0.010988895, -0.06853787) * inp_3_0_1; + result2 += M4(-0.104398176, -0.165788, -0.27504763, -0.45820633, 0.12718037, -0.30875504, 0.12423894, 0.15830809, -0.14640152, 0.072613806, -0.013286344, 0.03865688, 0.06950812, -0.34721127, -0.008446023, 0.07753682) * inp_3_1_1; + result2 += M4(-0.0765464, 0.043303255, 0.021159632, 0.031017859, -0.11436186, 0.084210224, -0.3106996, 0.088460155, 0.1289226, 0.20739235, 
0.1362793, -0.2524162, -0.17312491, -0.12867886, -0.10566141, 0.031078596) * inp_3_2_1; + result2 += M4(0.09355678, 0.10412212, 0.004731364, 0.42740902, -0.116885625, 0.052118473, 0.43677473, 0.20393315, 0.07955809, -0.119825155, 0.17133446, -0.11519095, 0.13483945, -0.010165948, 0.11746103, 0.033520274) * inp_3_0_2; + result2 += M4(-0.3813429, -0.11363336, -0.12936473, 0.18715818, 0.32119343, -0.021526324, -0.43352234, -0.06257893, 0.6233187, 0.13396265, 0.038704164, 0.0631709, 0.1939896, -0.15153073, 0.123462155, -0.01652716) * inp_3_1_2; + result2 += M4(-0.41880918, -0.030412536, 0.12958126, 0.120551094, -0.022546515, -0.04808989, 0.17756711, -0.108908154, 0.2226288, -0.10673246, -0.16231227, -0.03192408, 0.14065991, 0.1836104, -0.03244477, -0.044319637) * inp_3_2_2; + result3 += M4(-0.0011758883, 0.0031363205, -0.16173664, 0.08941673, -0.11167737, -0.33703038, 0.12200337, 0.055131473, 0.035779245, 0.0029444366, 0.055127386, -0.09139993, -0.033134703, -0.03748916, -0.066961385, -0.108324334) * inp_3_0_0; + result3 += M4(0.053190347, -0.111483805, -0.06346869, 0.012349723, -0.045100734, 0.029720673, -0.22522068, 0.14960602, -0.043017942, 0.092041545, 0.16698928, 0.08137758, 0.16750063, 0.011768444, -0.09525918, 0.010928377) * inp_3_1_0; + result3 += M4(-0.14769338, 0.027719587, -0.058809258, 0.028551238, -0.09908326, 0.10515259, -0.14025599, 0.061426327, -0.042780805, -0.035405204, -0.05823736, -0.016086705, 0.04844154, 0.032153595, -0.07846922, 0.019060513) * inp_3_2_0; + result3 += M4(-0.07933811, 0.29348436, 0.15147564, -0.011950693, -0.07698759, 0.21123506, 0.27513096, -0.4870618, 0.15858337, -0.088143416, 0.0066797114, -0.2147107, 0.09265716, -0.03495672, 0.045518417, -0.3315414) * inp_3_0_1; + result3 += M4(0.1404907, -0.053150203, -0.040700138, 0.18472278, 0.61421394, 0.054680698, 0.046741713, 0.0037532535, 0.13713816, 0.114549585, 0.26238853, 0.21299282, 0.12599483, 0.028305324, -0.010574808, -0.57075983) * inp_3_1_1; + result3 += M4(-0.13837083, 
0.1861814, 0.27288082, 0.02824301, -0.2062445, 0.06472042, 0.019210115, 0.007461685, -0.32328922, 0.014523166, -0.30206257, 0.1573444, 0.15600231, 0.0886993, 0.24092384, 0.02336472) * inp_3_2_1; + result3 += M4(0.024918266, -0.28346768, -0.033286523, -0.19488813, -0.021365946, -0.31525356, -0.06427523, -0.022802275, 0.017455311, 0.29595226, -0.21315272, -0.055813782, 0.086387426, -0.14360276, -0.13709465, -0.122531205) * inp_3_0_2; + result3 += M4(0.10574195, -0.4813584, 0.31677288, -0.08348199, -0.15907282, 0.090848915, -0.4333516, -0.014139355, 0.11864891, 0.5082066, -0.43740028, 0.10677436, 0.101659745, 0.06943931, 0.02947963, -0.027463546) * inp_3_1_2; + result3 += M4(-0.20253208, -0.26093277, 0.068154514, 0.024943102, 0.054091427, -0.12938003, 0.20981514, 0.16747186, -0.19666524, 0.109958075, -0.24808154, -0.011728526, -0.020255229, 0.12573044, -0.07719842, 0.07252243) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-2-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_1 +//!SAVE conv2d_2 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 
local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.023435008, -0.00027622582, -0.015393672, 0.008721407); + V4 result1 = V4(-0.0058370507, -0.015384002, -0.010110728, 0.015183784); + V4 result2 = V4(0.038818885, 0.047503617, -0.043154787, -0.005362168); + V4 result3 = V4(-0.03511599, -0.0390787, -0.001977005, 0.019544978); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.058053754, 0.13135362, -0.047918122, -0.011845601, -0.0074042883, -0.01840911, -0.011805869, -0.03396952, -0.1423342, 0.26230896, -0.119458295, -0.06616202, -0.009783131, 0.035237905, -0.03701137, -0.10224075) * inp_0_0_0; + result0 += M4(-0.041274697, -0.07608542, 0.047750793, 0.054070923, -0.16413322, 0.014423329, -0.03390137, -0.00094438414, 0.24362351, -0.2306998, 0.025874767, -0.07668255, -0.15923639, 0.46262452, 0.05566397, 0.15915436) * inp_0_1_0; 
+ result0 += M4(0.11520685, 0.0699546, 0.064455785, -0.0076417695, 0.0049518016, -0.0375039, -0.026019963, -0.007440243, 0.03008722, 0.14577916, -0.049544826, 0.05725768, 0.06544244, 0.07811894, 0.05958433, 0.037279688) * inp_0_2_0; + result0 += M4(-0.077427626, -0.28169155, 0.14521974, -0.02468973, -0.012213673, 0.045991287, 0.032625675, -0.041064482, 0.045073047, 0.22772516, 0.09916965, 0.032622837, 0.081653826, 0.0040710922, -0.06014905, -0.014239243) * inp_0_0_1; + result0 += M4(-0.08949968, 0.40064472, -0.3088256, -0.030333402, -0.077949814, 0.036044396, 0.006116637, 0.016873905, -0.061148554, -0.18398748, 0.016047241, 0.21445145, -0.5862237, 0.06960463, -0.24190919, 0.019996881) * inp_0_1_1; + result0 += M4(0.0010335072, -0.074155085, 0.06035906, 0.05635123, -0.029693812, 0.25365904, -0.00024468364, 0.017304827, -0.18047398, -0.060659446, -0.011265205, 0.014874942, -0.60377824, 0.0348222, 0.076552495, 0.06994206) * inp_0_2_1; + result0 += M4(0.0068813893, -0.040201046, 0.15965754, -1.7235106e-05, -0.017728887, 0.0489135, -0.048296545, -0.0256505, 0.09437446, 0.12918611, -0.04645181, -0.22671208, 0.08722971, -0.27255175, 0.024839658, 0.031033102) * inp_0_0_2; + result0 += M4(0.32137305, -0.102484845, 0.5899058, 0.44748813, 0.14033101, 0.26633027, 0.14133942, -0.045242507, -0.3500667, -0.16679467, -0.11007231, -0.1118854, 0.14673825, 0.065924786, 0.017390981, -0.0049263104) * inp_0_1_2; + result0 += M4(-0.2750656, -0.12161614, -0.28282353, -0.22726911, -0.04463269, 0.053947803, -0.038568437, -0.06423929, 0.24576302, 0.03625427, 0.10282412, 0.05768898, -0.30617765, 0.08486049, -0.027985916, 0.014466912) * inp_0_2_2; + result1 += M4(-0.0073026754, -0.10402381, -0.013642001, 0.044249803, -0.02854999, 0.26434416, 0.057275936, 0.08449719, -0.2368094, -0.006792606, 0.08725315, -0.1143782, -0.26464862, -0.14515208, 0.06274822, 0.36444998) * inp_0_0_0; + result1 += M4(-0.013720833, -0.06886963, 0.05349541, -0.06206712, 0.035714574, 0.039087676, 0.08770568, 0.14166538, 
0.19585021, -0.2129663, 0.14013258, 0.0022852065, -0.5944084, -0.7182823, 0.122801915, -0.15706588) * inp_0_1_0; + result1 += M4(0.10479358, 0.120234706, -0.064341865, 0.14256644, 0.10301237, -0.04109505, -0.0512812, 0.13723285, -0.029703898, 0.24554458, 0.01530522, 0.3853674, -0.20900846, -0.5164066, -0.20735526, 0.07260991) * inp_0_2_0; + result1 += M4(-0.14815906, -0.01028779, -0.14179946, -0.08245007, 0.019574288, 0.16411702, 0.11887322, 0.0020758726, 0.028338032, -0.16261598, 0.17139073, -0.06354438, -0.18751918, -0.06267931, -0.009964829, 0.011002064) * inp_0_0_1; + result1 += M4(-0.080518, 0.1318538, 0.44151536, -0.04916626, -0.056665212, 0.34340844, 0.16808915, 0.07016322, -0.2744961, 0.019613005, -0.52572715, -0.5972775, -0.17945085, -0.38791883, 0.2364365, 0.4347594) * inp_0_1_1; + result1 += M4(0.18026938, -0.1343583, -0.27794445, 0.25141716, 0.25054744, 0.11847508, -0.022598626, -0.08347308, -0.06789105, 0.56946987, 0.21327427, 0.39672527, -0.07893942, -0.3660021, 0.04420206, -0.04678048) * inp_0_2_1; + result1 += M4(-0.3361689, 0.21600454, 0.29812515, 0.19549452, 0.13161008, 0.1506024, 0.084969185, 0.07457274, 0.115148, -0.10726738, -0.15455638, 0.022031983, -0.07685952, 0.004126467, -0.0036478213, -0.03565146) * inp_0_0_2; + result1 += M4(-0.041066427, -0.11341293, -0.9815334, -1.0637896, 0.23624156, 0.144971, 0.13262825, -0.06459397, 0.3298128, -0.18340024, 0.044938684, -0.078921996, -0.15567741, -0.06563018, 0.058869045, -0.31469694) * inp_0_1_2; + result1 += M4(-0.18666749, -0.04640199, 0.6378595, 0.15205689, -0.010305863, 0.25054187, 0.18608533, 0.12638347, 0.1989298, -0.16685888, -0.008758655, -0.11104765, -0.010293042, -0.19616619, 0.03701753, 0.16267337) * inp_0_2_2; + result2 += M4(-0.03328148, -0.006684863, 0.047662534, -0.06358788, 0.018822119, -0.053844366, 0.06987464, 0.092299104, -0.13518637, 0.12761132, -0.13602121, 0.15030415, 0.16349082, 0.13304846, -0.12295147, -0.5695785) * inp_0_0_0; + result2 += M4(0.09411206, -0.05187804, 
-0.017689293, 0.013353826, -0.08697054, -0.1597196, 0.22802964, 0.04886305, 0.08418551, -0.0804207, 0.11035258, 0.12820846, 0.023220098, 0.057945892, -0.31034696, -0.15134479) * inp_0_1_0; + result2 += M4(0.114032544, -0.06916583, 0.025773713, 0.05741373, -0.24842425, -0.09751518, 0.14063355, 0.0502536, 0.054900263, -0.17048357, -0.11259802, 0.160759, 0.16757573, -0.01877, -0.11194997, -0.16462773) * inp_0_2_0; + result2 += M4(0.35808134, 0.039701495, 6.3124726e-06, 0.03133524, -0.05278441, -0.054526035, 0.04481739, 0.2529997, -0.16400562, -0.19464107, -0.2156525, -0.04006176, 0.19686534, 0.033792473, -0.49558243, -0.25051036) * inp_0_0_1; + result2 += M4(-0.05304926, -0.3043419, 0.10092999, -0.058093864, -0.23438485, 0.034214076, 0.057646334, 0.1186709, 0.044353776, -0.1963721, -0.37588304, -0.13445406, 0.127387, -0.35068044, -2.7945485, -0.34946597) * inp_0_1_1; + result2 += M4(-0.39820927, 0.21416184, -0.05426307, 0.04687176, -0.2081737, -0.2406106, 0.23088469, 0.11969322, -0.083836876, 0.29234567, -0.28048143, 0.052370936, 0.21438457, 0.03972491, 0.13101222, -0.27309152) * inp_0_2_1; + result2 += M4(-0.41306856, 0.16440691, -0.09808768, -0.26407242, 0.0053243865, -0.09325784, 0.20075214, 0.3811357, 0.30143264, 0.058478504, -0.06928174, 0.027018353, -0.20570262, -0.013981209, 0.007406996, -0.118252516) * inp_0_0_2; + result2 += M4(0.27038062, 1.5538056, -0.87050104, 0.03884074, -0.28182444, -0.08340967, -0.0689404, 0.3859192, -0.116228536, -0.31909284, 1.1460763, -0.2930017, 0.05609198, -0.26499516, -0.40788504, -0.4939044) * inp_0_1_2; + result2 += M4(0.18884245, -0.25252223, -0.2608849, -0.101122685, 0.037499864, -0.23475505, 0.23866269, 0.112167336, -0.011161603, 0.13258833, 0.23283808, 0.20873502, 0.12333728, 0.008156681, -0.061962094, -0.2777167) * inp_0_2_2; + result3 += M4(-0.017292995, 0.059847377, -0.01150032, -0.004381958, 0.009071516, 0.006968245, -0.034055986, 0.03740713, -0.07671129, 0.010568533, -0.11548467, -0.03640214, 0.004297413, 0.013166457, 
-0.020208651, -0.042670313) * inp_0_0_0; + result3 += M4(0.021905567, -0.012356532, 0.034336973, -0.025187774, 0.021469206, -0.04151741, 0.009018021, 0.11130828, 0.036343213, 0.023039078, 0.046457145, -0.16021183, 0.07557342, -0.04547214, -0.06765464, -0.10687027) * inp_0_1_0; + result3 += M4(-0.030245442, 0.017085928, 0.05411745, -0.02326739, 0.09594549, 0.042214155, -0.051801145, 0.08451421, -0.13254002, -0.02382279, 0.050920837, 0.00031751744, 0.18047972, 0.16602163, 0.030823914, -0.0011384314) * inp_0_2_0; + result3 += M4(0.023018463, 0.17725265, -0.083900005, -0.0016977334, 0.08052999, 0.012068541, 0.023925066, 0.062392928, 0.089258514, 0.20762452, -0.0012363704, -0.06545757, -0.041220512, 0.14856975, -0.006452312, -0.06116456) * inp_0_0_1; + result3 += M4(0.26562902, -0.016244365, 0.0019193676, 0.24509418, -0.09421186, -0.010551239, 0.023509221, 0.2747535, 0.22532648, 0.12740539, 0.036053278, 0.05915232, -0.2972877, 0.3417145, 0.49117815, -0.15531492) * inp_0_1_1; + result3 += M4(-0.24040136, 0.12780526, -0.013421846, -0.25284502, 0.11611097, -0.025960911, 0.03066189, 0.1830375, 0.21415165, 0.033922963, -0.13749541, 0.02706012, -0.2598328, 0.21364947, 0.09336273, 0.04968067) * inp_0_2_1; + result3 += M4(-0.03718352, -0.96204364, 0.03714818, -0.43719187, -0.048487782, -0.43293557, -0.059800256, 0.078956455, 0.0018238121, -3.0549855, -0.03621669, 0.108869955, 0.036982004, 0.19670472, 0.036557764, 0.1534082) * inp_0_0_2; + result3 += M4(0.26199692, -0.8192162, 0.28409663, 0.9116149, 0.089281835, -0.75085104, 0.07663377, 0.13557278, -0.08273171, -3.062832, -0.019690165, -0.18279873, -0.037827354, 0.18978551, -0.028312258, -0.09479274) * inp_0_1_2; + result3 += M4(0.21662533, -0.042922545, -0.20742215, 0.028488081, -0.022670094, -0.5893865, 0.008961727, 0.3320175, 0.028824994, -2.5308259, 0.11584823, -0.08467847, -0.09340072, 0.3430715, -0.060575213, 0.101658076) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = 
inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.020158637, 0.04921676, 0.0011248378, -0.0139853535, -0.021115072, 0.0842691, 0.07378322, -0.0016990606, 0.059866313, -0.28137094, -0.06698033, 0.10465488, 0.010329514, 0.0108864745, -0.01272496, 0.045122433) * inp_1_0_0; + result0 += M4(0.08854995, 0.055070054, -0.055015758, 0.021567572, -0.11257386, 0.5842653, -0.0069135004, 0.035885066, -0.1636142, -0.7459314, -0.15335257, -0.010262181, 0.027063252, 0.15648766, -0.055906493, -0.05358466) * inp_1_1_0; + result0 += M4(0.11930604, -0.041682154, -0.00046179755, -0.046034325, -0.039645318, 0.13995461, 0.06940307, 0.0001820343, 0.25363562, -0.08676501, 0.017460763, -0.0004489692, 0.23728251, 3.2216347e-05, 0.08378842, 0.11764811) * inp_1_2_0; + result0 += M4(-0.055466212, -0.04458063, 0.092873715, 0.038544595, -0.14927305, 0.005744432, 0.04113772, 0.019167574, 0.036161095, -0.33363798, 0.039980143, 0.045724906, 0.1571698, -0.0023385854, -0.07739416, -0.08512195) * inp_1_0_1; + result0 += M4(0.16172823, 0.19970015, -0.023721108, -0.08872322, -0.06674386, 0.20343593, 0.04090839, 0.12648766, 0.32689074, 0.07949466, 0.77407956, 0.27892375, 0.0955797, -0.3725432, 0.11103006, 0.12239984) * inp_1_1_1; + result0 += M4(-0.38779613, -0.01784853, -0.06963441, -0.0397871, -0.63667417, 0.11148345, 0.11130723, 0.080527484, 0.52029324, -0.077319995, -0.024498427, 0.018516215, 0.4087798, -0.3360343, -0.06909514, -0.045169) * inp_1_2_1; + result0 += M4(-0.14526395, 0.061370913, -0.043710344, 0.00422225, -0.009295979, 0.039428223, -0.037319314, 
-0.028051874, 0.011409687, -0.035212006, 0.044103246, 0.07119403, -0.029897586, -0.11282113, 0.06211073, 0.029109601) * inp_1_0_2; + result0 += M4(-0.09135313, -0.06939499, 0.07843825, 0.097238205, -0.074063435, 0.063782595, -0.0199373, -0.004162513, 0.23876402, 0.048402824, 0.011737331, 0.0032931073, -0.027612906, -0.060305446, 0.062121384, 0.02301595) * inp_1_1_2; + result0 += M4(0.3584948, 0.042655364, 0.036384244, 0.035225525, -0.08145385, 0.11985752, -0.030626295, -0.015063418, 0.05193084, -0.1576456, -0.013641532, -0.018054835, 0.014948068, -0.050316945, 0.0032408063, -0.014731045) * inp_1_2_2; + result1 += M4(0.32308826, 0.14756969, -0.25738078, -0.08276465, 0.0055609527, 0.063924596, -0.022715418, 0.049488764, 0.02728907, -0.13584627, -0.028130148, -0.25563374, 0.06999099, -0.050134107, -0.00291317, 0.0083785765) * inp_1_0_0; + result1 += M4(-0.12584916, -0.064904496, 0.12157791, -0.48184228, 0.105223686, 0.22921236, 0.07946646, 0.15504126, -0.2577391, -0.37409326, 0.120499425, 0.12071196, 0.1728067, -0.05941374, 0.08807147, -0.4108605) * inp_1_1_0; + result1 += M4(0.06337823, 0.15880086, -0.099946834, -0.114392236, 0.1709455, 0.5266816, -0.13256815, 0.16290307, 0.077787966, -0.7275313, 0.12744896, -0.41949978, -0.2116448, -0.9786744, -0.1913137, 0.1305901) * inp_1_2_0; + result1 += M4(0.16809405, 0.23277469, -0.058339387, 0.16693619, -0.038102575, -0.08851083, -0.02797779, 0.04274495, -0.20028922, 0.04436475, 0.013740321, 0.053681087, 0.048335608, 0.032794934, -0.07580541, -0.047612146) * inp_1_0_1; + result1 += M4(0.39193976, -0.035292547, 0.13096325, -0.5574103, 0.19815198, 0.09274524, -0.19850785, 0.21971238, -0.47791016, -0.37023675, 0.4238322, -0.085052595, -0.113550246, 0.019958464, -0.021854822, 0.1149585) * inp_1_1_1; + result1 += M4(-0.1860216, -0.23182867, -0.013862331, 0.608505, -0.06452028, 0.28561857, 0.04867474, 0.8088521, 0.0956222, -0.13799746, -0.20208229, -0.71716607, -0.041455816, -0.3238654, -0.42159647, -0.09715043) * inp_1_2_1; + 
result1 += M4(0.144747, -0.0021215512, -0.08473307, 0.27575985, 0.022519859, 0.039966933, 0.030069487, 0.04688268, -0.07048565, 0.03966074, 0.041769076, -0.047249142, 0.04115463, -0.008614794, -0.0038662087, -0.060845178) * inp_1_0_2; + result1 += M4(-0.05863267, -0.004415535, 0.12966555, 0.24865213, -0.014542384, -0.09795358, -0.032396104, 0.36158124, 0.05366866, 0.004015526, -0.0067248484, -0.38101593, 0.10725015, 0.012040856, 0.023441372, -0.069572) * inp_1_1_2; + result1 += M4(-0.09699632, 0.15249658, 0.12531403, -0.3328034, 0.0030972431, -0.19210772, -0.035863765, 0.45071825, -0.1378622, 0.08406743, -0.038835898, -0.20673525, 0.07893035, -0.054715797, -0.08594201, -0.2384776) * inp_1_2_2; + result2 += M4(-0.10114114, -0.17318277, 0.2932721, 0.37389088, 0.04549849, 0.021528823, -0.0007721709, -0.1394988, 0.1169677, -0.08984449, -0.01845354, 0.19966806, 0.13676907, -0.055648476, -0.018576363, 0.15089002) * inp_1_0_0; + result2 += M4(-0.08810577, 0.12845947, -0.022037087, 0.0713056, 0.026246676, -0.011513274, 0.0025324174, -0.082259364, -0.38545743, -0.2139153, 0.090562925, 0.1171016, 0.020509541, -0.14015672, -0.10214009, 0.030530844) * inp_1_1_0; + result2 += M4(0.005022763, -0.1465861, 0.17625697, 0.07496652, 0.06826987, 0.0644632, 0.05419615, 0.068747275, -0.01850323, 0.11714754, 0.015112417, 0.12423838, -0.21304888, -0.008375001, -0.2605828, -0.07451024) * inp_1_2_0; + result2 += M4(-0.15553749, -0.34850895, 0.39819357, 0.22360839, 0.054737903, 0.043017726, -0.008483063, -0.32135597, -0.11481686, 0.070533566, 0.32961053, -0.21778224, -0.13037261, -0.15484872, 0.07325692, 0.13470246) * inp_1_0_1; + result2 += M4(0.16771689, -0.3213681, -0.22630855, 0.2090357, 0.531006, -0.1665998, -0.55734706, -0.7523218, -0.090682685, 0.39249292, 0.21835013, -0.030219488, -0.1309162, 0.08927703, 0.40079466, 0.5337078) * inp_1_1_1; + result2 += M4(-0.047077622, 0.10245612, -0.11671954, -0.039104506, 0.045307513, 0.06795554, 0.37351328, -0.27963153, -0.10477316, 0.012324867, 
-0.17526017, 0.091815375, 0.38696444, 0.14811198, -3.5837452, 0.32542264) * inp_1_2_1; + result2 += M4(0.107646614, -0.12702344, -0.017104609, -0.10133434, 0.062007267, 0.02794019, -0.12198437, -0.20940919, -0.039446287, -0.04715233, -0.1441309, -0.00020755765, -0.050709587, 0.004934061, 0.066610165, 0.102615274) * inp_1_0_2; + result2 += M4(0.055885743, 0.20596245, 0.39146072, -0.10714875, 0.0031467446, 0.042376287, 0.20682976, -0.46683162, -0.029935647, 0.12960306, -1.4127905, 0.297964, -0.09073476, -0.10628283, -0.15256898, 0.28072315) * inp_1_1_2; + result2 += M4(-0.01828279, 0.055520464, -0.1621053, -0.100111686, 0.051583163, -0.023852073, -2.2467358, -0.43954092, -0.09379297, -0.004591499, 0.12515631, 0.13008092, -0.09091408, -0.10551536, 0.06935946, 0.267165) * inp_1_2_2; + result3 += M4(0.001121231, -0.116080426, -0.107541114, -0.19430692, 0.03921505, 0.032906685, 0.027074352, -0.006836348, -0.049477026, -0.020372244, -0.046985947, -0.017023273, -0.09252118, 0.00045681695, -0.05083715, 0.0002327922) * inp_1_0_0; + result3 += M4(0.17081107, 0.171148, -0.0045726285, -0.059847992, 0.102544926, -0.037925754, 0.023703234, -0.016200975, -0.068067454, 0.08789572, -0.045858927, -0.15687598, -0.030475779, 0.3318887, 0.092105575, 0.0339815) * inp_1_1_0; + result3 += M4(-0.3998928, 0.10400071, 0.0146760205, -0.079928584, -0.19716969, 0.05670307, 0.043592338, -0.05051233, -0.4631333, -0.111446775, 0.018087799, -0.13826992, -0.4345676, -0.28385895, -0.09957666, -0.09572035) * inp_1_2_0; + result3 += M4(0.025526108, -0.65327173, 0.050278466, -0.17187065, 0.02873274, -0.049899336, 0.034705333, 0.0026502954, -0.06212493, -1.0741755, 0.00038897205, -0.010395267, 0.030468699, 0.23473783, -0.009471362, -0.06953327) * inp_1_0_1; + result3 += M4(0.504466, 0.25026208, 0.14870858, -0.32623893, 0.043759342, 0.119388305, -0.01180262, 0.045797486, -0.15875077, -1.2279036, -0.13139768, -0.015066072, 0.15799735, 0.36802685, -0.02803516, -0.009432813) * inp_1_1_1; + result3 += 
M4(-0.07725342, -0.23465729, 0.01499422, 0.008299808, 0.080197036, -0.34347633, 0.021336041, 0.0015247765, -0.08134993, -1.0686655, 0.006038173, -0.17920311, -0.021682333, -0.5358267, 0.032830767, -0.16503559) * inp_1_2_1; + result3 += M4(-0.046656102, 0.4130624, -0.08565986, 0.044300493, -0.00034583264, -0.4603019, -0.00814766, 0.03564214, 0.011428414, 0.13996872, 0.03787744, -0.095117405, 0.027809668, -0.47052267, 0.053844158, 0.014706537) * inp_1_0_2; + result3 += M4(0.22918473, -1.2321059, 0.018048212, 0.14816047, -0.08237241, -0.8479986, 0.029264655, 0.045883853, 0.0739114, 0.3766523, 0.025773916, -0.1114103, 0.007666082, -1.6611128, 0.06056709, 0.013368697) * inp_1_1_2; + result3 += M4(0.070496134, -0.13917391, 0.01671008, -0.02739195, -0.055815388, 0.27967262, -0.026290499, 0.044944398, 0.04376932, -1.7079539, 0.014957602, -0.0064308657, -0.0064193904, -1.7823993, 0.020053854, -0.020422848) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.040685326, 0.019202568, 0.085796, 0.058194246, -0.12204348, -0.17381316, 0.14245704, 0.08302883, -0.11325476, -0.098387495, 0.011919243, 0.037839588, -0.019909292, -0.090265736, -0.029772518, 0.021361295) * inp_2_0_0; + result0 += M4(0.1350175, -0.17427717, -0.06368384, 0.04834391, -0.32116097, 0.22988725, -0.15886529, -0.057563584, -0.06309216, -0.19327909, 0.012142371, -0.019530954, 0.015532162, -0.09410268, 0.028791951, 0.019857269) * inp_2_1_0; + result0 += M4(-0.09504906, 
0.09759539, -0.037708234, -0.03228641, -0.04091912, 0.019800322, 0.037136376, -0.014333935, -0.04841269, 0.006947392, -0.058824852, -0.01539875, 0.031869523, -0.10707408, -0.0053441883, 0.037088424) * inp_2_2_0; + result0 += M4(-0.017622449, 0.1668945, 0.049392745, 0.023371896, 0.14355041, 0.1256854, -0.09238751, 0.6084779, -0.06498068, 0.031000355, 0.008305978, 0.06628111, -0.0059575806, -0.07780641, -0.019977028, 0.053992756) * inp_2_0_1; + result0 += M4(0.64182985, -0.24790576, 0.22865957, 0.15013333, 0.22472541, -0.41521356, 0.2727451, 0.1425033, -0.104730055, 0.07813815, -0.07939012, -0.004840109, 0.015298698, -0.40924573, 0.047924146, 0.050329972) * inp_2_1_1; + result0 += M4(0.5166944, -0.14351964, 0.002835482, -0.021241073, -0.044501536, -0.09123378, -0.0025898484, 0.088492654, -0.060680177, 0.17358576, -0.031046059, -0.023313675, 0.21963911, -0.32172033, -0.03685404, -0.056302886) * inp_2_2_1; + result0 += M4(-0.14249846, 0.1919643, -0.054700527, -0.030300103, 0.116425626, 0.030547854, 0.29164848, 0.24575163, 0.113290496, 0.081504695, 0.11042106, 0.052331973, 0.051052187, -0.035564587, 0.10448482, 0.04722249) * inp_2_0_2; + result0 += M4(-0.20679013, -0.1357482, 0.0670046, -0.0044386904, -0.103470646, -0.026976867, -0.019741116, -0.096597396, 0.22226769, 0.039062824, 0.09040389, -0.0021132238, 0.0815542, -0.4116235, 0.30562884, 0.15595485) * inp_2_1_2; + result0 += M4(0.31853187, -0.0028201935, -0.0018939296, 0.000118292395, -0.03563755, 0.08407976, 0.047397576, 0.0067874063, -0.07854643, 0.08589363, 0.0595104, 0.033278853, 0.4471929, -0.1569817, 0.082737334, 0.017763961) * inp_2_2_2; + result1 += M4(-0.051908046, 0.04940803, 0.025206795, -0.08582518, 0.105329625, -0.13497052, -0.086282, 0.3592072, -0.021779265, 0.01662948, -0.029943835, 0.037047792, 0.01232303, 0.011557858, 0.011784409, -0.03676768) * inp_2_0_0; + result1 += M4(-0.18673477, -0.24641654, 0.33000603, 0.11542049, -0.30434307, 0.5306456, -0.011384738, 0.45843646, -0.20390716, 0.10540199, 
0.016882136, -0.031867232, 0.008356345, -0.13086288, -0.041344773, -0.0036602747) * inp_2_1_0; + result1 += M4(0.13682915, 0.0036812855, 0.012057137, 0.23811786, 0.07334074, -0.08856756, 0.04595943, 0.1599024, -0.18250804, 0.13405186, 0.04430016, 0.051927723, 0.056383044, -0.027024115, 0.038770597, -0.07303996) * inp_2_2_0; + result1 += M4(0.15318306, -0.12760171, 0.0450346, -0.07374663, 0.07834138, 0.49790388, 0.2915172, -0.09512411, -0.19560269, 0.14700219, 0.07985623, 0.10233619, -0.115605205, 0.053538296, 0.052413, -0.01793204) * inp_2_0_1; + result1 += M4(0.25549623, 0.79109895, -0.15794283, -0.4189323, -0.065393336, -0.88975954, 0.08374594, -1.1873229, -0.016332334, 0.15877184, 0.110330045, 0.22505662, -0.10667615, 0.2046037, -0.034100883, -0.14114152) * inp_2_1_1; + result1 += M4(-0.029152432, 0.19976863, -0.0067866994, 0.1554457, 0.07682561, 0.13939528, -0.11835224, -0.1414863, -0.24614279, 0.087009184, 0.2559374, -0.06699069, -0.085265845, 0.18493001, -0.013739076, -0.42368194) * inp_2_2_1; + result1 += M4(0.118983015, -0.0572679, 0.000318014, 0.007505368, -0.0299957, 0.14891346, 0.12727791, 0.54379475, -0.07486102, 0.117346324, 0.09264876, 0.19114546, -0.051801726, 0.09137759, 0.076237656, 0.007558985) * inp_2_0_2; + result1 += M4(-0.0016464916, 0.092834815, -0.07756129, 0.4916174, 0.15548897, 0.41225353, 0.033371974, 0.05942626, -0.22053158, 0.1703363, 0.018514646, 0.014471713, -0.0042645177, 0.11441778, 0.20387441, -0.19286348) * inp_2_1_2; + result1 += M4(0.045293007, 0.056085728, -0.04795258, -0.22916062, 0.083087645, -0.03853095, 0.012642993, -0.11186545, -0.11702325, 0.21539073, 0.1151789, 0.12692805, 0.048481543, 0.073370904, -0.1511963, -0.4363887) * inp_2_2_2; + result2 += M4(0.22008175, 0.006780327, 0.005894409, 0.10082709, -0.044127602, 0.05716219, 0.0787319, -0.08502259, -0.05248802, 0.10199217, 0.12158407, -0.12550665, -0.06999623, 0.022333184, 0.014213934, 0.11376998) * inp_2_0_0; + result2 += M4(0.19652066, 0.36215308, 0.09469319, 
0.06413764, 0.05205069, -0.016372532, 0.1787366, 0.0877199, -0.08429393, 0.21526356, 0.14981632, -0.1523603, -0.0466523, -0.057867594, 0.04867976, 0.069361486) * inp_2_1_0; + result2 += M4(-0.2724398, 0.19309507, 0.09607288, 0.1206929, 0.07003121, 0.09855454, -0.025575627, 0.009461037, -0.19269364, 0.16064173, 0.14619134, -0.08403769, 0.04281966, 0.055891816, -0.015193178, 0.02850246) * inp_2_2_0; + result2 += M4(0.052729435, 0.018342854, 0.020109378, 0.049135573, -0.27488902, -0.20894177, 0.08238209, 0.12393387, -0.05489923, 0.12008817, 0.13158463, -0.15824428, -0.18391077, 0.03304128, 0.04371131, 0.08666164) * inp_2_0_1; + result2 += M4(-0.07128967, 0.31714946, 0.08881361, -0.08835794, 0.041942906, -0.07898635, 0.09270609, -0.17499882, -0.1766717, 0.17561086, 0.1755127, -0.23229517, -0.46135002, 0.109490745, 0.11468097, 0.04771001) * inp_2_1_1; + result2 += M4(-0.049790166, -0.058075182, -0.072881676, 0.03250728, -0.009275402, -0.010968189, -0.1080809, -0.05768197, -0.26625115, 0.2584098, 0.23041652, -0.2520977, -0.21001528, 0.2393364, 0.06696907, 0.0046516233) * inp_2_2_1; + result2 += M4(0.23925087, 0.0680813, 0.078727536, -0.022581024, -0.095084116, 0.057004742, 0.3138766, 0.0392872, -0.14981374, 0.07913679, 0.1031623, -0.040174864, -0.10357394, 0.07672665, 0.02854845, 0.047957916) * inp_2_0_2; + result2 += M4(-0.08796459, 0.21651562, 0.2702043, -0.1740451, -0.27310392, 0.09648933, -0.3957877, -0.12951781, -0.021011474, 0.19034348, 0.11784486, -0.37994373, -0.5231188, 0.13480479, 0.19004749, 0.08633311) * inp_2_1_2; + result2 += M4(-0.09953264, -0.057516363, 0.009389417, 0.14430472, 0.032242656, -0.066502385, 0.28266618, 0.09512168, 0.09544029, 0.07469234, -0.004258793, -0.33108658, -0.46292925, 0.060545143, -0.26074094, 0.08396749) * inp_2_2_2; + result3 += M4(-0.07606638, -0.063000284, 0.09598554, 0.104964264, -0.040376373, -0.035215527, -0.0042664115, 0.1667837, 0.063100494, -0.018531347, 0.029744422, -0.075527735, 0.03385397, -0.021013837, -0.017285448, 
-0.08043407) * inp_2_0_0; + result3 += M4(-0.26622432, -0.03477078, 0.03494469, 0.04049817, 0.039655168, 0.08699442, -0.050543044, 0.22162461, 0.069138594, -0.050977368, -0.022323107, -0.05545389, 0.015020561, 0.026642598, 0.021018691, -0.02690074) * inp_2_1_0; + result3 += M4(-0.032372512, -0.08706534, -0.015817178, -0.08862899, 0.013261543, 0.002546997, 0.0176546, 0.008601677, 0.049245533, 0.04126535, -0.036267422, -0.1031398, 0.008470616, 0.015351556, 0.019256743, -0.016997326) * inp_2_2_0; + result3 += M4(0.0823704, 0.2817941, 0.08857372, 0.10827305, -0.12110614, 0.078699365, 0.23771732, 0.094654255, -0.042905893, 0.0771783, 0.0006978189, 0.029819358, -0.0036443584, -0.020106701, -0.01071964, -0.01958439) * inp_2_0_1; + result3 += M4(0.48942843, 0.27745262, 0.36281285, -0.028398752, 0.24205421, 0.25413743, 0.13406385, -0.018467713, -0.122251295, 0.0134095885, -0.074013464, -0.11212041, 0.00941324, -0.03942664, -0.008397736, -0.008076683) * inp_2_1_1; + result3 += M4(0.20749235, 0.21867277, 0.004653491, 0.03703782, 0.023102382, 0.07013684, -0.016614152, 0.028991466, 0.034551147, -0.079350136, -0.006204742, 0.061720155, 0.061270434, 0.028488534, -0.010227663, 0.07652426) * inp_2_2_1; + result3 += M4(-0.02412553, 0.0037526242, -0.0668934, -0.054726753, -0.016596323, -0.30688837, 0.049872916, 0.06895975, -0.017586173, 0.3452859, 0.0950053, -0.018741097, -0.048104398, 0.017518392, 0.0949136, 0.028228115) * inp_2_0_2; + result3 += M4(0.013070116, -0.5232367, 0.058542944, 0.050612744, 0.102370545, -0.7376758, 0.08592539, 0.07714531, 0.013114515, -0.0074695004, 0.02178679, -0.15938848, 0.020757858, -0.48573405, 0.32483444, -0.023649752) * inp_2_1_2; + result3 += M4(0.046947844, -0.3603543, 0.07617314, -0.04335851, 0.05356554, -0.04626905, 0.0144886095, 0.05473025, 0.07629946, 0.89244694, 0.020768393, -0.22464417, -0.0074107046, -0.87721777, 0.052553397, -0.090482995) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = 
inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.0766504, -0.09879246, 0.0396668, 0.017115591, -0.010305095, 0.19718798, -0.071258314, 0.0664194, -0.046132524, 0.062901266, 0.080579214, -0.004289638, 0.12400763, -0.0585527, 0.015766127, -0.0032669778) * inp_3_0_0; + result0 += M4(-0.020116923, -0.1888125, 0.059224084, 0.08714167, 0.4200794, -0.22349876, 0.11738465, -0.08908094, -0.12611064, 0.28323323, -0.0006456269, 0.055735517, 0.09580583, -0.03230914, -0.06237639, -0.0038313572) * inp_3_1_0; + result0 += M4(-0.015171148, -0.011160129, 0.039504074, 0.034451094, -0.33802676, -0.20952617, -0.09564441, -0.018064525, -0.14134207, 0.13155054, 0.0101029305, 0.033066314, 0.16871352, -0.0057818503, -0.0054384056, -0.03857239) * inp_3_2_0; + result0 += M4(-0.059774876, -0.23344266, 0.1916854, -0.41434157, 0.1374049, 0.28787696, -0.029185118, -0.033947468, -0.26908988, 0.10820922, 0.012907376, 0.06392264, 0.035846196, -0.10413254, 0.02084434, -0.10425743) * inp_3_0_1; + result0 += M4(-0.08171906, 0.35755453, 0.059284337, 0.0021495572, 0.020121615, -0.08626559, 0.16330962, 0.08871405, -0.3114198, 0.0147190485, 0.097635314, 0.13202067, -0.31036153, 0.011890783, 0.1266637, 0.5408988) * inp_3_1_1; + result0 += M4(0.17335528, -0.015333025, -0.008093493, -0.033920698, -0.02464884, 0.15351357, 0.036093365, 0.03906647, -0.26172918, 0.21810411, 0.0920626, 0.07798469, -0.16078314, 0.09534679, -0.08410649, -0.104074486) * inp_3_2_1; + result0 += M4(0.09742962, 0.22259852, -0.0017837521, -0.12143848, 0.050734755, 0.22144549, -0.052987207, 
-0.049092356, -0.14100018, 0.013511058, 0.043222908, 0.061185308, -0.11384891, -0.0965968, 0.010946058, 0.12053483) * inp_3_0_2; + result0 += M4(-0.42434677, 0.23842174, 0.030445544, 0.060407106, 0.07218617, 0.03208096, -0.071624324, 0.0028445057, -0.15972686, -0.002714478, 0.07611455, 0.047295272, 0.07009659, 0.13138281, 0.05384319, 0.043430082) * inp_3_1_2; + result0 += M4(-0.0030897667, -0.040491477, -0.045542356, -0.037420522, 0.0134954015, 0.015531995, 0.01853244, -0.033848308, -0.19752295, 0.054179564, 0.04510645, 0.049722757, 0.20566362, -0.05376662, 0.05160025, 0.082582206) * inp_3_2_2; + result1 += M4(-0.071607076, -0.01151562, 0.03144804, 0.06795253, 0.035164766, 0.09399475, 0.046911433, -0.105985604, -0.027395945, 0.08368641, -0.03945179, 0.06652106, -0.009234248, 0.0311306, 0.015887855, 0.013628602) * inp_3_0_0; + result1 += M4(-0.009326969, -0.5451517, -0.06685787, -0.2203032, -0.04059302, 0.50291795, -0.23659435, -0.16453515, -0.019921033, -0.08829904, 0.022711797, 0.04344343, 0.080518015, -0.017371742, -0.12549073, -0.1885871) * inp_3_1_0; + result1 += M4(0.06340467, -0.045215208, -0.011862773, -0.17774045, 0.03218759, -0.21211256, 0.24903278, 0.16339235, -0.0889197, 0.26705155, 0.026684994, 0.20748319, 0.21641175, -0.7041937, -0.12879434, 0.034087796) * inp_3_2_0; + result1 += M4(0.0043784324, -0.1104343, 0.0051153954, 0.3049556, 0.053384513, -0.083815835, -0.077591434, 0.06180734, 0.056226797, -0.060590953, 0.023422653, -0.021765847, 0.06481506, 0.038366422, -0.03140693, -0.04423246) * inp_3_0_1; + result1 += M4(0.14104234, -0.42322505, 0.58770734, 0.02756258, -0.06619171, 0.039784182, 0.09670571, -0.11221906, 0.090540856, 0.21492137, 0.0033946468, -0.054638606, -0.26438943, -0.40769553, 0.58308834, 0.011558848) * inp_3_1_1; + result1 += M4(0.038047027, -0.09069749, -0.03155484, -0.4204703, 0.112935, 0.15827107, -0.1785291, 0.10565701, 0.03801543, 0.13049063, 0.18165028, 0.40097496, 0.2054982, -0.65470904, -0.17466919, -0.74355334) * inp_3_2_1; + 
result1 += M4(0.085544996, -0.17516859, -0.09178954, -0.47846717, 0.081615664, 0.03366028, -0.008114159, 0.10606008, 0.010830146, 0.0031332439, 0.06839305, 0.0031851435, -0.054583967, -0.022798512, 0.062276945, -0.01278501) * inp_3_0_2; + result1 += M4(-0.03308873, 0.18022367, 0.42132232, -0.31112126, 0.13086608, 0.16092083, 0.032381505, -0.061450902, 0.09202975, 0.20787741, 0.008323081, 0.117322624, 0.09185017, -0.079603694, 0.11225445, -0.27967831) * inp_3_1_2; + result1 += M4(-0.03957761, -0.06413558, -0.020417236, -0.094888, 0.16328244, 0.29664227, 0.04430604, -0.067853294, 0.08792947, 0.15714999, 0.05795048, 0.101340644, -0.002680674, -0.050374318, 0.00048598138, -0.35752374) * inp_3_2_2; + result2 += M4(-0.060640704, -0.15616873, 0.07173303, 0.029078547, -0.30562615, -0.041268278, 0.20111884, 0.41848227, 0.06553992, -0.040807955, 0.043503594, -0.24304286, -0.0060193194, -0.012492793, -0.081317544, -0.059194572) * inp_3_0_0; + result2 += M4(-0.04040787, -0.16354334, -0.17756464, -0.015088575, 0.23186228, 0.05988759, 0.14465544, 0.16085775, 0.18045077, -0.105936624, 0.044305015, -0.17218077, 0.04191084, -0.02523788, -0.23255497, -0.04335376) * inp_3_1_0; + result2 += M4(-0.006653806, -0.01155372, 0.013032641, 0.004019512, -0.017225059, -0.34220526, 0.094255075, 0.12780511, 0.06525166, -0.07204751, -0.028964553, -0.08786299, 0.01816411, -0.084005155, 0.00058218115, -0.073107585) * inp_3_2_0; + result2 += M4(0.15325405, -0.18560395, 0.1131455, 0.06522893, 0.07688168, 0.054853395, -0.063450925, 0.10854047, 0.02840006, -0.0005397363, 0.05471179, -0.54284006, -0.017266683, 0.0016633559, -0.02881508, -0.05636048) * inp_3_0_1; + result2 += M4(0.13207924, 0.2558923, -0.056082908, 0.13571228, 0.083247505, -0.016255124, -1.6765794, 0.026998602, 0.35833323, -0.25714707, -0.06403621, -0.259124, 0.0952539, 0.11210623, -0.12490101, 0.07662671) * inp_3_1_1; + result2 += M4(-0.021977363, -0.0713963, 0.123100124, 0.052161366, -0.20624985, -0.1925915, 0.00520385, 0.110770926, 
0.17356953, 0.020864306, 0.11559725, -0.079656266, 0.021110583, -0.314465, 0.04681424, 0.1371713) * inp_3_2_1; + result2 += M4(0.30375904, -0.17828616, -0.17909098, 0.013856255, -0.06746472, 0.003626132, 0.19023083, -0.05196694, 0.15099213, -0.06683428, 0.08304773, -0.12654506, 0.13353965, 0.044826567, -0.059660748, 0.013467923) * inp_3_0_2; + result2 += M4(0.08426794, -0.22384238, 0.19148509, 0.05827365, 0.018852733, 0.1217786, -0.014563931, 0.021475017, 0.057863247, -0.040182285, 0.58330965, -0.22231136, 0.050184354, 0.12184998, -2.07873, -0.018987421) * inp_3_1_2; + result2 += M4(-0.020585502, -0.0018608408, -0.14940372, -0.011206775, -0.052012913, -0.021318972, 0.27726486, 0.13465387, 0.18750753, 0.03791731, 0.040556125, -0.11679988, 0.19256034, -0.053861372, -0.028166458, -0.14577334) * inp_3_2_2; + result3 += M4(0.1110923, -0.023193434, 0.08967661, 0.0026217531, -0.05411397, 0.00651578, -0.031594105, -0.09873143, 0.041768722, 0.04100008, 0.036410563, 0.039395727, -0.011185455, 0.01551338, 0.023943875, 0.015728712) * inp_3_0_0; + result3 += M4(-0.046828236, -0.07020306, 0.00973051, 0.0005743727, 0.1787815, 0.22740924, 0.11705792, -0.0115812505, 0.057035774, -0.0070796604, 0.014894732, 0.024319354, -0.047951322, 0.03793726, -0.10123618, 0.014985628) * inp_3_1_0; + result3 += M4(0.046608195, 0.026250076, 0.0219202, -0.009327337, -0.008816733, -0.082837604, -0.017703755, 0.2030575, 0.056901768, -0.0084842825, 0.012729636, -0.08129811, 0.019200847, 0.032389343, -0.0009601458, 0.013909917) * inp_3_2_0; + result3 += M4(-0.48060805, -0.23521748, 0.34547088, -0.040182896, -0.038119644, -0.18511339, -0.04657396, -0.027486663, 0.08065303, 0.12756409, 0.036840674, 0.10895672, 0.047392767, -0.0069511794, 0.094890505, 0.052782986) * inp_3_0_1; + result3 += M4(0.12509732, 0.03977793, -0.03640901, 0.50160116, -0.15279287, 0.318791, 0.13314092, -0.1444542, -0.044084627, 0.084593356, 0.078950174, 0.16075894, -0.03516418, -0.2527174, -0.036211584, 0.47695947) * inp_3_1_1; + 
result3 += M4(-0.12992151, 0.043950334, 0.03127988, 0.042125385, -0.19439988, -0.25358784, -0.048711743, -0.20638546, 0.13232373, 0.0047641313, 0.08614499, -0.0324139, -0.6161785, 0.08246424, 0.15840074, -0.26129988) * inp_3_2_1; + result3 += M4(0.011187205, 0.42798644, 0.008353978, -0.044744402, -0.0177301, 0.25025943, -0.041332502, -0.11565288, 0.010321948, 0.536089, 0.03314616, 0.008272843, -0.008212299, 0.09620918, -0.008280064, 0.11386974) * inp_3_0_2; + result3 += M4(-0.061153438, 1.292626, -0.014955989, 0.20095024, -0.027531676, -0.7807742, -0.11907358, -0.09337009, 0.03249329, -0.62426835, 0.0146850245, 0.026055751, -0.04021995, -1.9652365, 0.088370696, 0.11366978) * inp_3_1_2; + result3 += M4(0.04068244, 0.35956866, -0.024620563, -0.029591298, 0.0932946, 0.34455878, 0.011712873, -0.20691097, -0.004321678, -0.2839504, 0.010122162, 0.025036965, -0.02681107, -2.100412, 0.0069077644, 0.06897316) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-3-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_2 +//!SAVE conv2d_3 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; 
+void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.0017480821, -0.013207066, -0.011228051, -0.0030521527); + V4 result1 = V4(-0.0059395116, 0.02963556, 0.0096618235, 0.02099762); + V4 result2 = V4(0.0037767761, 0.008920694, -0.019380828, 0.009338229); + V4 result3 = V4(-0.010227559, -0.02027447, 0.025720553, 0.0076178582); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.013742333, -0.31396708, 0.26787847, 0.072659366, 0.11329625, 0.09537591, 0.033292115, -0.017220195, 0.001464037, 0.008237256, -0.11971067, 0.017268868, 0.09323862, 0.09715007, 0.060889743, -3.5066485e-05) * inp_0_0_0; + result0 += M4(-0.50970757, -0.5762601, 0.20819591, -0.17460805, 0.11446012, -0.15912902, -0.121048756, -0.047206264, -0.08427633, 0.0025400645, -0.33599967, 0.10243455, 0.0020691168, -0.3237394, 0.13666141, 
-0.13717362) * inp_0_1_0; + result0 += M4(-0.20074122, -0.041116606, -0.07211998, 0.03917335, 0.005626392, 0.00093446556, 0.04984837, 0.052918322, -0.095496096, 0.02798376, -0.16388294, -0.09691992, -0.009316182, 0.002156926, 0.076914035, -0.0018362058) * inp_0_2_0; + result0 += M4(-0.04646638, 0.04301821, -0.213666, -0.068135574, 0.049697164, 0.13429289, -0.19906549, 0.32909, 0.07195283, -0.112840325, 0.03280211, 0.049278136, -0.10621306, -0.10757828, 0.021037694, 0.20384435) * inp_0_0_1; + result0 += M4(-0.077998064, 0.22377425, -0.3773312, -0.088498555, 0.0053320946, -0.058212977, 0.080621, -0.11171977, -0.21263243, 0.011046657, 0.35355136, -0.06552714, 0.09067343, 0.3376479, 0.34425646, -0.43196526) * inp_0_1_1; + result0 += M4(0.061848424, 0.06426705, -0.030383265, 0.03173913, -0.16706698, 0.010781343, 0.21188083, -0.2265141, -0.01627768, -0.14701325, 0.082368046, -0.05859685, -0.04978609, 0.19023238, -0.03965014, 0.29524118) * inp_0_2_1; + result0 += M4(-0.0306261, -0.04085749, -0.23889224, -0.050767697, -0.04013987, -0.13312452, 0.19715339, 0.26171264, 0.0013510226, -0.013842771, 0.027681874, -0.03974694, -0.19338731, 0.04583281, -0.046023604, 0.041369166) * inp_0_0_2; + result0 += M4(-0.10139793, 0.04532661, -0.0342177, -0.009461673, 0.15787649, 0.12668087, -0.13030411, 0.090191655, 0.18736099, 0.04283658, 0.12219039, 0.027710259, 0.024654623, 0.01619275, -0.35501233, -0.051116623) * inp_0_1_2; + result0 += M4(-0.12528433, -0.026363146, -0.16625732, -0.08191529, 0.12736906, 0.26764688, 0.10838407, -0.11167493, 0.059556503, 0.056794092, 0.06564879, 0.0980191, -0.11926366, -0.20925348, -0.15895343, -0.0804178) * inp_0_2_2; + result1 += M4(0.28437835, -0.002334728, -0.057142854, -0.13161235, -0.037597105, -0.0081220865, 0.033518326, 0.16829304, 0.048631717, -0.05146907, 0.01925202, -0.08801352, 0.031352233, 0.06670703, 0.0057261786, -0.07080493) * inp_0_0_0; + result1 += M4(0.20693526, -0.0027875837, -0.024844248, 0.003722317, 0.12421726, -0.071424775, 
0.017107086, -0.3732517, 0.03228796, 0.026641833, 0.014621808, 0.003753755, 0.011267291, 0.012458715, 0.021493524, -0.118005805) * inp_0_1_0; + result1 += M4(-0.034746096, -0.03172964, -0.014664306, -0.012086779, 0.1931416, -0.03533445, 0.01723795, -0.5334721, -0.07718448, -0.033954136, 0.025482401, -0.18039058, 0.0783087, 0.09332574, -0.033299036, 0.15519528) * inp_0_2_0; + result1 += M4(-0.329095, -0.13896094, -0.17261124, -0.016496744, 0.09107782, -0.01243064, 0.06770809, 0.30866104, -0.0288415, 0.028245337, 0.023785003, 0.03607363, -0.011177616, 0.1798321, -0.04502171, 0.13481946) * inp_0_0_1; + result1 += M4(-0.34093675, 0.07681657, 0.0021810206, -0.06599798, -0.22647366, -0.16830544, -0.08243902, -0.30915564, 0.04177963, 0.5109498, 0.062553845, -0.034190703, 0.04370762, 0.30578157, -0.073416814, -0.06466905) * inp_0_1_1; + result1 += M4(0.04676398, -0.028934004, 0.025172938, 0.05854845, -0.12591504, -0.011103147, 0.028433567, -0.010902395, -0.15242963, 0.008639989, -0.018708037, 0.13760155, 0.19433762, 0.0031262431, -0.004067586, -0.39977702) * inp_0_2_1; + result1 += M4(-0.18624696, -0.072138086, -0.108983666, 0.09679024, 0.082618475, -0.03762175, 0.08016512, 0.21064514, -0.049806964, 0.03683179, 0.12170394, 0.04623598, -0.050608203, -0.04886757, -0.14925289, -0.23452131) * inp_0_0_2; + result1 += M4(0.06740208, 0.03922189, -0.024193132, -0.023183608, -0.10275763, 0.026307985, 0.06166279, -0.0033073507, 0.103257954, -0.003347554, 0.07212322, 0.056260653, -0.13365982, 0.05859138, -0.16502652, 0.19636813) * inp_0_1_2; + result1 += M4(-0.10216632, 0.008577115, 0.0034097305, -0.03322281, 0.031984664, 0.03745504, -0.12077493, 0.10455194, 0.072156295, 0.0039019848, -0.08020873, 0.14048693, -0.1509022, -0.0042885765, 0.15331472, -0.262448) * inp_0_2_2; + result2 += M4(-0.16221876, 0.057853937, -0.02687466, -0.02580708, -0.039356407, 0.026669305, -0.016994065, -0.0018950413, -0.03317146, 0.111001246, -0.08564103, 0.036529347, 0.0069948873, -0.004476116, 0.037428625, 
-0.032405715) * inp_0_0_0; + result2 += M4(-0.024450691, -0.18772535, -0.03373765, -0.02393417, 0.08165734, 0.04839238, -0.04392691, 0.060463354, 0.08244979, -0.030043233, -0.17591904, -0.105013795, 0.09993796, -0.07685819, 0.18041363, 0.068260804) * inp_0_1_0; + result2 += M4(-0.07076884, 0.007816242, -0.04245959, 0.03505174, -0.017449595, 0.10012675, -0.08593324, 0.026215378, -0.12722993, 0.11531461, -0.044889923, -0.07379326, 0.102622665, -0.13516678, 0.027440194, -0.025661053) * inp_0_2_0; + result2 += M4(-0.2417654, 0.532874, -0.1792782, -0.016072318, 0.12632751, -0.1394212, -0.104871325, -0.2143921, 0.009683901, -0.13191098, -0.072481215, 0.14556748, 0.14193138, -0.084580764, 0.02502378, -0.1356686) * inp_0_0_1; + result2 += M4(-0.070205666, -0.27398396, 0.07058423, -0.1282003, -0.19091621, -0.00998729, 0.009443734, -0.22386715, 0.4032219, -0.1489337, -0.036794376, 0.010098983, -0.17007609, -0.1622153, 0.5655884, 0.09552588) * inp_0_1_1; + result2 += M4(-0.05603438, 0.04169446, 0.012783244, 0.05043658, 0.053274922, -0.09159566, 0.062812835, -0.07592551, 0.033113863, -0.05460731, 0.06573498, 0.040921483, -0.07896506, 0.1589944, -0.1188062, 0.107915975) * inp_0_2_1; + result2 += M4(-0.14555661, -0.02623733, -0.010950724, -0.0029378114, 0.16225207, -0.14775589, 0.043020986, -0.12051408, 0.043429397, 0.05345529, -0.038897146, -0.010908579, -0.021893447, 0.097037636, -0.012969422, 0.13148984) * inp_0_0_2; + result2 += M4(0.0028671154, -0.13369134, 0.009956911, -0.052492116, -0.029130064, 0.58226454, -0.011425127, -0.013592997, 0.021517135, -0.008963109, 0.02541666, 0.017184312, -0.16393614, -0.110572346, 0.0063540046, -0.31564647) * inp_0_1_2; + result2 += M4(-0.033714134, -0.06151679, 0.026827423, 0.03188713, 0.042517334, -0.025831262, 0.04598944, -0.08595885, -0.003915388, 0.09385612, -0.038792178, 0.0895971, -0.09253884, -0.021541333, 0.086981736, -0.10932342) * inp_0_2_2; + result3 += M4(-0.08393953, -0.22956555, 0.011609948, 0.009277218, 0.039219324, 
0.04410125, -0.01109496, -0.05332186, 0.03279442, -0.046855666, -0.057603728, -0.006750665, 0.030960107, -0.03515314, 0.05504648, 0.015092096) * inp_0_0_0; + result3 += M4(0.13919544, 0.1411814, 0.042253297, 0.0037964282, -0.040356793, 0.12674251, -0.015921002, 0.053343415, 0.0379153, 0.20943864, 0.0771062, -0.030640893, 0.011386835, 0.0866107, 0.023407476, 0.058897074) * inp_0_1_0; + result3 += M4(0.052371733, -0.3991684, -0.07190776, 0.0007726265, -0.07851629, 0.18438594, -0.06764928, -0.5050416, -0.100258075, -0.09006746, -0.015903315, -0.5025817, 0.0031620082, -0.08231843, 0.05990831, 0.0768073) * inp_0_2_0; + result3 += M4(-0.06402679, -0.6725876, -0.10156491, -0.09864526, 0.02643018, 0.3727122, 0.008444335, -0.08263052, 0.018349787, 0.044862207, 0.0880957, 0.004279047, 0.054860793, -0.048947245, 0.07504498, -0.035847556) * inp_0_0_1; + result3 += M4(0.11614327, -0.30468974, 0.0444558, -0.028236007, -0.067298174, 0.29058734, -0.14453624, -0.099617906, -0.22497794, -0.18741079, 0.18873163, 0.07804972, -0.05881788, -0.22348139, -0.108909026, -0.04795675) * inp_0_1_1; + result3 += M4(0.058302045, -0.0505233, 0.0009843127, -0.043714497, -0.21508288, 0.30368665, 0.00013597557, 0.18061589, 0.039270017, 0.005499783, 0.071200795, 0.14625464, 0.09535705, 0.04838145, -0.056300323, -0.32017702) * inp_0_2_1; + result3 += M4(-0.014569219, -0.14319171, -0.044703428, -0.04628076, 0.036289185, 0.11027814, -0.023670927, 0.027902605, -0.016727578, -0.0030887127, 0.058026824, 0.03686519, -0.028439755, -0.12083449, -0.030791108, -0.016661761) * inp_0_0_2; + result3 += M4(0.007907899, -0.22081214, 0.021030104, -0.02149127, -0.0752811, 0.2893503, -0.033847194, -0.0119202975, 0.029012432, 0.024946356, 0.07516003, 0.08124122, -0.01716123, 0.031961255, -0.20085806, -0.051188) * inp_0_1_2; + result3 += M4(-0.0072488342, -0.20686667, 0.015600979, -0.041693658, 0.0012413642, 0.15499248, 0.04859961, 0.0626556, 0.020021334, -0.12558144, -0.017673044, -0.015979042, -0.050852936, 
-0.008009429, 0.0006964212, -0.031111179) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.050834622, 0.13558929, 0.069609776, 0.0836248, 0.16258588, -0.1463772, 0.10431995, 0.071166046, -0.09360978, -0.030868849, -0.089349106, -0.05845485, -0.052687116, -0.019358756, 0.13166283, 0.047010917) * inp_1_0_0; + result0 += M4(0.1834363, -0.06733706, 0.19551572, 0.065064564, -0.10159622, -0.44030255, 0.17712298, -0.15667069, 0.018854847, 0.27443087, -0.20249093, 0.059142705, -0.0146979755, 0.107905276, 0.3368964, -0.14103155) * inp_1_1_0; + result0 += M4(0.03400846, -0.020920517, 0.054308336, -0.06452696, -0.10025594, -0.11509778, 0.0049686376, -0.029111736, 0.08407605, 0.14476754, -0.044888042, 0.05088734, 0.010941878, -0.08833402, -0.02657171, -0.074516624) * inp_1_2_0; + result0 += M4(0.11975449, -0.09650759, 0.063281395, -0.022790521, -0.5575803, -0.09101216, 0.013859138, -0.013325497, 0.03603514, 0.030577073, -0.011164303, -0.18578358, -0.01083901, 0.24841565, -0.13914369, -0.05354659) * inp_1_0_1; + result0 += M4(-0.26356968, -0.54071015, -0.4976373, -0.043348465, -0.22630574, -0.19664787, -0.32047185, 0.016972514, 0.46792364, -0.034396674, -0.08538839, 0.102404736, -0.15684944, 0.40727407, -0.12092723, -0.2929467) * inp_1_1_1; + result0 += M4(0.1258391, -0.2243027, -0.13347167, 0.11358319, -0.08303393, -0.14977665, 0.0890761, -0.41722098, 0.15439256, 0.030496476, 0.012219409, 0.19310397, 0.26037794, 0.027789328, 0.08922465, 
0.089834034) * inp_1_2_1; + result0 += M4(0.09877862, 0.05284025, -0.027668688, -0.001652929, -0.32570714, 0.021121345, -0.3423895, 0.079213284, 0.33848628, -0.049122784, 0.04044871, -0.06866454, 0.09534095, -0.0642997, 0.07336694, -0.030166717) * inp_1_0_2; + result0 += M4(-0.014141151, 0.40663037, -0.03562297, 0.00014230338, -0.31842545, 0.03633864, -0.36178958, -0.042703845, -0.1249328, -0.028372467, 0.40126094, 0.070099086, 0.08341997, -0.15070833, -0.0008065649, -0.09727535) * inp_1_1_2; + result0 += M4(0.027538782, 0.07063461, 0.086960584, -0.0014761664, 0.14140855, 0.13613716, -0.07045416, -0.18241577, 0.0012894623, -0.16937791, 0.14318486, 0.12240525, -0.109862946, 0.038892377, -0.059320077, 0.018929685) * inp_1_2_2; + result1 += M4(0.031230053, 0.054024037, 0.015748722, 0.19641443, 0.04458012, 0.0074059726, -0.024924599, -0.22967412, -0.065919496, 8.747364e-05, 0.00095081795, 0.079052135, 0.044639762, 0.034701884, -0.070215575, -0.15965857) * inp_1_0_0; + result1 += M4(-0.093358554, -0.050979193, -0.06365453, -0.21407472, 0.056124493, -0.031864822, -0.001345247, 0.26996806, -0.15269825, 0.029912075, -0.014851082, 0.05646165, -0.1369963, -0.005340246, -0.00034040198, -0.87173325) * inp_1_1_0; + result1 += M4(-0.053627335, -0.05403443, 0.0053771413, -0.033885114, 0.07943473, -0.049489744, 0.01970428, -0.019735165, -0.16704302, -0.029533712, -0.012479018, 0.046492025, -0.122892916, 0.016930556, -0.0114216255, -0.15970671) * inp_1_2_0; + result1 += M4(0.108939044, 0.06477513, 0.102464, 0.047452956, -0.12532373, -0.018778939, -0.1330631, -0.09594444, -0.009711892, 0.08322932, 0.097861886, 0.087248646, 0.03657147, 0.02723903, -0.10135503, -0.2575392) * inp_1_0_1; + result1 += M4(-0.008707382, 0.16884588, -0.06652616, 0.08253744, -0.034825716, 0.034717374, 0.03668941, -0.4708626, -0.18865623, 0.13615835, 0.017796587, 0.2501019, 0.20887725, 0.096245155, -0.08776682, -0.020289192) * inp_1_1_1; + result1 += M4(0.0970189, -0.030351888, -0.00047928322, 0.085058145, 
0.027607283, -0.007281266, 0.007417884, 0.019575235, -0.029443549, -0.04141028, -0.039709818, 0.21408917, -0.049271036, -0.05297429, 0.040338963, -1.5085386) * inp_1_2_1; + result1 += M4(-0.119401, 0.03140251, 0.045685366, 0.24838144, -0.043740734, -0.0737762, -0.009221195, -0.14987206, 0.16932084, 0.019038102, 0.16664478, 0.16489927, -0.04896412, 0.05431783, -0.06988649, 0.13275269) * inp_1_0_2; + result1 += M4(0.150259, -0.15978405, -0.0844281, -0.06703002, -0.24657513, 0.06366323, -0.069003426, -0.2717428, 0.4409574, -0.037973717, -0.029585278, 0.017423902, 0.09426487, -0.04516054, -0.104453884, 0.21409835) * inp_1_1_2; + result1 += M4(0.009213807, -0.027094958, 0.07477295, 0.020622253, -0.07857662, -0.04560902, -0.024470983, 0.2686737, 0.09560327, -0.022401039, -0.010302134, 0.19773903, 0.03367946, 0.046936627, 0.10942362, -0.04420304) * inp_1_2_2; + result2 += M4(0.06776484, 0.031195775, 0.050318476, -0.052922856, 0.12900554, 0.018970301, -0.036268327, -0.048933093, -0.05853769, 0.0007942279, -0.029834637, 0.0031533486, 0.07673135, -0.094641976, 0.06459924, -0.056525134) * inp_1_0_0; + result2 += M4(-0.11017411, 0.098181106, -0.02243249, 0.012068443, 0.005660485, 0.052767463, -0.035950188, 0.06065624, -0.13324538, 0.026223551, -0.021790896, 0.0048657963, -0.04097028, 0.05637621, 0.027283916, -0.15542829) * inp_1_1_0; + result2 += M4(-0.013024199, 0.015949627, -0.08571484, -0.054483596, 0.033917774, 0.06274524, -0.050583415, 0.06525622, -0.04354908, 0.025803443, -0.011482242, -5.2527274e-05, 0.03598789, 0.09888249, -0.04873406, -0.06561173) * inp_1_2_0; + result2 += M4(-0.018317174, -0.03853359, 0.09234778, 0.087074734, -0.26256627, 0.19705102, -0.016328111, -0.1725605, -0.028978063, -0.18006021, 0.17666177, 0.05648208, -0.088303916, 0.40847126, 0.074141726, -0.13249528) * inp_1_0_1; + result2 += M4(0.06658258, 0.03539948, 0.09751061, -0.08332911, -0.30838192, 0.31569394, 0.03325235, -0.52049816, 0.4147554, -0.06113487, 0.10763208, 0.48811552, 0.2149239, 
-0.02266595, -0.064685725, -0.12511243) * inp_1_1_1; + result2 += M4(-0.095920496, 0.0039743925, -0.025515337, 0.07142987, -0.08141908, -0.024632594, 0.0048594745, 0.06391914, -0.02217199, 0.13312626, -0.09880823, 0.02288019, 0.022563223, 0.0145039195, 0.013533599, 0.15826075) * inp_1_2_1; + result2 += M4(0.010565236, 0.0057190843, 0.006396659, -0.038720515, -0.2800984, 0.18256105, -0.0718135, -0.12158327, 0.015065574, -0.124020405, 0.013299919, -0.1870773, 0.104143724, -0.0570007, 0.015877953, -0.06448135) * inp_1_0_2; + result2 += M4(0.10921295, -0.09829529, -0.13485469, 0.03348664, -0.25693277, 0.12156001, 0.052303057, -0.18438673, 0.03092165, 0.029485954, -0.0062324405, 0.08378771, -0.06272121, -0.22547439, -0.016985578, -0.28853402) * inp_1_1_2; + result2 += M4(0.08607484, 0.041633364, -0.0058278185, 0.06025964, 0.0077968123, 0.016047232, -0.010274299, -0.008913052, -0.026840642, 0.090148285, -0.023221692, 0.13393198, 0.049763493, 0.060152527, 0.041689675, -0.017965268) * inp_1_2_2; + result3 += M4(0.008406257, -0.070935205, -0.007202847, 0.06941878, -0.05537707, -0.18120946, -0.03022563, 0.16825119, 0.010797398, -0.12705854, -0.0070367176, 0.0055851717, -0.03206117, 0.2384432, 0.05903697, 0.013868561) * inp_1_0_0; + result3 += M4(0.02166264, 0.046648763, 0.021499218, 0.065290526, 0.01560753, -0.17776456, -0.025728986, 0.1073188, 0.0889913, -0.011712805, 0.051837422, -0.10854497, 0.08656417, 0.012107013, -0.0058191423, 0.06694211) * inp_1_1_0; + result3 += M4(-0.030368745, 0.15441988, -0.047315974, -0.0033873403, 0.0558242, 0.05901615, -0.04364993, 0.18534467, -0.00180104, -0.11714469, -0.021285538, -0.14386547, -0.012022105, -0.06351964, -0.020860594, -0.030060872) * inp_1_2_0; + result3 += M4(0.03706961, -0.134447, 0.107362546, -0.01044757, -0.014409411, 0.1598686, -0.013746884, -0.09035731, -0.0048773824, -0.1106227, 0.11328745, 0.14612412, -0.019757058, 0.2840584, -0.06905247, 0.044269875) * inp_1_0_1; + result3 += M4(0.00435332, 0.22003464, 0.054780096, 
0.02049974, 0.08106458, -0.23199026, 0.13086085, -0.33637485, 0.042000774, -0.148645, 0.049710836, 0.11972893, 0.12264688, 0.24849172, 0.1564239, 0.13550651) * inp_1_1_1; + result3 += M4(0.07536812, 0.10604653, -0.036423583, -0.26073584, 0.0397844, -0.045089003, -0.019320367, 0.19621585, 0.10164428, -0.009166188, -0.07304803, -0.015371115, 0.04261303, 0.11308855, -0.032034043, -0.20426352) * inp_1_2_1; + result3 += M4(-0.015813572, 0.0056332136, -0.012351634, 0.08331286, -0.007511319, -0.6502108, -0.04515211, -0.09339431, 0.027167298, 0.23520617, -0.00018588088, 0.040712796, 0.057343673, 0.114973925, 0.02719836, 0.021863716) * inp_1_0_2; + result3 += M4(0.037174106, 0.12065753, -0.07257851, 0.090148546, -0.058854315, 0.026826117, 0.030978559, -0.013551632, 0.049525514, 0.13865441, 0.016414402, 0.061311614, -0.014844421, 0.085599475, -0.05553838, -0.011335998) * inp_1_1_2; + result3 += M4(-0.024182256, -0.03277256, -0.023684012, -0.06914193, 0.03953002, 0.00093374, -0.03862413, -0.0043832413, 0.086972594, 0.017723167, -0.02329716, 0.0585194, -0.028904395, -0.030326229, 0.037591804, -0.06744188) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.032315515, -0.122047596, 0.059832327, -0.03277833, 0.020007847, 0.13211598, -0.097809285, 0.122699976, 0.13954099, 0.071660824, 0.13365898, 0.035498723, -0.32890487, -0.23000252, 0.18859388, 0.2246585) * inp_2_0_0; + result0 += M4(-0.09090872, -0.15547122, 0.14182991, -0.03447231, 
-0.08700012, -0.14764556, 0.06351315, -0.031944465, -0.24570633, -0.10371965, -0.6612911, -0.010604841, 0.30677596, -0.122792654, -0.3476362, -0.3333027) * inp_2_1_0; + result0 += M4(-0.101048835, -0.28088036, 0.064946696, -0.02987513, -0.053139113, -0.0017336245, 0.021613726, -0.09509941, -0.24492142, -0.027400596, -0.03304482, -0.2676795, -0.17882577, -0.0015913589, 0.07456976, -0.10931344) * inp_2_2_0; + result0 += M4(0.018682102, 0.03897567, -0.0043925717, -0.12452545, -0.2039322, 0.07347261, -0.077316, 0.11665575, 0.12262391, 0.012757696, -0.033062913, -0.04495245, 0.006626678, 0.18125992, 0.040581536, 0.019702636) * inp_2_0_1; + result0 += M4(-0.059305314, 0.078166485, -0.19206336, 0.107413165, -0.35976288, 0.20749648, -0.10897632, 0.048565254, -0.28695294, 0.13703996, -0.3667627, 0.13787156, 0.011949593, -0.08204921, -0.20876266, -0.036897074) * inp_2_1_1; + result0 += M4(-0.0057640765, -0.25577998, -0.27986136, -0.1747803, 0.07495716, 0.16943099, 0.084771186, -0.1751805, 0.048841394, 0.06562859, 0.021907087, -0.24557696, 0.24831182, -0.1436971, 0.56543666, 0.032267977) * inp_2_2_1; + result0 += M4(0.067160636, -0.010749014, -0.15154673, -0.022950703, 0.11410057, 0.045740303, 0.23280439, 0.10311792, 0.10404408, -0.038766913, 0.101108626, 0.014880373, -0.08169517, 0.03724728, -0.004071181, -0.02176287) * inp_2_0_2; + result0 += M4(-0.1724258, 0.043157067, 0.023351375, -0.10025255, -0.17951916, 0.047159195, 0.022547374, -0.098868735, 0.07145314, -0.0070737815, 0.035666347, -0.011632881, -0.098744564, 0.014386245, 0.15310442, 0.1590473) * inp_2_1_2; + result0 += M4(0.03659194, 0.048870873, -0.06802044, -0.06394387, -0.09571226, -0.04181391, -0.02092777, -0.08023691, 0.0043218927, -0.07452731, 0.02718202, -0.032503504, 0.066612795, 0.25409463, -0.29573214, -0.100742854) * inp_2_2_2; + result1 += M4(-0.06804398, 0.010259403, -0.05606417, -0.45905623, 0.03798285, -0.011380956, -0.0043548928, 0.0049317023, 0.064162396, -0.16467147, -0.13547602, -0.4170852, 
-0.0946343, 0.12367309, 0.0036930486, 0.2594846) * inp_2_0_0; + result1 += M4(0.08167365, 0.0076501844, -0.040654324, 0.076445766, 0.061445758, -0.07112302, 0.020587264, -0.094360456, 0.14121495, 0.039353162, 0.07584208, -0.24924478, 0.13394992, -0.15720025, 0.020550527, -0.4719891) * inp_2_1_0; + result1 += M4(0.24099086, 0.004460851, 0.033801142, 0.028916445, 0.009813314, 0.02370655, 0.019507933, 0.0723726, 0.11482338, -0.0041218535, 0.0060363747, 0.18329585, -0.03605137, -0.016704429, -0.03968744, 0.49401382) * inp_2_2_0; + result1 += M4(-0.03777468, 0.07079181, -0.086785324, -0.19576482, 0.016638516, 0.06932382, 0.02143979, -0.18267234, -0.25579676, -0.11076712, -0.2595194, 0.11735666, -0.086780265, -0.04006134, 0.049523488, -0.3053417) * inp_2_0_1; + result1 += M4(-0.19085847, -0.0018226462, -0.09526131, -0.030490309, -0.09358571, -0.1312608, -0.025299216, -0.4467069, -0.40401617, -0.11442126, -0.02932193, -0.55489945, -0.06258919, 0.17412789, -0.13525261, 0.36862898) * inp_2_1_1; + result1 += M4(-0.1783346, 0.020232402, 0.062352747, -0.2333071, 0.20440717, 0.036881648, 0.011426944, -0.161388, -0.091673456, -0.07425262, -0.007313462, 0.18958011, -0.05012611, 0.14050211, 0.023201272, -0.18373603) * inp_2_2_1; + result1 += M4(-0.041670453, 0.04761505, -0.07205055, -0.16726835, 0.16217317, 0.031830892, -0.045013987, -0.13016471, 0.038423758, 0.018830528, -0.1379043, 0.07583382, -0.08549732, 0.020179233, -0.05180274, -0.08676527) * inp_2_0_2; + result1 += M4(-0.1144892, -0.065310515, -0.07988956, -0.28776947, -0.022516059, -0.10576069, -0.09915789, -0.029305372, -0.018182946, 0.051951002, -0.031691708, 0.109498486, -0.010285694, -0.058526095, -0.015336989, 0.28561556) * inp_2_1_2; + result1 += M4(-0.114991814, -0.0060320315, 0.032515556, -0.088495135, 0.0023830642, -0.015636275, 0.10081914, -0.18555105, 0.0049523246, -0.01522886, 0.031541333, 0.14967763, -0.13520668, -0.00976766, 0.07235242, -0.13526863) * inp_2_2_2; + result2 += M4(-0.006102216, -0.029172745, 
0.09222103, -0.028744753, 0.036760766, 0.02058598, -0.051013798, 0.07528594, -0.19947468, 0.2854517, -0.22350396, 0.07103823, 0.15858191, -0.16111182, 0.10137347, 0.0031016655) * inp_2_0_0; + result2 += M4(-0.051077593, 0.018110406, -0.085154414, -0.11970748, -0.06248552, 0.090771616, -0.11020889, 0.016226625, -0.30493045, 0.34879982, -0.08281113, -0.2973166, -0.08395863, 0.14489202, 0.10018392, 0.2918778) * inp_2_1_0; + result2 += M4(0.100762405, -0.14077328, 0.0068873675, -0.012728327, 0.038007546, -0.010162205, 0.016245509, -0.045379486, -0.015239795, 0.044774063, -0.0041919495, -0.039544307, 0.10751771, -0.19274761, -0.13351429, -0.21966757) * inp_2_2_0; + result2 += M4(0.0014801857, 0.090907656, 0.09321273, 0.19191459, 0.11852471, 0.024387602, 0.13766855, 0.058077153, 0.13642266, 0.10572148, 0.03806547, 0.115434796, -0.13728566, 0.015369699, -0.029896675, 0.1222438) * inp_2_0_1; + result2 += M4(-0.23657471, 0.01041624, -0.104025744, -0.08028565, -0.27475524, 0.014432225, -0.190358, -0.1933413, 0.06009237, 0.35213372, -0.18603286, 0.15629223, -0.075596966, -0.045948125, -0.069723725, -0.2296189) * inp_2_1_1; + result2 += M4(-0.114092045, -0.21760537, 0.06743137, -0.16528656, 0.038565528, -0.047547337, 0.016258612, 0.04621514, 0.06486923, 0.21303502, -0.056794677, 0.07416883, -0.27225333, -0.106772475, 0.116170004, 0.03875536) * inp_2_2_1; + result2 += M4(-0.12807086, -0.050668288, 0.004014784, -0.12517461, 0.05560518, -0.031908523, 0.02181089, 0.054382585, -0.031665996, 0.052780844, 0.0075956094, -0.05371376, 0.0088007385, 0.05524695, 0.049430843, 0.08108161) * inp_2_0_2; + result2 += M4(0.051009595, -0.1502449, -0.045252007, 0.06836838, 0.14730917, 0.036979046, -0.083785385, 0.06063368, -0.028182903, 0.07504901, 0.055856213, 0.04504785, 0.18590024, -0.045080796, -0.036583446, 0.012569273) * inp_2_1_2; + result2 += M4(0.09400213, -0.09781128, -0.028674224, -0.04409969, 0.03257724, -0.060171966, 0.018233486, 0.059538074, -0.05567502, 0.027766956, -0.004594858, 
0.013047014, 0.118355066, 0.10237973, 0.017876882, -0.0016306012) * inp_2_2_2; + result3 += M4(-0.060102426, 0.055194635, -0.0050862706, 0.031027785, 0.015334437, 0.05874696, -0.014036861, -0.09948192, -0.022876646, 0.25203875, -0.16902465, -0.1250054, 0.028966324, 0.19289416, 0.06767192, -0.027996095) * inp_2_0_0; + result3 += M4(-0.073572166, -0.2641532, 0.0045350282, -0.0032056102, -0.018192617, -0.053080373, -0.077567, -0.120395035, 0.05026236, -0.2493179, -0.047281366, -0.4302733, -0.04435675, -0.08884186, -0.081195176, 0.05236053) * inp_2_1_0; + result3 += M4(0.15846111, 0.033074684, -0.002145444, 0.25345713, -0.016138427, 0.060776513, 0.020433042, 0.054068796, 0.07300529, 0.1499025, 0.01061005, 0.26232153, -0.086272724, 0.19294065, 0.07322928, -0.13114798) * inp_2_2_0; + result3 += M4(-0.026156582, -0.09473598, 0.01886588, 0.03316904, 0.046567984, 0.05356517, 0.112859644, 0.045939382, -0.014500696, 0.39915556, -0.044323806, 0.08406331, -0.02588856, 0.28643692, -0.054337215, -0.044069048) * inp_2_0_1; + result3 += M4(0.119249105, -0.06426904, 0.049732402, -0.24069054, 0.053948652, 0.18656449, -0.13553333, -0.09931661, 0.05298581, 0.06414778, -0.01429046, 0.0886309, -0.0169578, 0.19047803, 0.18266238, 0.0035147448) * inp_2_1_1; + result3 += M4(-0.0056939553, -0.21608217, 0.02736181, -0.036639106, 0.0103363665, 0.029477157, 0.016544899, -0.067491375, 0.07800084, -0.12613757, -0.0043560416, 0.0653098, 0.03597968, 0.0737496, -0.108304635, -0.15834598) * inp_2_2_1; + result3 += M4(-0.024152312, -0.03797177, 0.024080073, -0.0372, 0.025841238, 0.1450337, 0.003514035, 0.01807124, -0.014084937, 0.20126233, -0.07188575, 0.009998302, 0.014528717, -0.0146696335, 0.06857181, 0.032898333) * inp_2_0_2; + result3 += M4(-0.0058606123, -0.18987623, 0.0017278753, 0.010762768, -0.06410252, 0.05551138, -0.044577245, -0.07427778, 0.013683679, 0.17193417, 0.08636119, 0.052021578, -0.04665759, 0.009889614, -0.13780324, -0.06077317) * inp_2_1_2; + result3 += M4(-0.024604267, 
0.0576184, -0.0052168164, -0.013863482, 0.0020399143, 0.14541508, 0.021378214, 0.034496024, 0.042570945, 0.10022286, -0.02205846, 0.14285377, 0.033961337, 0.20753984, 0.07047152, -0.2780571) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.027015617, -0.7996558, 0.18498614, 0.104103, 0.38189876, -0.11344139, -0.0007145073, 0.3342583, 0.031134395, 0.089367434, 0.037405856, 0.015087987, -0.14192465, -0.22596288, 0.029936088, 0.0421774) * inp_3_0_0; + result0 += M4(0.18507116, -0.13057783, 0.18906131, -0.04625072, 0.4304938, 0.20377009, 0.15997867, -0.01429329, 0.038801454, 0.08704504, 0.21694064, -0.11549993, -0.0045122113, -0.3900684, -3.388382e-05, 0.15001586) * inp_3_1_0; + result0 += M4(0.060679402, -0.16186985, 0.061862193, -0.00022022054, 0.26157132, -0.043998968, 0.1945971, -0.7142528, 0.09871455, 0.022045933, -0.024860913, 0.004302735, 0.14181943, -0.18637265, -0.00040650467, 0.11827929) * inp_3_2_0; + result0 += M4(-0.5922311, 0.22684027, -0.11227259, -0.21391045, 0.032060653, -0.053092804, 0.31259525, -0.07501715, -0.10745047, -0.0038042206, -0.10862252, -0.004506264, 0.20306757, 0.25435647, 0.16563417, -0.17325446) * inp_3_0_1; + result0 += M4(-0.35888693, 0.16700989, 0.1668772, 0.17332852, -0.05505689, -0.11818606, -0.06606742, 0.110823445, 0.03806446, -0.113237, -0.31512976, 0.095162764, -0.46377453, -0.0036337571, -0.16946682, 0.1773919) * inp_3_1_1; + result0 += M4(-0.12228825, -0.039548386, 0.011141476, 
-0.1074657, 0.019009113, 0.08645584, 0.2815848, -0.06357786, 0.015157962, 0.09658943, 0.053875048, -0.033454716, -0.0061273533, 0.062192447, 0.07787697, 6.049956e-05) * inp_3_2_1; + result0 += M4(-0.15141164, -0.5041164, -0.9490496, 0.19432089, 0.02835402, -0.04002404, 0.08439427, -0.010552297, -0.07459201, 0.021660993, 0.032625314, 0.010420403, -0.07382987, -0.07785111, -0.10839164, -0.052428048) * inp_3_0_2; + result0 += M4(0.05921418, -0.13308622, -0.37330568, 0.17807813, 0.07824402, 0.03588622, -0.12656505, 0.09064255, -0.06055568, -0.024535418, -0.043053485, 0.00056338724, 0.06676607, -0.27000788, -0.29120812, 0.11573923) * inp_3_1_2; + result0 += M4(-0.028129566, 0.14413905, -0.16586044, 0.017026152, 0.076706395, -0.05394849, 0.09306623, 0.019118821, 0.007054275, 0.08550639, 0.13275635, -0.025670476, -0.0022794658, 0.10155379, -0.02085458, 0.034746658) * inp_3_2_2; + result1 += M4(-0.12369097, -0.022380395, -0.19092223, -1.0336181, 0.25007322, -0.1082927, -0.1355875, -2.3267636, -0.060449358, 0.047252428, -0.01162158, -0.005936594, 0.11749812, -0.09796796, 0.028199805, 0.1737005) * inp_3_0_0; + result1 += M4(0.21402386, 0.013675318, -0.030755024, -0.0027503022, -0.2956065, -0.10900944, -0.47659904, -1.3750017, -0.22972079, 0.06601595, 0.013311301, 0.12648493, 0.24865986, -0.0054492513, 0.015514159, -0.035419848) * inp_3_1_0; + result1 += M4(0.04552766, 0.037142105, 0.0035919624, 0.08431789, -0.3844037, -0.28543824, -0.23054305, -0.94371766, -0.06714347, 0.07686601, -0.0064314655, 0.087116875, 0.05579566, -0.070394486, 0.0021310588, 0.045538615) * inp_3_2_0; + result1 += M4(-0.37080222, -0.18180142, -0.24774034, -1.7342087, -0.06769111, 0.043335035, 0.35196152, -0.0039335964, 0.044669848, -0.03951889, -0.025922338, -0.048581965, -0.10638707, -0.15603809, 0.017693024, -0.15826935) * inp_3_0_1; + result1 += M4(-0.15859805, 0.099043906, -0.051725943, -0.2880917, -0.18174146, 0.0665793, 0.54645437, -0.033481486, 0.40742868, -0.3033671, 0.122001864, -0.08608495, 
-0.2042584, 0.05535326, 0.12946245, -0.4357408) * inp_3_1_1; + result1 += M4(0.12178875, 0.025560115, 0.028441695, -0.22325999, 0.061120175, -0.025200972, 0.14321159, 0.19563259, -0.022041185, 0.04249189, -0.07945956, 0.11619728, -0.0501297, -0.054087505, -0.011183701, 0.1266374) * inp_3_2_1; + result1 += M4(-0.6316759, -0.0918079, -0.3422181, -0.2808048, 0.03502315, -0.07254006, 0.021251619, 0.1637716, 0.0266244, 0.014856987, -0.073231086, -0.057996526, -0.07746048, 0.007990325, -0.021293677, 0.14186025) * inp_3_0_2; + result1 += M4(-0.10816348, -0.19827484, -0.03404185, 0.17547783, 0.071025066, -0.013042217, 0.043203786, 0.06272457, -0.22442414, 0.1362349, 0.14682624, -0.030669976, -0.3585226, 0.027426068, 0.15036522, -0.1341319) * inp_3_1_2; + result1 += M4(-0.14291224, -0.049865674, 0.025149126, -0.1153935, 0.057290137, -0.05218865, -0.0013165397, 0.027519017, 0.134451, -0.0015477352, -0.062499885, 0.0006934406, -0.030470002, 0.010570013, -0.013825029, -0.04198862) * inp_3_2_2; + result2 += M4(-0.10711042, 0.032619312, -0.024730971, -0.06444852, 0.4182004, 0.54544973, -0.239182, -1.0138891, 0.027894305, -0.08686301, 0.077421546, -0.046399735, 0.063517295, 0.01817226, -0.09217656, 0.04170022) * inp_3_0_0; + result2 += M4(0.22543283, -0.109545745, 0.025299635, -0.025161963, 0.7423745, -0.216506, 0.0028229007, -0.73982394, -0.008515469, -0.061802708, 0.32045597, -0.08967708, 0.054728646, 0.01958016, -0.10577295, 0.19468236) * inp_3_1_0; + result2 += M4(0.05417426, -0.06550254, 0.008215511, 0.08211287, 0.49578804, 0.02951148, -0.051892225, -0.23949671, 0.07806937, -0.035536528, 0.13598205, 0.08785305, 0.079127, 0.070848905, -0.03802217, 0.051596798) * inp_3_2_0; + result2 += M4(-0.48896796, 0.68660605, -0.16183376, -0.86002463, 0.033824537, -0.08554051, 0.003849123, -0.08059784, -0.029788414, 0.08485035, 0.03887551, -0.05369966, -0.13131899, 0.22066273, -0.10666296, 0.05315469) * inp_3_0_1; + result2 += M4(-0.167758, 0.29998848, -0.034977388, -0.09690403, 
0.13826017, 0.24243373, 0.100414276, 0.17001465, -0.2882979, -0.3450798, 0.18749917, -0.13422024, -0.17123859, 0.09044185, 0.052391898, -0.36916175) * inp_3_1_1; + result2 += M4(-0.16430867, 0.0064501395, 0.06647598, -0.023820901, 0.08984767, 0.013764179, -0.035873856, 0.032932702, 0.09450842, 0.071256734, -0.040001966, -0.04960062, -0.007343706, 0.049707595, -0.016152225, -0.0027885356) * inp_3_2_1; + result2 += M4(-0.73847115, 0.5513414, 0.030851787, -0.2581955, -0.0024027135, -0.0036326675, -0.030248651, -0.004381591, -0.02528615, -0.019515892, 0.029741172, -0.003951281, -0.019615853, -0.03865882, 0.003828569, -0.0031004255) * inp_3_0_2; + result2 += M4(-0.17671159, -0.081465006, -0.07955902, -0.04966974, -0.06376834, -0.023979286, -0.015434015, -0.041929364, 0.120791264, 0.036787927, 0.04004447, 0.09695027, -0.08316816, 0.09391913, 0.049567543, 0.027576985) * inp_3_1_2; + result2 += M4(0.10369331, -0.024534395, -0.052448582, -0.09192535, 0.027912363, 0.09893594, 0.028118687, 0.06701703, 0.014928166, 0.017885402, -0.03428379, -0.025608117, 0.031982064, 0.003519881, -0.0178403, -0.009937768) * inp_3_2_2; + result3 += M4(-0.027271697, 0.42789787, -0.049469214, 0.022823947, -0.17875957, -0.9508793, -0.059357125, 0.17309445, -0.008523562, 0.106697135, 0.06968476, 0.011999886, -0.052791767, 0.063847676, -0.10121569, 0.035633165) * inp_3_0_0; + result3 += M4(0.14716758, -0.07930711, -0.017321438, 0.13599691, 0.07637399, 0.04328131, -0.07516573, 0.43305922, -0.08643355, -0.04845797, 0.016906133, 0.030227428, -0.0071497494, -0.11972896, -0.05875496, 0.10012184) * inp_3_1_0; + result3 += M4(-0.04849445, 0.020217191, -0.046229035, 0.18088053, -0.22129643, -0.12000977, -0.12619595, 0.1956666, -0.008121098, -0.14342684, 0.10044852, 0.1925586, -0.013161276, 0.0966338, -0.056078617, 0.09678964) * inp_3_2_0; + result3 += M4(0.08718787, -0.40120795, 0.14511861, -0.74981576, 0.08892279, -0.25088233, 0.1971236, -0.008586428, -0.036342554, -0.003950924, -0.10522428, -0.008721086, 
-0.051654376, 0.15270655, -0.11333946, -0.1062836) * inp_3_0_1; + result3 += M4(0.3832336, -0.069977686, -0.014638319, 0.22976342, 0.4424893, -0.68896824, 0.50525415, 0.1229973, 0.2716183, 0.22153828, 0.42152727, -0.04672893, -0.050966874, -0.5484808, 0.05782651, -0.0730039) * inp_3_1_1; + result3 += M4(0.064079545, 0.11863564, 0.11544964, -0.19748935, 0.32926935, -0.8571917, -0.07095916, 0.053836744, -0.12118399, -0.16282205, -0.03557967, 0.015947886, 0.028216584, 0.09699497, -0.0085840095, -0.0819769) * inp_3_2_1; + result3 += M4(-0.07120117, -0.63295966, 0.043656614, -0.45833355, 0.024976943, 0.16151588, -0.07555022, -0.009623016, 0.010849734, -0.1750549, -0.021309523, -0.009259946, 7.156295e-06, 0.15191126, -0.018279374, -0.04998776) * inp_3_0_2; + result3 += M4(0.17812641, 0.07574793, -0.13986841, -0.04758223, 0.039438676, -0.04838939, 0.05826339, 0.058625273, 0.010918394, -0.008298822, 0.13868612, -0.011732604, -0.024179596, 0.02025137, 0.0014702389, -0.072934866) * inp_3_1_2; + result3 += M4(-0.044331793, -0.021380348, -0.065975286, -0.00053424994, -0.010777215, 0.062775485, -0.026242074, -0.017773766, -0.034250915, 0.114954434, -0.020100623, 0.04363309, -0.029236004, -0.14147997, 0.0040791784, -0.043546647) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-4-ReLU) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_3 +//!SAVE conv2d_4 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define 
V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { /* Pass entry point: accumulates a 3x3 window over four shared-memory planes built from conv2d_3 and writes one 2x2 block of out_image texels per invocation. */ + const uvec2 local_xy = gl_LocalInvocationID.xy; /* this invocation's position inside its workgroup */ + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; /* first tile coordinate covered by this workgroup */ + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { /* invocations step by wg_size so that together they fill the whole isize tile (workgroup footprint plus the border needed by the 3x3 window) */ + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); /* top-left texel of the 2x2 source cell for this tile entry; NOTE(review): this can be negative or past the texture edge at image borders, so results there depend on how out-of-range texelFetch behaves - confirm */ + inp[0][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 0), 0)); /* planes 0..3 hold the cell texels at (0,0), (1,0), (0,1), (1,1), each scaled by conv2d_3_mul */ + inp[1][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); /* wait until every invocation of the workgroup has finished filling inp before any of them reads it */ + V4 result0 = V4(-0.006771086, -0.0051601403, 0.020885777, -0.024551088); /* result0..3 accumulate the four output texels; they start from constant vectors (presumably the layer biases - confirm) */ + V4 result1 = V4(0.004770867, 0.0010445794, -0.0035112808, -0.0010415314); + V4 result2 = V4(-0.0118335625, -0.08267318, -0.0066933953, 0.00024997361); + V4 result3 = V4(-3.5229634e-05, 0.01858382, -0.012685065, -0.008151426); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; /* naming: inp_P_X_Y is plane P sampled at window offset (X, Y) from this invocation's tile position */ + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; /* below: every window sample is multiplied by one constant M4 per accumulator and added in */ + result0 += M4(0.0033632028, 0.04721141, 0.03007575, -0.052616846, -0.008006311, 0.065169215, 0.016507383,
-0.0044050934, -0.018410988, 0.07643572, 0.03065518, -0.08753873, 0.015026827, 0.16328007, 0.004729976, -0.014612305) * inp_0_0_0; + result0 += M4(-0.0510358, -0.040047985, -0.15714039, 0.18750839, 0.029424198, 0.063464284, 0.04334012, -0.051018972, 0.044537134, 0.016376844, 0.0021454738, 0.07393311, -0.003398863, -0.07367582, 0.03664616, -0.0471132) * inp_0_1_0; + result0 += M4(0.033857785, -0.044069454, 0.0029815182, 0.07231605, -0.012478533, -0.014247982, -0.011120171, 0.0064618033, -0.024211371, -0.0057577016, 0.009435734, -0.00255496, 0.00047270884, 0.049642805, 0.010110964, -0.023349527) * inp_0_2_0; + result0 += M4(0.024893802, -0.06915593, -0.09700506, 0.109927185, -0.022845587, 0.033251625, -0.0370686, 0.04165276, -0.023201028, -0.09822818, -0.0098308325, 0.03426258, 0.038701996, 0.36037982, 0.030453933, -0.045780078) * inp_0_0_1; + result0 += M4(-0.0022862866, 0.099955656, 0.34152862, -0.3465966, -0.05589964, -0.05136851, -0.068635, 0.09597882, 0.07702414, 0.021747537, 0.12726207, -0.1702579, 0.025863616, -0.06331183, -0.17451076, 0.18619111) * inp_0_1_1; + result0 += M4(-0.010405649, 0.018087514, -0.15909216, 0.14597063, 0.033948172, 0.013681024, -0.00019566377, 0.013083054, -0.0172498, 0.0056358925, -0.00644117, 0.009749327, -0.010631505, 0.021705946, 0.09615771, -0.044029847) * inp_0_2_1; + result0 += M4(-0.024415338, -0.18363151, -0.01793161, 0.023585768, -0.075834185, -0.0050683604, 0.018748691, -0.008734701, -0.011380264, -0.002517223, -0.007086535, 0.0369585, -0.013384224, 0.19569841, 0.02990988, 0.0053327563) * inp_0_0_2; + result0 += M4(-0.040272474, -0.0018999686, -0.036718227, 0.05683352, 0.14068884, -0.059090048, 0.0601508, -0.039334733, -0.14742632, -0.02577353, -0.058017954, 0.057766154, -0.071603104, -0.13627124, -0.042406775, 0.042193558) * inp_0_1_2; + result0 += M4(-0.03953849, -0.012823383, 0.012647818, -0.07757381, -0.06622981, 0.04571122, 0.02738234, -0.013842928, 0.029961985, 0.015561659, -0.015383494, 0.021000577, 0.057185896,
0.037138227, 0.02095205, -0.047683973) * inp_0_2_2; + result1 += M4(0.0057615293, -0.045122698, -0.01178126, -0.0726996, -0.0086135715, 0.065157086, 0.0034225588, 0.07258049, -0.03279438, 0.060885813, -0.00041689439, 0.08573385, -0.029732056, -0.031844694, 0.036845736, -0.10094928) * inp_0_0_0; + result1 += M4(-0.12540935, -0.059108384, 0.003970208, -0.12744214, 0.06369681, 0.028249402, 0.007363609, 0.122652315, 0.0926682, 0.027998177, -0.03176788, -0.16297963, 0.030422911, 0.07676895, -0.0079176305, 0.057718776) * inp_0_1_0; + result1 += M4(0.030936485, 0.031883776, -0.007541764, 0.009011137, -0.0032886202, 0.036986377, 0.0038485127, 0.07384179, 0.015596031, -0.028106213, -0.0056048124, 0.03516302, -0.03694747, -0.029075751, 0.011198101, -0.039395273) * inp_0_2_0; + result1 += M4(0.09053454, 0.016422741, -0.03282414, 0.0018926301, 0.045385055, -0.07430422, -0.022797182, -0.052842602, 0.04633681, 0.12838002, 0.015648523, 0.10493874, -0.11721678, 0.102124445, 0.009502804, -0.036585268) * inp_0_0_1; + result1 += M4(-0.04929572, -0.07120267, 0.11189219, 0.14805685, -0.071155205, 0.0014907664, -0.045666497, -0.2830528, 0.082157016, 0.3569714, -0.08436788, 0.45907578, 0.25751808, 0.007985261, -0.018987287, -0.077328935) * inp_0_1_1; + result1 += M4(0.001983042, 0.0573755, -0.059997357, 0.12338883, 0.0121495845, -0.04396366, 0.008587791, -0.014707099, 0.02200498, 0.08107376, -0.005465822, 0.068521366, -0.023648549, 0.055134445, 0.024040049, 0.012487843) * inp_0_2_1; + result1 += M4(-0.03344048, 0.018812401, -0.099432044, -0.092147544, -0.013474613, 0.12958124, -0.026809819, 0.12613833, -0.006871271, -0.004189431, -0.049348816, 0.01963418, 0.0218454, -0.1742686, 0.094456315, -0.057249658) * inp_0_0_2; + result1 += M4(-0.012384111, -0.17734681, 0.12383786, -0.112375386, 0.0319456, 0.27962422, 0.046854213, 0.398646, -0.034528103, -0.2823273, -0.11815615, 0.04903127, -0.010071655, -0.014617646, -0.20853819, 0.051345073) * inp_0_1_2; + result1 += M4(-0.017807463, 0.085978284,
-0.004161402, 0.018392334, 0.004443354, 0.17043431, 0.0004278643, 0.26888165, -0.009966159, 0.039737593, -0.024603937, -0.06556405, -0.013565388, -0.02318172, 0.03753665, -0.01551806) * inp_0_2_2; + result2 += M4(-0.00054385135, -0.013860364, 0.037204344, 0.0643842, 0.009427588, 0.050591286, 0.015325365, 0.026667146, 0.019358223, 0.060875133, 0.003089811, -0.026155524, 0.054400604, -0.030613834, -0.0073381513, 0.0010448373) * inp_0_0_0; + result2 += M4(-0.11140873, -0.077490225, -0.0008244639, -0.111035444, 0.014723916, -0.111481555, -0.0516383, 0.066743694, 0.042972323, 0.01950517, 0.074459195, 0.050886415, 0.11208063, 0.020193007, -0.03352396, 0.055053547) * inp_0_1_0; + result2 += M4(0.026718343, -0.10349276, -0.10949595, 0.12181208, 0.020611692, 0.07150552, 0.03742183, -0.038923062, 0.021384154, -0.02058103, -0.15753624, 0.012840425, -0.0046102917, -0.09406839, -0.05100171, 0.032406077) * inp_0_2_0; + result2 += M4(-0.074565805, -0.013674222, 0.01627147, -0.09966034, 0.06198092, 0.03641343, -0.032527886, -0.06883835, 0.015009717, -0.026334036, -0.028027749, 0.06361123, 0.20694518, 0.06313499, -0.031564172, 0.05146381) * inp_0_0_1; + result2 += M4(-0.0727687, 0.042550147, -0.04598127, 0.3267873, 0.061976686, 0.04911097, 0.081161864, 0.010707485, 0.2691173, -0.043794725, -0.09971116, -0.0033741079, 0.021865325, 0.043241937, 0.18235348, -0.054897718) * inp_0_1_1; + result2 += M4(-0.00985757, -0.016703412, -0.1516014, 0.11700871, -0.018276513, -0.051278856, -0.24498534, 0.07523947, 0.08632356, -0.020398337, -0.111400016, -0.014939744, -0.04313168, -0.07714612, -0.008079888, 0.020002536) * inp_0_2_1; + result2 += M4(-0.013238882, -0.102667235, 0.0081237415, 0.035577383, -0.03021197, -0.10485464, 0.011287993, 0.078355186, 0.030628305, 0.05074276, -0.017268093, 0.025273146, 0.09983698, -0.018156344, 0.0009785192, -0.012089172) * inp_0_0_2; + result2 += M4(0.011669444, 0.018538315, 0.027060565, 0.092130765, -0.05551045, -0.076386236, -0.062335093, -0.15230888,
0.09960692, -0.013955326, 0.0051692463, 0.086296074, 0.03327316, -0.0583193, -0.05385146, 0.018058175) * inp_0_1_2; + result2 += M4(-0.010289144, -0.040999196, 0.072243415, -0.021734484, 0.031605948, 0.07325174, -0.060475502, -0.012607067, 0.021910584, 0.01122505, 0.054743167, 0.053025585, 0.015383842, -0.042237084, 0.010509368, -0.030073771) * inp_0_2_2; + result3 += M4(-0.09841719, -0.13165414, 0.045820847, -0.007834082, -0.007131807, -0.046782803, 0.02734628, 0.01637415, -0.119316526, 0.1290529, -0.067837425, -0.17189166, 0.0032192334, 0.116386436, -0.02809339, 0.06934349) * inp_0_0_0; + result3 += M4(0.09417788, 0.14279406, -0.061828166, 0.06364808, -0.040369745, 0.07213133, -0.031408317, 8.409518e-05, 0.11984481, -0.06191443, 0.07229216, -0.022234676, 0.005406791, 0.16676822, 0.22716026, 0.024176734) * inp_0_1_0; + result3 += M4(0.05202953, -0.14130098, -0.0026728045, -0.054721516, 0.02505792, 0.06512413, -0.012624254, -0.0026803268, -0.047477644, -0.031517543, -0.032461733, 0.0070039, -0.038684703, 0.12445629, -0.016449094, -0.00015740903) * inp_0_2_0; + result3 += M4(0.1427558, -0.26331204, 0.23879163, 0.1472501, 0.07586082, -0.19956431, 0.11914642, -0.018028205, 0.042948782, -0.18455848, 0.028981531, 0.06794226, -0.04177945, 0.09921873, 0.20470385, 0.11457745) * inp_0_0_1; + result3 += M4(0.4082949, 0.20943645, 0.081940874, 0.12100776, -0.002409686, -0.007796975, -0.039054655, 0.033258572, 0.12229252, 0.027062602, -0.3295776, -0.04143495, -0.06493101, -0.28356364, 0.51172125, -0.03805709) * inp_0_1_1; + result3 += M4(-0.09025853, -0.11847181, -0.15800075, -0.03284227, 0.009739382, -1.3548135e-05, 0.005809967, -0.016361618, -0.007935478, 0.045800693, 0.06297317, -0.014967157, 0.086511806, 0.1897742, -0.066169955, -0.008127524) * inp_0_2_1; + result3 += M4(0.038830314, -0.13548805, 0.10421148, 0.09081409, -0.07634593, -0.060178645, -0.07031697, 0.054025967, 0.020105308, -0.0027928702, 0.031130863, -0.026592439, 0.014720058, 0.19513103, 0.002097078,
0.18665725) * inp_0_0_2; + result3 += M4(-0.08901566, 0.105436236, 0.12266256, -0.008518654, 0.11778259, -0.053422395, 0.028649012, -0.040792372, -0.02262042, -0.10925559, -0.07001872, -0.035234697, -0.07897347, 0.08139603, 0.054484908, 0.019872947) * inp_0_1_2; + result3 += M4(0.030658608, -0.02215864, -0.0070415963, -0.016830377, 0.035668887, -0.068572775, 0.017487563, 0.021502042, -0.0044210944, 0.05756212, -0.020683121, -0.006085243, -0.008396225, 0.021756154, -0.049787946, 0.01207104) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; /* 3x3 window samples from plane 1 */ + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.03791764, 0.03606116, 0.0045328056, 0.002800669, -0.009491753, 0.075630374, 0.04046336, -0.028276388, 0.04324208, 0.524792, -0.09134197, 0.08187007, 0.029704953, 0.08065349, 0.007941393, -0.026542963) * inp_1_0_0; + result0 += M4(0.02040871, -0.12661457, 0.16988854, -0.16411963, -0.08627451, -0.08485256, -0.13350333, 0.16505302, -0.03161001, 0.122473575, 0.29984474, -0.2572558, -0.030814288, 0.050678268, -0.008602223, 0.027681787) * inp_1_1_0; + result0 += M4(-0.006042254, 0.065050334, 0.04664241, -0.037401382, 0.03355854, 0.054504145, 0.047228526, -0.019673886, -0.109151475, -0.0869173, -0.21530285, 0.3827806, 0.020756625, -0.0028767965, 0.00789321, 0.021198263) * inp_1_2_0; + result0 += M4(-0.0031582236, -0.13864206, -0.049212236, 0.035027854, -0.040887404, -0.053039804, -0.06926417, 0.07521589, -0.0047208094, 0.15803817, -0.009107502, 5.1163806e-05, -0.035306234, -0.034462266, 0.032939598,
-0.054286096) * inp_1_0_1; + result0 += M4(-0.05159398, 0.021360615, -0.12616381, 0.07439948, -0.04818794, 0.11798935, -0.24307126, 0.3104743, 0.16276325, 0.14583969, 0.021263607, -0.058796406, 0.12709579, -0.124082625, -0.06194249, 0.08661151) * inp_1_1_1; + result0 += M4(0.09366448, -0.0023552156, -0.114171155, 0.11347451, -0.05757338, -0.03278382, -0.039372697, 0.01685123, 0.12495786, 0.20478605, -0.06560785, 0.15574126, -0.04436519, 0.012480755, 0.084948376, -0.104769275) * inp_1_2_1; + result0 += M4(-0.09293131, -0.06462749, -0.007985044, -0.012933727, -0.04487777, -0.22023484, -0.0037138779, -0.013158153, 0.00241268, 0.30657583, -0.0056309095, -0.011388346, 0.035876844, 0.2619356, -0.0003885763, -0.035041932) * inp_1_0_2; + result0 += M4(0.18430625, 0.035722308, 0.039618477, -0.051990308, 0.15817565, 0.12178207, 0.024091955, -0.005528151, 0.026752066, 0.0029761952, 0.040815126, -0.018809414, -0.12874056, -0.062183477, -0.0050868164, 0.008158902) * inp_1_1_2; + result0 += M4(-0.070743024, -0.014308823, -0.00028148116, -0.010128748, -0.051406384, -0.03582649, 0.004809814, -0.015474758, -0.06934015, -0.019315397, 0.0028014528, -0.010465397, 0.03486373, 0.15004137, -0.0046289526, 0.011293259) * inp_1_2_2; + result1 += M4(0.017685123, 0.0065368274, -0.0015516317, 0.16557714, -0.03033398, 0.025646772, -0.010180449, 0.047718406, 0.11997764, 0.15046796, -0.03974632, 0.026449608, -0.022485612, -0.02235598, -0.0026649777, 0.0047121164) * inp_1_0_0; + result1 += M4(0.3358178, -0.013722061, 0.035134647, 0.14561415, -0.24687243, -0.07977394, -0.006837952, -0.2426016, -0.18184388, 0.14377251, -0.014832799, 0.22288579, 0.017362798, -0.12165396, 0.003879503, -0.117855765) * inp_1_1_0; + result1 += M4(0.04104673, 0.08014578, 0.007094119, 0.13034703, -0.021104911, 0.018781923, 0.021670882, -0.037076604, 0.17533164, 0.06820291, 0.07606097, 0.06600506, 0.029399764, 0.033080503, -0.001904172, 0.052032262) * inp_1_2_0; + result1 += M4(-0.007679661, -0.018380007, -0.016621359,
0.014491733, 0.04202803, 0.04733234, 0.050396703, -0.009298026, -0.008895612, -0.099489, -0.07935202, -0.050699767, -0.08127414, -0.019099122, 0.04923852, -0.06022952) * inp_1_0_1; + result1 += M4(-0.13803823, 0.13586937, -0.28232625, -0.32198295, -0.25998548, -0.0856141, 0.22959727, -0.005808529, -0.12802751, -0.53791004, 0.17587951, -0.4111663, 0.17720166, 0.059367396, 0.012145319, 0.022847874) * inp_1_1_1; + result1 += M4(-0.008384057, 0.07714925, -0.03306005, 0.011172002, -0.0613773, -0.14301087, 0.015359433, 0.008426981, -0.008028197, -0.082278445, -0.10858002, 0.08871151, -0.12919591, 0.028668016, -0.022689562, -0.015607325) * inp_1_2_1; + result1 += M4(0.0020820436, -0.005625805, -0.00054294884, -0.025311854, 0.006265746, 0.0085602505, -0.049143896, -0.024635661, -0.0070366124, 0.016309332, -0.0054611517, 0.07001931, -0.027046647, -0.045871366, 0.074525505, 0.044885844) * inp_1_0_2; + result1 += M4(0.0038440404, 0.3018618, 0.12885766, 0.16752897, 0.0049168784, 0.008830848, 0.25186682, 0.030004857, 0.0025120769, 0.3281529, 0.13829912, 0.24118833, -0.0017494321, -0.16340025, -0.17641474, -0.050659727) * inp_1_1_2; + result1 += M4(-0.0058690743, 0.017535014, 0.026015634, 0.0069791945, 0.009430142, 0.011086416, 0.037033264, 0.058812175, -0.0071097505, 0.056450658, 0.033287015, -0.031129349, 0.018289886, -0.019709148, 0.09328557, 0.03190014) * inp_1_2_2; + result2 += M4(0.06894697, -0.10339465, -0.035631135, 0.022989944, -0.01942999, -0.10801729, 0.0216407, 0.031430345, 0.0035577503, 0.024212655, 0.0071231346, -0.056087773, -0.00088516675, 0.025889328, -0.0022241352, -0.0057471152) * inp_1_0_0; + result2 += M4(0.2759868, -0.027209675, -0.013602369, 0.08910978, -0.14602913, -0.10279265, -0.06586457, -0.26223028, 0.025394203, -0.027354881, -0.06079269, 0.09261669, 0.069493055, -0.0055911513, 0.00068189483, -0.048568405) * inp_1_1_0; + result2 += M4(0.15641908, -0.035849106, 0.23181237, 0.054865167, -0.07924946, -0.04749266, -0.27688533, 0.110440694, 0.30449897,
0.07126261, -0.11757854, -0.0020133695, -0.05560786, 0.055558626, 0.018453365, 0.05488586) * inp_1_2_0; + result2 += M4(0.05669848, -0.00070812786, -0.0056745764, -0.06824219, 0.04319297, -0.06513989, -0.0015118121, -0.081020415, -0.024937613, -0.08211584, 0.008090276, 0.004001641, 0.043160763, -0.008445913, -0.004146166, 0.027650317) * inp_1_0_1; + result2 += M4(0.28002256, -0.08631263, -0.059070054, 0.019348877, 0.24592939, -0.08331847, -0.14509794, 0.22009538, 0.16204305, 0.04204707, -0.039180923, -0.018922726, 0.061964963, -0.05724076, 0.089339934, -0.16005886) * inp_1_1_1; + result2 += M4(0.004549639, -0.09183629, 0.1420763, 0.032508075, 0.10194179, -0.10927332, 0.27485055, -0.018509366, 0.06662383, 0.033839677, 0.08738133, 0.09459715, -0.034808353, 0.0061988346, 0.02458268, 0.012714486) * inp_1_2_1; + result2 += M4(-0.026079418, -0.038056526, 0.002398695, 0.007867446, -0.019024998, -0.087564975, 0.015248439, 0.010014585, -0.013561912, -0.08886625, -0.0134702865, 0.02232676, 0.037407853, 0.053970724, 0.00631281, -0.043232646) * inp_1_0_2; + result2 += M4(-0.0022799855, -0.0369194, 0.016964918, -0.008896998, 0.0009860508, -0.043279737, -0.0263229, 0.003257031, 0.012866944, -0.047402006, 0.0036670251, -0.017854307, 0.0634053, 0.027829783, -0.0018171946, 0.08086287) * inp_1_1_2; + result2 += M4(-0.013369, -0.101083554, -0.07694392, -0.020025238, 0.017319538, 0.023366045, -0.01640813, -0.04008224, -0.03418966, -0.017737657, -0.072516754, -0.07620339, 0.017667681, 0.04104676, -0.11862017, -0.022559365) * inp_1_2_2; + result3 += M4(0.045322407, -0.02171791, -0.061052725, -0.012117548, -0.015696114, -0.07482115, 0.04300487, -0.032141753, 0.0804886, -0.4146384, 0.29769376, -0.05980045, -0.026526874, 0.19134584, -0.1898744, 0.0952924) * inp_1_0_0; + result3 += M4(-0.113841474, -0.19846705, -0.082990475, -0.013619692, 0.18104905, -0.079608805, -0.041662235, 0.0829167, -0.18034573, 0.8529516, -0.46155354, 0.3802709, 0.041667365, -0.11552713, 0.217227, 0.049550664) *
inp_1_1_0; + result3 += M4(-0.0020833479, 0.102125585, 0.008216506, 0.010471269, -0.06279899, 0.077044636, -0.097625405, -0.0039822925, -0.050997138, 0.7753718, 0.38631454, 0.05260894, -0.042959493, 0.009713864, 0.06273459, 0.0045036124) * inp_1_2_0; + result3 += M4(0.0746249, -0.027850332, -0.000757232, -0.11083669, 0.053586207, -0.05182651, 0.08614704, 0.15321635, -0.076562144, -0.17570184, 0.11280837, -0.116007045, -0.040575534, 0.065053694, -0.06028298, -0.13140927) * inp_1_0_1; + result3 += M4(-0.07656796, -0.08148092, -0.16069895, 0.04187618, -0.14711398, -0.24460338, -0.17429228, -0.16669545, 0.13918693, 0.20594399, 0.09800724, 0.18768425, -0.086857975, 0.062444944, 0.16921277, -0.13279808) * inp_1_1_1; + result3 += M4(-0.074363284, -0.19581212, 0.0012813862, -0.0075201634, 0.0020850392, 0.028007274, 0.023813803, -0.030834958, 0.07274119, 0.28911227, 0.095511995, 0.016141748, 0.109687485, 0.12591973, -0.20956549, 0.010454399) * inp_1_2_1; + result3 += M4(-0.03802425, -0.057888344, 0.06638698, 0.021309895, -0.040915377, -0.17378275, 0.049781483, -0.0038457427, -0.01987416, -0.075760044, 0.029176561, 0.053127218, 0.05793729, 0.001864354, 0.011282336, -0.11085149) * inp_1_0_2; + result3 += M4(0.009166591, 0.020393299, -0.013589619, -0.0043293405, 0.022690987, 0.1941181, -0.01498279, 0.018238517, 0.016372807, 0.08158214, -0.038956385, 0.090630956, 0.0064879647, 0.0019467361, 0.061438218, 0.12570952) * inp_1_1_2; + result3 += M4(-0.036306724, -0.022533497, 0.02743402, 0.009214226, -0.012935099, -0.08962785, 0.029733934, -0.0031940192, -0.016709115, 0.05964771, 0.063720234, 0.022471542, 0.012363867, 0.20758559, 0.011010401, 0.037424065) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; /* 3x3 window samples from plane 2 */ + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; +
const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.013779818, 0.21916316, -0.01749961, -0.031653825, 0.019197604, -0.6749215, 0.025190348, 0.009256963, 0.037712105, -0.0427757, -0.0043518688, -0.014002386, 0.0035128384, -0.25496736, 0.005694031, -0.0139859775) * inp_2_0_0; + result0 += M4(0.058478884, -0.035180025, 0.16013937, -0.15942277, -0.03816243, 0.05733203, -0.06691323, -0.016521277, 0.0045641474, -0.083760835, 0.026783314, -0.031845126, 0.028373491, -0.047164347, 0.08748592, -0.18181978) * inp_2_1_0; + result0 += M4(-0.029648367, -0.0064177266, -0.007985839, -0.0039937594, 0.049200006, 0.04194013, -0.012315959, -0.058244944, -0.00062385213, 0.03707708, 0.045191098, -0.033270165, -0.029975431, -0.008462107, -0.043282945, -0.019695746) * inp_2_2_0; + result0 += M4(0.03685474, 0.21790871, 0.016414702, -0.0036660742, -0.02711461, -0.5112229, -0.0076950877, -0.027526189, -0.07460244, 0.1775834, 0.096185096, -0.09191064, 0.06321831, -0.06237055, -0.09763056, 0.07062399) * inp_2_0_1; + result0 += M4(-0.08479572, -0.14922842, -0.1637572, 0.30417043, -0.035105832, -0.24034815, -0.04410996, -0.046823483, 0.0038008555, -0.08467451, 0.31348646, -0.41025126, 0.12546113, 0.18967205, 0.04131372, 0.04792723) * inp_2_1_1; + result0 += M4(0.06739356, 0.013132563, 0.0705947, -0.09722243, -0.07827824, -0.034469802, -0.011826323, -0.055389136, -0.009527839, 0.025252374, 0.24526902, -0.20351002, 0.03863696, -0.0358095, -0.08841542, 0.08530016) * inp_2_2_1; + result0 += M4(0.0024189504, 0.18470794, 0.02421729, -0.026005035, 0.0714845, -0.38582283, -4.2597487e-05, -0.008914323, 0.10920884, 0.29031822, 0.0063368627, -0.009375747, -0.014497603, 0.1282962, -0.022127206, -0.013304615) * inp_2_0_2; + result0 += M4(-0.030173173, -0.103350885, 0.049853764, -0.067631066,
-0.28206545, 0.11199615, -0.030596651, 0.020736802, -0.23197545, -0.08767077, 0.08164665, -0.09930701, 0.39759257, 0.01888446, 0.087139525, -0.11122967) * inp_2_1_2; + result0 += M4(0.044511873, 0.031926055, 0.013973623, -0.026140142, -0.16958922, 0.03009211, -0.018803382, 0.017162027, 0.037430823, 0.026251895, 0.001828609, 0.0070498935, 0.032491688, -0.06525586, -0.042710643, 0.009969354) * inp_2_2_2; + result1 += M4(-0.028666057, 0.102332056, 0.029340958, 0.097780496, -0.050370127, 0.024993198, -0.014046047, 0.06757201, 0.0028525956, 0.009097466, 0.0012397132, 0.020048415, 0.034758266, 0.001306835, 0.021822734, 0.040313948) * inp_2_0_0; + result1 += M4(0.12116667, 0.042435147, -0.011453865, 0.28418344, -0.054431155, -0.041074473, -0.021197021, -0.46425793, 0.024403436, 0.10476772, 0.00850296, 0.17764671, 0.19450468, 0.04881686, -0.017300593, 0.15328363) * inp_2_1_0; + result1 += M4(-0.014537472, -0.04785431, 0.0057213237, 0.08120087, 0.0027244955, 0.036710683, 0.0018011717, -0.11301808, -0.06367366, -0.014481189, -0.009738734, -0.01731468, 0.0046592485, 0.015897358, -0.0037436956, 0.0090299705) * inp_2_2_0; + result1 += M4(-0.0897561, -0.077474676, -0.040233955, 0.11166737, 0.012042107, -0.13035285, 0.0069526, -0.029161317, 0.04087425, -0.05005156, -0.02397979, -0.049189534, 0.08019726, 0.0033636147, -0.0046941456, -0.04718199) * inp_2_0_1; + result1 += M4(-0.019481955, -0.11552646, -0.15306385, 0.11965796, -0.06444712, -0.60503227, -0.03709784, -0.84860533, 0.101685636, 0.041876853, -0.018051691, -0.09969215, -0.117303394, -0.17066102, -0.19214894, -0.06141623) * inp_2_1_1; + result1 += M4(-0.08162457, 0.016572323, 0.009119889, 0.055340182, -0.013891592, -0.30231586, -0.021164672, -0.49435094, -0.051145483, 0.14773344, 0.07521264, 0.06259801, 0.03906362, -0.13338828, -0.030600214, -0.098313935) * inp_2_2_1; + result1 += M4(-0.0056195445, 0.28928724, 0.1379861, 0.0032541384, -0.0068257446, 0.011568706, -0.01583596, -0.026307525, -0.015456645, 0.016127326,
-0.025889514, 0.050082583, -0.0007289241, -0.010907576, -0.12133015, 0.01162384) * inp_2_0_2; + result1 += M4(0.028638389, 0.23542702, 0.121689275, -0.23637827, -0.016180132, -0.67607766, -0.08673431, -0.10939401, -0.010357574, -0.08129334, -0.09344, 0.016316568, 0.025065977, 0.3341326, 0.22300017, 0.09743363) * inp_2_1_2; + result1 += M4(-0.015541606, 0.031042485, 0.051960707, -0.10814859, -0.0031766663, -0.13280825, -0.022083284, -0.06239775, -0.0022412688, -0.11887442, 0.047357682, -0.16150878, 0.010135667, 0.10523319, -0.025714098, 0.03423172) * inp_2_2_2; + result2 += M4(-0.022993447, -0.10126082, -0.008862645, 0.009558404, -0.054707915, -0.111216895, -0.012196099, 0.07278377, 0.0041023744, -0.019806284, -0.002214899, 0.030154316, 0.07870343, -0.013954103, 0.013901531, -0.0071220016) * inp_2_0_0; + result2 += M4(0.05095645, -0.042629406, -0.082931906, 0.09913234, -0.041729834, -0.081676796, 0.0075822813, -0.3088201, 0.028836848, -0.082174934, 0.032421783, -0.0060300524, 0.14015388, -0.06350905, 0.13277183, 0.051554084) * inp_2_1_0; + result2 += M4(-0.021707237, -0.032912396, 0.21629085, 0.014243769, -0.028248513, -0.085443296, -0.3280954, -0.13558732, -0.042475957, -0.04921339, 0.0012851176, 0.032892134, 0.051295515, 0.06387788, 0.021846004, -0.13766341) * inp_2_2_0; + result2 += M4(0.023979997, -0.053251967, -0.0006032927, 0.090948775, -0.03888054, -0.102491334, 0.01808955, -0.040047757, -0.021477126, -0.07267349, -0.012966651, 0.030831197, 0.10165511, -0.06750721, -0.017767964, -0.09202411) * inp_2_0_1; + result2 += M4(-0.046669472, -0.013510663, 0.059922248, 0.23835911, -0.07820152, 0.06794421, 0.035604022, -0.1144176, 0.07068062, -0.04091932, 0.05944978, 0.11380249, 0.09088974, -0.1002041, -0.088322915, -0.030037394) * inp_2_1_1; + result2 += M4(-0.051205207, 0.05612446, 0.07506183, -0.09648897, -0.024628337, -0.016302107, -0.91603076, -0.29067314, -0.04936889, -0.08389894, -0.32963422, -0.07402971, 0.074949786, -0.057981458, 0.5925726, 0.038325448) *
inp_2_2_1; + result2 += M4(-0.045664266, -0.054451637, -0.010032334, 0.034178797, 0.029870953, -0.11087751, -0.008587346, 0.005013674, 0.010290779, -0.10230002, -0.016301338, -0.0010879014, -0.061455965, -0.013092095, -0.0126922345, 0.021366991) * inp_2_0_2; + result2 += M4(-0.20278515, -0.11891043, -0.047657784, -0.16653648, 0.0005207907, -0.10197919, -0.012389828, 0.039248805, -0.027018683, 0.016838243, 0.10375171, -0.13223636, 0.060682498, 0.010384079, 0.05070221, -0.07521598) * inp_2_1_2; + result2 += M4(-0.06732721, -0.09149638, -0.01440614, -0.00046416372, -0.024689594, -0.086670674, 0.0056709866, 0.04906158, -0.011234572, -0.00085715187, 0.041561518, -0.011770444, 0.05219869, -0.005724713, 0.07658236, -0.07809252) * inp_2_2_2; + result3 += M4(-0.043154147, 0.1813734, -0.24296522, -0.18964617, -0.00053656293, 0.073823325, 0.07934629, 0.0077484837, -0.033539794, 0.07983527, -0.04132395, 0.0221986, -0.046767786, -0.2046515, 0.093034185, 0.017791785) * inp_2_0_0; + result3 += M4(-0.07986458, 0.24019942, 0.2890016, 0.05044439, 0.053371403, -0.68155944, -0.21055256, -0.19590291, 0.04625938, -0.09285042, 0.005184423, -0.024542352, -0.1242854, 0.16712302, 0.25536102, -0.06046315) * inp_2_1_0; + result3 += M4(0.110498555, 0.07516408, -0.07876151, 0.01883748, -0.114289135, -0.29517758, -0.14721058, 0.022091808, -0.0359855, 0.08394964, -0.019007629, 0.019101847, 0.019339366, -0.11714168, -0.07094147, 0.00451848) * inp_2_2_0; + result3 += M4(-0.012919992, 0.1369222, -0.2732416, -0.17526399, -0.010347271, -0.01868432, -0.015816586, -0.14344539, 0.018896159, 0.19946118, -0.037967134, -0.10760814, 0.032594014, -0.41689512, 0.058743387, 0.19437246) * inp_2_0_1; + result3 += M4(0.11102623, 0.1572921, 0.23168686, -0.069944575, -0.1813538, -0.6271781, -0.24745354, -0.17729184, -0.33937684, -0.0861067, -0.002288483, 0.055063516, -0.041452993, 0.5463022, 0.028170375, 0.11677861) * inp_2_1_1; + result3 += M4(0.08435565, 0.032648746, -0.055590957, 0.0014671348, 0.11301972,
-0.3885799, 0.011423688, 0.02565552, 0.18209329, 0.074671805, -0.041186612, 0.025571901, -0.14688689, -0.27317134, -0.03077098, 0.0117346905) * inp_2_2_1; + result3 += M4(0.04817234, 0.26817775, -0.10161488, 0.040350743, 0.010257333, 0.031333394, 0.002950192, 0.0534698, -0.012836827, 0.11579518, -0.08975087, -0.032125667, -0.15702203, -0.15051942, -0.015707918, -0.03141244) * inp_2_0_2; + result3 += M4(0.09410685, -0.013702716, 0.17390637, -0.030210355, 0.0147846555, -0.06855739, 0.04796251, 0.009910011, 0.1618562, 0.050896388, -0.0011444244, -0.059056938, 0.08476411, 0.20332877, -0.012074825, -0.0039784717) * inp_2_1_2; + result3 += M4(-0.033710867, 0.13790971, -0.029413365, 0.041634776, -0.030713236, 0.035875082, 0.028113496, 0.0027906392, -0.03885695, 0.12731767, 0.012205976, 0.0035707527, -0.01529997, -0.15364954, 0.04945567, -0.023066707) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; /* 3x3 window samples from plane 3 */ + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.038062073, 0.2141279, 0.06481006, -0.12940322, -0.0027764095, 0.08240676, -0.008070355, -0.011360152, -0.018044285, -0.22364011, -0.016826315, 0.04532728, -0.021932011, 0.17901145, -0.04023682, 0.00414411) * inp_3_0_0; + result0 += M4(0.024813054, 0.053320397, -0.068416364, 0.085439764, 0.019156259, 0.09772809, 0.013872583, 0.003128646, -0.0377687, 0.06855879, -0.023625996, -0.013501507, -0.037352577, -0.12048335, -0.06935224, 0.079339765) * inp_3_1_0; + result0 += M4(-0.0008948348, -0.05550685, 0.007604002, -0.0158738, 0.00076379447,
0.020687131, 0.015978998, 0.02077568, 0.017053058, -0.004057524, -0.12129772, 0.058062665, 0.053945795, 0.1649665, -0.030655291, 0.05742684) * inp_3_2_0; + result0 += M4(0.103066035, -0.7300315, 0.085574366, -0.038748726, -0.052253325, -0.27357453, -0.035952266, 0.055022333, 0.024551407, -0.25668055, 0.0007889168, -0.0007591933, -0.0949221, 0.072160475, 0.016339399, -0.09055286) * inp_3_0_1; + result0 += M4(0.07770222, 0.1035488, 0.11635461, -0.19613256, -0.17844269, -0.10049437, -0.032167118, -0.069166064, 0.22103043, 0.06767758, -0.16874984, 0.17686485, 0.24360006, -0.088182166, 0.06325561, 0.04732989) * inp_3_1_1; + result0 += M4(0.01281408, -0.052539933, -0.036869086, -0.0019218755, 0.033333823, 0.058557454, -0.047289293, 0.0734493, -0.011906149, -0.09344646, -0.1792974, 0.21100967, -0.12567343, 0.08980369, 0.03961268, -0.0020021321) * inp_3_2_1; + result0 += M4(0.23851325, -0.2964688, -0.024860052, 0.0076622204, 0.08764992, 0.050132558, -0.0065116147, -0.0029406226, -0.019137815, -0.11900036, 0.011086529, -0.0067911097, -0.28993663, 0.076079234, -0.011847647, -0.100516155) * inp_3_0_2; + result0 += M4(0.04419162, 0.10790811, 0.050464034, -0.052768122, -0.13191228, 0.01942084, 0.02409991, 0.013205228, -0.215829, 0.010005103, -0.061933685, 0.05324168, -0.4616059, -0.070461564, -0.064849354, 0.11797088) * inp_3_1_2; + result0 += M4(-0.04070436, -0.09416829, -0.04929169, 0.067432515, -0.0864388, 0.01788289, 0.04142661, -0.042931058, 0.03439083, 0.009610911, 0.0030174495, 0.005878064, 0.07801756, 0.08367224, 0.04520196, -0.06358246) * inp_3_2_2; + result1 += M4(0.040575773, 0.009816436, 0.00020496556, -0.027174527, 0.0061966665, -0.010212162, -0.007030445, -0.09197709, -0.014679208, -0.11147172, -0.0038630906, -0.059626117, -0.064454876, -0.18848884, -0.026746308, -0.2612213) * inp_3_0_0; + result1 += M4(0.025270196, -0.008648287, -0.006241156, 0.11304264, 0.002291121, -0.17409967, -0.0030635125, -0.15197915, 0.31160298, -0.18276493, -0.007551214, -0.29215118,
0.032651596, -0.09381023, -0.033310868, -0.30864105) * inp_3_1_0; + result1 += M4(0.029827468, -0.07212181, -0.0059149708, -0.02832478, -0.0036889983, 0.11503275, -0.0133342985, 0.35067505, 0.069052294, 0.021306505, -0.006124511, -0.052335735, -0.051988155, -0.010415701, 0.0292754, -0.16619146) * inp_3_2_0; + result1 += M4(-0.017186752, -0.024710158, -0.054002713, 0.09658648, 0.021105714, 0.09553063, 0.005458199, 0.1535918, -0.052033518, 0.05249869, 0.023075325, 0.0017748644, -0.007927314, 0.21851934, 0.076110005, 0.1549553) * inp_3_0_1; + result1 += M4(-0.24649884, 0.2037065, 0.0050564874, -0.0838121, -0.053290866, 0.24137548, 0.03268435, -0.19582611, 0.2728014, 0.11516617, -0.2776526, 0.29564765, 0.056608714, 0.066695906, 0.039385546, 0.3590516) * inp_3_1_1; + result1 += M4(0.021940233, 0.09766358, -0.0024492894, 0.056543294, -0.042301793, -0.18701898, -0.04649817, -0.39435723, 0.17607027, -0.14804529, -0.13436085, -0.038023666, 0.017116247, 0.12693964, 0.040699497, 0.32045344) * inp_3_2_1; + result1 += M4(0.030560251, 0.033483144, 0.06478091, -0.08260862, -0.0003347912, -0.28518027, -0.014617922, -0.10500096, -0.0015620848, -0.038950246, 0.028218228, -0.03802862, -0.01546767, -0.9264438, -0.008355967, -0.5635481) * inp_3_0_2; + result1 += M4(-0.03922487, -0.115100004, 0.18206236, 0.031616636, 0.010903155, -0.21015875, -0.06844489, 0.08924375, 0.0004909406, -0.19463973, -0.25094545, -0.17086059, 0.022693226, -0.2251329, -0.014191069, -0.22457352) * inp_3_1_2; + result1 += M4(0.005867922, -0.07154546, -0.041601587, -0.0068623656, -0.001936714, 0.11745422, 0.03150495, -0.093714595, 0.029465571, 0.08250033, -0.1579151, -0.028160485, -0.02360907, 0.0055461796, -0.009449481, -0.07122842) * inp_3_2_2; + result2 += M4(0.014997094, -0.073501885, 0.0132263275, 0.12340946, 0.018715253, -0.03774917, -0.030047366, -0.13164493, -0.019094057, -0.019109681, -0.008549362, -0.020587744, -0.014902967, -0.09828911, -0.023465153, -0.07441592) * inp_3_0_0; + result2 +=
M4(-0.0036458373, -0.077869564, 0.046160117, 0.0006182458, -0.04060173, 0.041398875, 0.017186413, 0.2170062, 0.15190022, 0.00671332, 0.007910316, -0.03564122, 0.07395223, 0.043946113, -0.023532797, -0.09109481) * inp_3_1_0; + result2 += M4(-0.009333379, -0.07201044, 0.34406257, -0.008108068, 0.017962933, 0.07170349, -0.13883772, -0.097861245, 0.10507732, -0.017253805, 0.22346519, -0.060781628, -0.042994563, -0.034118805, 0.11651774, 0.068822056) * inp_3_2_0; + result2 += M4(0.107567824, -0.014996469, 0.0468502, -0.03507376, -0.016626038, -0.11044043, 0.012853235, 0.022993937, -0.03965704, -0.013101877, -0.005181674, 0.0720093, -0.04458476, -0.044698216, -0.056906916, -0.15644144) * inp_3_0_1; + result2 += M4(-0.24450101, -0.05021081, 0.28329143, 0.052905396, 0.03132615, 0.024134472, 0.025940863, -0.31099752, -0.15341069, 0.053456385, 0.11059655, -0.22808413, -0.03157951, 0.02424628, 0.17435497, -0.13484989) * inp_3_1_1; + result2 += M4(0.038007554, -0.07408078, -0.31231526, -0.046669047, -0.075324856, 0.009619571, -0.30759802, 0.14287001, 0.049111176, 0.04579521, -0.10265535, 0.047160428, 0.014466494, 0.058858827, -0.40376583, -0.01559601) * inp_3_2_1; + result2 += M4(0.029162662, -0.08115085, 0.0015537582, -0.047456466, -0.025844254, 0.07617664, -0.014251737, 0.024603898, 0.028121594, 0.019586843, 0.0012635064, -0.021388637, -0.043075148, -0.084901094, 0.0054910085, -0.17058848) * inp_3_0_2; + result2 += M4(0.15652397, -0.023679573, 0.10785547, -0.023840956, -0.03806573, -0.041285273, 0.025743026, 0.1401332, -0.11558319, 0.019962313, -0.035437133, 0.12046317, 0.0058546956, 0.021801556, 0.08483396, 0.16000974) * inp_3_1_2; + result2 += M4(-0.01603148, 0.0026883425, 0.10843955, 0.04351186, -0.036719613, -0.109948635, -0.061967216, -0.14250335, -0.05838408, 0.0007986963, -0.14958149, 0.03388766, 0.04054899, 0.081719644, 0.05053678, -0.03529535) * inp_3_2_2; + result3 += M4(-0.085353546, 0.08461731, -0.13915083, -0.036257822, -0.008904922, -0.09930966, 0.13293777,
0.03638514, 0.03201791, 0.1338242, -0.09031037, -0.03228892, 0.034745544, -0.18244584, -0.20624673, -0.08474406) * inp_3_0_0; + result3 += M4(0.07409441, -0.053643093, -0.07329052, -0.029934444, 0.047175847, 0.043111406, -0.20345508, 0.07938889, -0.016340598, -0.38565966, 0.21107996, -0.04949173, 0.11025018, 0.2827765, 0.27820566, 0.03526538) * inp_3_1_0; + result3 += M4(0.030461181, -0.07242497, 0.046613485, 0.01554022, -0.021772174, -0.10526904, 0.121392906, -0.01915928, -0.06995953, -0.08755693, -0.1146613, -0.056353655, -0.030497294, 0.38102558, -0.14643161, 0.013574363) * inp_3_2_0; + result3 += M4(0.02252646, 0.19843449, 0.01796448, -0.114927374, 0.009417218, -0.14562178, 0.009520882, -0.24945049, -0.03411223, 0.019948045, -0.059774544, -0.16049027, -0.160916, 0.2315701, -0.33952394, -0.16819766) * inp_3_0_1; + result3 += M4(-0.120750055, -0.101981714, -0.6174327, 0.04210056, -0.12963599, -0.26512286, -0.15236779, 0.23088011, 0.17519988, -0.18581973, 0.2061288, 0.1486004, 0.15724893, -0.035897397, 0.27736568, 0.06209648) * inp_3_1_1; + result3 += M4(-0.043066334, -0.2650026, 0.13015231, -0.021486249, -0.021243062, 0.12762718, -0.16992107, -0.017701978, -0.1198713, -0.14685233, 0.08095718, 0.016187131, 0.027274022, 0.17814746, -0.1705369, 0.037348423) * inp_3_2_1; + result3 += M4(-0.020911487, 0.012172589, 0.030367784, -0.19994633, 0.004376709, 0.09316046, -0.05491899, -0.12120255, 0.048024613, 0.055273246, -0.004435442, -0.00016166511, -0.22648303, -0.30258325, -0.01430347, -0.21556045) * inp_3_0_2; + result3 += M4(0.07303654, 0.16753973, -0.03591846, -0.018747568, 0.025375472, -0.26433265, 0.12862511, 0.02518775, -0.14287944, -0.17940018, -0.02466985, 0.11916799, -0.242104, -0.108683094, 0.055211473, -0.13809764) * inp_3_1_2; + result3 += M4(-0.026391529, -0.11112396, 0.030737549, -0.011259499, 0.023542786, -0.0055174553, -0.049245745, 0.027468752, 0.057162017, -0.12012449, -0.03709937, -0.0076213237, 0.0522986, 0.131559, 0.044747207, -0.006477326) *
inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); /* each invocation owns one 2x2 block of out_image */ + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); /* result0..3 go to block texels (0,0), (1,0), (0,1), (1,1); max() replaces negative components with zero before the store */ + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result3, V4(0.0))); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-5) +//!COMPUTE 24 32 12 16 +//!HOOK LUMA +//!BIND conv2d_4 +//!SAVE conv2d_5 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.016554128, 0.0026448318, 0.013652129, -0.013316665); + V4 result1 = V4(0.0044759065, 0.006209177, -0.013305955, -0.0016899946); + V4 result2 = V4(0.009802427, 0.011932272, 0.0051619564, 0.0023012678); + V4 result3 =
V4(-0.0024697422, 0.007943644, 0.033936143, -0.01641893); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.08474402, -0.22917373, -0.14206196, -0.010539577, -0.046236325, 0.0013173359, 0.060659897, -0.055962656, 0.08355562, 0.013202813, -0.12521583, 0.08384832, -0.18861641, -0.047398612, 0.15795282, -0.09313713) * inp_0_0_0; + result0 += M4(-0.461722, -0.94063747, -0.22885977, -0.35344717, 0.072716385, 0.059156727, 0.015389428, -0.030055461, -0.038264215, -0.033173826, 0.033325374, -0.025504412, -0.026117543, 0.051860537, 0.028839415, 0.04346096) * inp_0_1_0; + result0 += M4(0.5087371, -0.34765637, -0.6182863, -0.3837225, 0.15503408, 0.10887861, 0.10084102, -0.20092858, -0.06793961, -0.07963712, -0.0017726015, 0.00066041463, 0.001742279, 0.047694772, -0.02344845, 0.02737981) * inp_0_2_0; + result0 += M4(-0.009285821, 0.11000235, -0.031392742, 0.11225282, 0.05141218, 0.12055548, 0.082777604, -0.020320954, -0.06680321, -0.049921807, -0.04921422, -0.03562363, 0.06059489, 0.017469844, -0.09669497, -0.0026134958) * inp_0_0_1; + result0 += M4(0.14124833, 0.19630684, 0.1194282, 0.26702908, 0.18400134, 0.10256528, 0.4572562, 0.15124409, 0.3166469, -0.6715967, 0.014648809, -0.102525435, -0.5180954, 0.66877353, -0.019614657, -0.002470084) * inp_0_1_1; + result0 += M4(0.18672962, -0.017508673, -0.16939771, 0.047094487, -0.060122382, 0.29416057, -0.11709289, 0.025598915, -0.14421585, -0.11846913, 0.03920522, 0.10352751, 0.18691705, 0.1590042, 
0.02073003, -0.11663061) * inp_0_2_1; + result0 += M4(0.0056254803, 0.0057388344, 0.0374958, -0.004648934, -0.043297503, 0.0689816, 0.027923174, -0.03876041, -0.06407546, -0.025186531, 0.16828129, 0.0034699684, 0.031381328, 0.023971673, -0.20254338, -0.02430013) * inp_0_0_2; + result0 += M4(0.15775095, -0.15862629, 0.23583956, 0.049442884, 0.15699472, 0.13332577, -0.2572897, -0.040875558, -0.0002704255, 0.02988306, -0.006920376, 0.03397873, -0.28567457, 0.042112727, -0.3724105, -0.023333224) * inp_0_1_2; + result0 += M4(-0.014858677, 0.032062486, -0.076343395, -0.00083215634, -0.10055656, 0.09093586, 0.17731445, -0.057983246, 0.12641528, 0.04933168, -0.023279864, 0.028127778, -0.26475126, 0.0478974, -0.015684502, -0.039201133) * inp_0_2_2; + result1 += M4(0.392307, 0.03353582, 0.07128573, 0.3369635, -0.051541477, -0.04448266, 0.04055149, -0.021615157, 0.048823766, 0.090479605, -0.0072554573, 0.09644649, -0.053131856, -0.1262546, 0.105549574, -0.06123314) * inp_0_0_0; + result1 += M4(-0.15502161, -0.46141383, -0.09890623, 1.527269, -0.28750673, -0.008933071, -0.15267625, -0.01864867, 0.074853286, -0.028399043, -0.11274298, 0.007967588, 0.031121511, 0.077898726, 0.049051795, 0.053952634) * inp_0_1_0; + result1 += M4(-0.83457303, -0.31433025, 0.7315325, 0.4259749, -0.19004081, -0.067098886, -0.45684782, -0.0074499478, 0.02546783, -0.028332973, -0.045866985, -0.005292344, -0.017153805, 0.010074401, 0.016775275, 0.041146822) * inp_0_2_0; + result1 += M4(0.09953403, -0.0014643228, 0.10400452, 0.0056565623, -0.18444373, 0.04270818, -0.011462894, -0.0616828, 0.03475264, -0.065023266, 0.11439611, -0.0103913285, -0.093443975, -0.04991801, -0.17465092, 0.060669404) * inp_0_0_1; + result1 += M4(0.205716, -0.007968987, -0.21627533, -0.040425707, -0.09754452, 0.018082334, -0.00956709, 0.0848001, 0.43502063, 0.15083931, -0.052782185, -0.07282074, -0.3702116, -0.16925444, 0.0008385632, 0.088931836) * inp_0_1_1; + result1 += M4(0.09588992, -0.20940185, 0.10019888, 0.08854741, 
-0.40017736, -0.10545165, 0.14159274, -0.13410604, -0.01952819, -0.10284345, -0.22501552, 0.039318863, -0.010106364, 0.1133827, 0.22189315, 0.088626176) * inp_0_2_1; + result1 += M4(0.009421535, 0.02838454, 0.029579297, 0.014318628, -0.10293239, -0.018695444, 0.07494177, -0.1269828, 0.013530136, 0.067722216, 0.12684286, -0.022022089, 0.05124597, -0.13029617, -0.14270568, -0.061728578) * inp_0_0_2; + result1 += M4(-0.050228037, 0.06668443, 0.14026366, 0.26039708, -0.13540196, -0.13174525, -0.24864364, -0.22513062, 0.02472696, -0.14155997, -0.08290799, -0.020995213, 0.007919788, -0.03275966, 0.023754396, -0.28459167) * inp_0_1_2; + result1 += M4(0.023433143, -0.012505106, -0.039584465, -0.079250574, -0.06416037, -0.038407087, 0.11237008, -0.1196359, -0.026753819, -0.028015738, 0.0019825825, -0.07621049, 0.095602036, -0.0055057956, -0.12222531, -0.142331) * inp_0_2_2; + result2 += M4(0.21173902, -0.13234012, -0.4541014, 0.061877493, 0.0068946453, 0.022941818, -0.056972146, 0.01937574, 0.011626747, -0.020704554, 0.014839189, 0.020399058, 0.064279646, 0.008993624, -0.119472414, 0.011998723) * inp_0_0_0; + result2 += M4(-0.58199537, 0.36287612, -1.4199176, -0.39885208, -0.22821763, -0.007374069, 0.086480334, -0.016935853, 0.019518664, -0.015480163, -0.08576964, -0.024676455, -0.010108951, 0.037544332, 0.14300823, 0.06268861) * inp_0_1_0; + result2 += M4(-0.50271744, 0.025554385, -0.5727786, -0.17825632, -0.37914005, 0.051398177, 0.15490708, 0.046360016, 0.10120417, 0.02269559, -0.009419459, -0.03541369, -0.07406952, 0.002039037, -0.0006407997, -0.009875078) * inp_0_2_0; + result2 += M4(0.03687174, -0.01882471, 0.03676522, 0.021757437, -0.079064965, -0.037517067, 0.0642965, 0.014232467, 0.08768756, 0.018420901, -0.020334335, -0.0012831561, -0.114168204, -0.01205998, -0.11075036, 0.029242856) * inp_0_0_1; + result2 += M4(-0.047860306, -0.09711567, -0.17504969, -0.15081553, -0.3049216, -0.12750636, 0.02584121, 0.2795914, 0.4429374, -0.13278486, -0.17154583, -0.021857448, 
-0.5705778, 0.24980383, -0.042743698, 0.31541702) * inp_0_1_1; + result2 += M4(-0.19484288, -0.038754307, -0.07002575, 0.0040455586, -0.29587415, -0.044193868, -0.23622102, 0.029706014, 0.013432993, 0.083246335, 0.04279412, -0.08268909, -0.08376078, -0.07014374, -0.07676366, 0.18538836) * inp_0_2_1; + result2 += M4(0.010501982, -0.0005035494, 0.0004140859, 0.011096164, -0.039264694, -0.0066616437, 0.00040288252, -0.05843721, 0.047616445, -0.011402459, 0.082378514, 0.1362359, -0.022662984, -0.057075776, -0.071417384, -0.14695801) * inp_0_0_2; + result2 += M4(0.050130617, 0.113135085, 0.058322534, -0.13720304, -0.14341824, -0.051400222, 0.0505717, -0.15685362, 0.045417894, 0.07490942, -0.0060528195, 0.10542394, -0.12937509, -0.13544343, -0.11515363, -0.15704823) * inp_0_1_2; + result2 += M4(0.027637873, -0.02083409, -0.06730315, 0.015425108, -0.18975328, -0.003320729, 0.17947742, -0.04795124, -0.10879897, 0.005358679, -0.039596763, -0.061216958, 0.10180654, -0.03081845, 0.0511258, 0.14519742) * inp_0_2_2; + result3 += M4(0.014618818, 0.47584814, -0.17367727, 0.07147966, 0.034681022, 0.04903415, -0.02405715, -0.056848254, 0.05098864, -0.010156212, -0.04675307, 0.072642356, -0.036260676, -0.046609793, 0.053831514, 0.052008834) * inp_0_0_0; + result3 += M4(-0.20621313, 0.83789265, -0.13280529, -0.06215082, 0.18894519, 0.21933381, -0.09273566, -0.10503467, 0.14807668, -0.032840773, 0.029420458, -0.021397702, -0.29949743, -0.0031396316, -0.0962584, 0.04149515) * inp_0_1_0; + result3 += M4(-0.1368257, 0.52912736, 0.2355702, -0.123453274, -0.121077135, 0.0942226, 0.038726307, -0.17363513, 0.052847683, 0.07187939, -0.025024164, -0.008812916, -0.0051011033, 0.0018807795, -0.007282722, 0.023519143) * inp_0_2_0; + result3 += M4(-0.025657542, -0.002634332, -0.05383891, 0.14213623, -0.017881516, 0.11927832, 0.045409627, -0.05097621, 0.11048047, -0.29666448, 0.0103217615, 0.021556247, -0.06984235, 0.20101684, -0.007980527, 0.09391604) * inp_0_0_1; + result3 += M4(0.15439488, 
-0.20458573, -0.26687387, -0.054746483, -0.103493385, 0.60655016, -0.005280907, -0.12099173, 0.42942765, 0.13243759, -0.077581435, 0.23282799, -0.452252, -0.14954813, 0.15053895, -0.13070299) * inp_0_1_1; + result3 += M4(-0.1478404, 0.003927139, -0.017289838, 0.14824122, 0.26184613, 0.33273512, -0.0047554015, -0.20846145, 0.11270909, 0.09684709, -0.118098505, 0.20708843, -0.27642372, -0.13249397, 0.17980523, -0.16313562) * inp_0_2_1; + result3 += M4(0.008574112, 0.05413337, 0.01967447, -0.011820304, 0.08030224, 0.09292828, 0.006041947, -0.039917428, 0.15336455, 0.048226394, 0.026484624, 0.010617635, -0.14265074, -0.08177329, -0.074674845, 0.03954346) * inp_0_0_2; + result3 += M4(-0.035967097, -0.051198352, -0.0147744715, -0.006058455, 0.018199014, 0.20261578, 0.02218917, 0.02864353, 0.20123912, -0.20021546, -0.10024832, 0.1425623, -0.01632511, 0.19673872, 0.11388972, -0.09187605) * inp_0_1_2; + result3 += M4(-0.051516704, -0.037184518, -9.7836884e-05, -0.033820845, 0.2095811, 0.2926858, -0.07219224, -0.043460887, 0.055939294, -0.018073456, -0.010785669, 0.07900805, -0.032115173, -0.0025410457, -0.030606363, -0.12241656) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.0073166075, 0.045552894, -0.007951411, -0.023334121, 0.025722718, 0.064874984, -0.10358456, 0.04715832, 0.017686395, -0.041548744, -0.081770375, 0.039507207, 0.06641115, 0.023399614, -0.06840236, -0.0043447604) * inp_1_0_0; + result0 += M4(0.20941794, 
0.09051338, -0.14984657, -0.074408896, -0.18479207, 0.33516723, 0.3928294, 0.14506263, -0.1711134, -0.17116591, 0.13062029, 0.07105616, 0.14903083, 0.049338274, -0.24173051, 0.004623255) * inp_1_1_0; + result0 += M4(0.07846061, 0.10122042, 0.0720976, 0.047867063, 0.14466134, 0.1670706, -0.08569032, -0.065952614, -0.18422887, -0.17921495, -0.14734626, 0.059171673, 0.03520425, -0.07958087, -0.019477837, -0.011459567) * inp_1_2_0; + result0 += M4(0.0014838969, 0.06830755, 0.06123817, 0.021657676, -0.024793208, 0.09558475, -0.031950496, 0.025265368, 0.03680227, -0.038717628, -0.1164916, -0.0011885002, -0.11559365, -0.093189925, -0.08363963, -0.04834404) * inp_1_0_1; + result0 += M4(0.40580162, 0.22511373, 0.0917264, 0.085031815, 0.36542302, 0.070314296, 0.27281147, 0.056904998, 0.3947338, -0.24021517, 0.30139968, -0.07091092, 0.6364601, -0.4326636, -0.09677784, 0.21916817) * inp_1_1_1; + result0 += M4(0.06285387, 0.063603476, 0.01333808, -0.11350428, -0.09640258, -0.01745298, 0.016524717, -0.084454134, -0.044837467, -0.05721756, 0.043622483, 0.046772335, -0.06767603, -0.054249935, 0.05514638, -0.031198056) * inp_1_2_1; + result0 += M4(0.0037593278, 0.058119446, 0.007772395, -0.045545187, -0.02386189, 0.033547785, 0.012052209, -0.014283093, -0.027987773, -0.008577758, 0.026769858, 0.01840433, -0.0116568385, -0.10390512, 0.18343972, -0.05923133) * inp_1_0_2; + result0 += M4(0.15633376, -0.024260672, 0.13842222, 0.09513615, 0.22078265, -0.086084336, 0.11120577, 0.02944383, 0.08267881, 0.040523216, 0.18060447, -0.055403788, -0.049887385, -0.15995465, 0.051882185, 0.027126146) * inp_1_1_2; + result0 += M4(0.08325832, -0.03183006, 0.017627114, 0.0028026348, 0.066393, -0.03619683, 0.08243465, 8.244323e-05, 0.00065900537, -0.042117447, 0.029968508, 0.022710547, 0.032688536, 0.0069056484, -0.10295506, -0.03543248) * inp_1_2_2; + result1 += M4(-0.057469558, 0.0059905495, -0.079491735, -0.03306272, 0.22499478, 0.122497976, -0.19126062, 0.06376063, 0.19904874, 0.107790366, 
-0.025252093, 0.021401089, -0.012737553, 0.05863985, -0.11861096, 0.05267514) * inp_1_0_0; + result1 += M4(-0.048021965, 0.009858718, 0.14495559, -0.15178134, -0.028742641, -0.1255706, -0.23628315, -0.099888876, 0.2575705, 0.158808, -0.14856035, -0.063091286, -0.063021936, -0.008114058, 0.19375907, -0.10753101) * inp_1_1_0; + result1 += M4(-0.11135972, -0.036761303, -0.0040923324, -0.089887746, -0.08558438, 0.1262421, 0.23975913, -0.08594608, 0.1670396, 0.06534481, 0.10865409, -0.103865735, 0.07964133, 0.008221018, 0.04624729, 0.017136093) * inp_1_2_0; + result1 += M4(-0.13777937, 0.076541856, 0.068616554, 0.054874852, 0.00012002991, 0.059381004, 0.0116826305, -0.06327681, 0.06994238, 0.03399867, -0.075316906, 0.07877732, 0.0399726, -0.0532057, 0.13116238, -0.09443346) * inp_1_0_1; + result1 += M4(-0.3907863, -0.08430246, -0.11643456, 0.2000658, 0.045306966, 0.17947012, -0.18730734, 0.055325676, 0.07598895, 0.40362227, 0.3625906, 0.3149084, -0.14925346, 0.33247408, 0.2575065, -0.30229175) * inp_1_1_1; + result1 += M4(-0.11553566, -0.23831218, -0.09813154, -0.06359181, 0.0940421, 0.07896055, 0.16879584, 0.21001212, 0.04249928, 0.12710789, 0.18103158, 0.119974695, -0.073143214, -0.22413246, -0.21876724, 0.1720369) * inp_1_2_1; + result1 += M4(-0.07137546, -0.03094973, 0.003292551, -0.041568562, -0.031684592, -0.016679576, 0.044499274, -0.052121527, 0.0154636195, 0.023929989, 0.0068467464, 0.0066959793, -0.0034232545, 0.07880061, 0.08291338, 0.064238854) * inp_1_0_2; + result1 += M4(-0.014572152, -0.013946868, -0.019180208, 0.11636705, -0.030346757, 0.12613934, 0.03705543, 0.0452622, -0.023375073, 0.08974235, -0.008709684, -0.044204757, -0.18795705, -0.18832888, 0.1379181, 0.13087544) * inp_1_1_2; + result1 += M4(-0.057705898, -0.031566918, 0.0013814529, 0.09302121, 0.008427629, 0.020180352, 0.05593306, 0.1297789, 0.008376333, -0.005297203, 0.021587873, 0.04491888, -0.0134414965, 0.0054050824, -0.057093758, -0.22655176) * inp_1_2_2; + result2 += M4(-0.080743715, 
0.017110262, 0.085858025, -0.049398597, 0.14745821, 0.048592985, 0.12289114, 0.009377926, 0.1671251, -0.11968603, 0.055208463, -0.030808775, -0.052694857, -0.050542895, 0.108538054, -0.03228694) * inp_1_0_0; + result2 += M4(0.115866296, -0.07366202, 0.042411987, 0.08331246, -0.25421214, 0.24341306, 0.010557693, -0.102649584, 0.10870931, -0.12877654, -0.04819396, -0.34243214, 0.11449533, -0.12116078, -0.03230502, -0.02296135) * inp_1_1_0; + result2 += M4(-0.16150624, -0.058298904, 0.069828205, -0.0060394495, -0.05517869, -0.04788711, 0.08831893, -0.047414172, 0.20191658, 0.10358992, -0.0038464211, -0.121002756, 0.031794656, -0.010044565, -0.08703155, 0.015908001) * inp_1_2_0; + result2 += M4(-0.012656746, 0.081062734, 0.093692675, 0.1958319, 0.1272179, -0.012527262, 0.10199331, 0.18368192, 0.043714743, 0.018916927, 0.027921028, -0.11653393, 0.060847517, -0.062236406, -0.019688752, 0.0077735567) * inp_1_0_1; + result2 += M4(0.17710909, -0.07107738, 0.08273162, 0.0046328073, -0.08467732, 0.10024806, 0.047003683, -0.123511486, -0.015360459, 0.102026045, -0.08240464, 0.029658364, 0.4172425, -0.14342386, 0.1480498, -0.18634751) * inp_1_1_1; + result2 += M4(-0.12391618, -0.05871014, 0.040260173, -0.025818344, 0.012931218, -0.04979273, -0.001939683, -0.03158152, 0.056002043, -0.016798038, -0.050334938, 0.03402695, -0.079693966, 0.025994321, 0.020700725, 0.10635983) * inp_1_2_1; + result2 += M4(-0.026964232, -0.022047423, 0.06918982, 0.048541494, -0.038205724, 0.008799015, -0.0026270822, -0.026919778, -0.010267494, 0.013637323, 0.014320703, 0.04809512, 0.026248137, -0.032727137, 0.054396283, 0.028740866) * inp_1_0_2; + result2 += M4(-0.029081121, 0.04486759, 0.09537123, -0.04666429, -0.0030022755, 0.01980827, 0.11681267, 0.10332237, -0.05755216, -0.023530334, 0.10857501, -0.014354214, 0.021850962, 0.10997835, 0.096964404, -0.21275812) * inp_1_1_2; + result2 += M4(-0.021180212, 0.018354837, -0.014735963, -0.06836179, 0.032596614, 0.0017078082, -0.007971494, -0.026358705, 
0.047004454, 0.0073685586, 0.05836899, -0.0055675255, 0.004838257, 0.0485349, -0.048474196, -0.04883732) * inp_1_2_2; + result3 += M4(0.03244459, -0.034479953, -0.0064135827, -0.08737613, -0.089818925, 0.04632484, -0.10045086, 0.008881872, -0.13907796, -0.062879585, -0.012990814, 0.15110466, 0.038008627, 0.04984243, 0.044478714, 0.009779906) * inp_1_0_0; + result3 += M4(0.1842782, -0.008685026, -0.042807627, -0.08820507, -0.50758076, 0.2103546, 0.11072308, 0.06511318, -0.3334045, 0.20163654, -0.029536664, 0.011301137, 0.4022046, -0.04273883, -0.026847176, -0.039757486) * inp_1_1_0; + result3 += M4(0.009022588, -0.023068365, -0.027991936, 0.00427787, -0.32369635, -0.11838789, -0.06324538, -0.16311373, -0.08104427, -0.026818093, -0.101193525, 0.1561913, 0.0131432135, -0.059175897, 0.03514937, 0.025877465) * inp_1_2_0; + result3 += M4(0.20467058, 0.112527, 0.011012977, -0.028550608, -0.08784855, -0.062379327, -0.021806065, -0.011393705, -0.16238952, -0.26693502, 0.06391084, 0.06478358, 0.1172006, -0.24499363, 0.039030664, 0.05566198) * inp_1_0_1; + result3 += M4(0.6883158, -0.3521105, -0.096033536, -0.011642683, -0.68677497, 0.17748499, -0.16916241, 0.038282525, -0.26609233, -0.10134399, 0.25453985, 0.06322925, 0.80599284, -0.20447275, 0.096553475, -0.02597967) * inp_1_1_1; + result3 += M4(0.38438025, 0.14472944, 0.086811066, -0.13257246, 0.028960865, 0.0317766, 0.045688264, -0.23838268, -0.12198645, -0.036164884, -0.041628513, -0.010525341, 0.2980953, 0.18289775, 0.092270166, 0.09970921) * inp_1_2_1; + result3 += M4(0.046299033, -0.0038731368, -0.00625676, -0.009460825, 0.00062204845, 0.047890205, -0.0041801203, -0.028481482, -0.0037050957, 0.039239805, -0.008649513, -0.03477906, 0.12597682, 0.08933818, 0.042497773, -0.06470036) * inp_1_0_2; + result3 += M4(0.14617918, 0.005229593, -0.0501567, 0.069478005, -0.31181592, -0.10519494, -0.029231973, 0.06010956, -0.13888495, 0.12517981, -0.00579049, -0.09823023, 0.6077278, 0.055234488, 0.078748465, 0.022114666) * 
inp_1_1_2; + result3 += M4(0.05200068, 0.055454627, 0.02337076, 0.011462933, -0.006175603, 0.057744995, 0.012468431, 0.05055063, -0.082297675, 0.006953254, -0.024784455, 0.013913281, -0.041024067, -0.06821284, -0.005379725, 0.025868118) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.03519386, 0.020771546, -0.06092822, 0.06694439, 0.009966364, 0.08845796, -0.087970845, -0.036957614, -0.22353762, 0.054692257, 0.32780975, 0.0006839374, -0.01862221, 0.11244745, 0.049653698, -0.040946584) * inp_2_0_0; + result0 += M4(-3.3792534e-05, -0.037827175, -0.0021955103, 0.038683914, -0.027731497, -0.008400333, -0.039806634, -0.062449142, -0.16357751, 0.046085265, -0.077466585, 0.17157899, 0.16051912, -0.009569097, -0.15054378, 0.07224473) * inp_2_1_0; + result0 += M4(-0.12121477, 0.00741661, 0.049274296, 0.0367287, -0.046093628, 0.040898, 0.05136005, 0.08081049, 0.012140579, -0.037353013, -0.07112558, -0.034909766, 0.16167422, 0.03786511, -0.015378625, -0.01624157) * inp_2_2_0; + result0 += M4(-0.0663365, -0.06115137, 0.09096096, -0.031260535, -0.025968976, -0.010863611, -0.016588423, 0.012816596, -0.736851, 0.15209731, 0.10394599, -0.672264, 0.15394175, -0.23876093, -0.00424517, -0.08416222) * inp_2_0_1; + result0 += M4(-0.040628262, -0.18910486, 0.24239047, -0.02539226, -0.032604747, -0.0074777473, 0.021508304, 0.010910954, -0.07856097, 0.11829924, -0.09963228, 0.20279798, -0.11184747, 0.20169383, -0.12306833, 0.0010044349) * inp_2_1_1; 
+ result0 += M4(0.06593747, -0.021727772, -0.078049734, -0.027246097, 0.042461947, 0.020668674, -0.07633065, 0.008510407, -0.059274238, 0.0015911838, 0.119982466, 0.009135035, 0.109331414, 0.22766785, 0.09203822, 0.021122389) * inp_2_2_1; + result0 += M4(0.02380947, 0.061284587, -0.05441463, 0.0042443695, 0.0030761897, -0.015208306, 0.078272484, 0.07259532, -0.69980097, 0.053883918, -0.66474944, -0.28192675, -0.0073506925, -0.02169072, -0.0030826845, 0.056019828) * inp_2_0_2; + result0 += M4(-0.09168379, 0.1576644, -0.21850447, -0.02639354, -0.057879586, 0.040835056, 0.04107616, -0.051199373, 0.14163044, -0.041191746, 0.00058892305, 0.18929687, 0.15363866, 0.0118714785, 0.045324255, 0.059029303) * inp_2_1_2; + result0 += M4(-0.05409983, 0.035369724, -0.054201934, -0.029860638, 0.07611687, 0.03037094, -0.017978035, -0.02643063, 0.054626707, -0.053077925, -0.07135389, 0.021989368, 0.27177697, -0.120982274, 0.05465457, -0.0055884663) * inp_2_2_2; + result1 += M4(0.03493821, 0.043080125, 0.0035047126, 0.03849063, 0.06393502, 0.080511086, 0.016567344, -0.04203288, -0.13447708, -0.18894845, -0.019703919, -0.38417652, -0.23795354, -0.05671812, -0.116186336, -0.19162156) * inp_2_0_0; + result1 += M4(0.11228363, 0.03397793, -0.07902017, 0.058452863, -0.06233874, 0.006367689, -0.015540989, -0.04156123, 0.08450284, 0.062186997, 0.11030411, 0.25390634, 0.07090044, -0.031088028, 0.26935562, -0.20305486) * inp_2_1_0; + result1 += M4(0.0050216704, 0.007666345, -0.09408847, -0.027508035, 0.07744078, -0.0858829, -0.027486075, 0.08274661, 0.006676095, -0.013881031, 0.04249068, 0.069553934, -0.041518852, -0.005108007, 0.036308933, 0.0030829133) * inp_2_2_0; + result1 += M4(0.033124767, 0.02691598, 0.12422652, 0.022402922, 0.003461032, 0.0834087, 0.0049670525, -0.08223503, 0.19833384, -0.39163148, -0.0032815367, -1.0814372, 0.12159805, -0.010273577, -0.23912533, 0.37317404) * inp_2_0_1; + result1 += M4(-0.08536951, -0.17612375, 0.05276799, -0.20962986, -0.08263536, -0.052930966, 
0.00743057, -0.029009147, 0.10561041, 0.2818868, -0.29869884, -0.27491766, 0.05908428, 0.30368373, -0.26572517, 0.9404553) * inp_2_1_1; + result1 += M4(0.0016916043, 0.028522108, 0.07193734, 0.056363445, -0.046301708, -0.092516795, -0.08134731, 0.077689245, 0.040148728, 0.035003696, -0.07245444, 0.033462606, -0.0028245777, 0.053184345, -0.09853116, -0.10275217) * inp_2_2_1; + result1 += M4(-0.10386956, 0.036102064, -0.04801716, 0.024403296, 0.03979467, -0.010715334, -0.092453316, 0.009072639, -0.14853695, -0.4095759, -0.13726044, -1.181292, 0.12713557, -0.049974903, -0.0067785005, -0.025925767) * inp_2_0_2; + result1 += M4(0.17170316, -0.13200247, -0.10278675, -0.21036159, 0.010567157, -0.06862603, 0.044727184, -0.06545584, 0.062359527, 0.089575015, 0.020037299, 0.030505616, -0.14575754, 0.23602366, -0.0005095541, 0.34895372) * inp_2_1_2; + result1 += M4(0.043262783, 0.0039280364, -0.03025543, -0.03344463, -0.04560934, -0.034239992, 0.004803988, -0.03988103, -0.015801929, -0.03631273, 0.07549837, -0.050647344, -0.19037472, -0.051564816, 0.18334927, 0.317741) * inp_2_2_2; + result2 += M4(0.017939113, 0.033808067, 0.013337525, 0.013338571, -0.026104536, 0.0021523843, 0.063422084, -0.008435395, 0.0014796632, -0.01593725, 0.3626783, 0.053695522, -0.23224196, -0.02838407, 0.19632407, -0.10586231) * inp_2_0_0; + result2 += M4(0.07115929, -0.10127339, -0.08562357, 0.014140073, -0.08980039, -0.05160459, 0.07157348, 0.068261, 0.023636142, 0.06479512, 0.12661268, 0.021240188, 0.06230698, -0.04328473, -0.22837892, -0.001120956) * inp_2_1_0; + result2 += M4(0.035445914, 0.044792846, 0.043199282, -0.058268394, -0.025570352, -0.07725152, 0.06447988, 0.08822611, -0.01431678, -0.0058982414, -0.09265362, 0.008680186, -0.13813685, -0.031577934, -0.07259829, 0.031110931) * inp_2_2_0; + result2 += M4(0.046934675, -0.046772964, -0.079469174, -0.041171886, 0.08315339, -0.030660095, -0.046969607, -0.044603206, 0.1088084, -0.3271513, 0.4827227, -0.00073664036, -0.11883226, -0.04861558, 
-0.107335076, 0.019172063) * inp_2_0_1; + result2 += M4(-0.06326496, 0.17220448, 0.18118903, -0.07713064, 0.05416083, 0.027322814, 0.09561443, 0.083409004, -0.15603146, -0.080915086, -0.32056457, 0.29618284, 0.6779934, 0.23570892, 0.05733165, -0.0550815) * inp_2_1_1; + result2 += M4(-0.09341537, -0.012737399, -0.11717243, 0.13527763, -0.03188427, 0.081400484, -0.08873576, -0.08301504, 0.059625685, 0.020269057, 0.010163222, 0.01648694, -0.023158077, -0.10110675, -0.03397466, -0.03787835) * inp_2_2_1; + result2 += M4(0.009182551, 0.020346174, 0.022581046, -0.058744755, 0.024768678, -0.057315476, 0.002723283, 0.02727885, -0.10255867, -0.24883124, 0.11087838, 0.20040388, -0.022830166, -0.020115368, -0.038202837, 0.094623245) * inp_2_0_2; + result2 += M4(0.028593393, -0.009744626, -0.15439138, 0.18110561, -0.058348615, 0.08616409, -0.04128328, 0.043372136, -0.19122921, -0.026798584, 0.0474954, -0.2528174, -0.101200946, -0.062434033, 0.03201408, 0.057487406) * inp_2_1_2; + result2 += M4(-0.0013166185, -0.018694969, -0.06734548, 0.06859655, 0.08430593, -0.01940095, 0.041605387, -0.055890627, -0.026176976, 0.011013619, 0.008539067, -0.019987924, -0.05475008, 0.027200852, 0.06283524, -0.2617577) * inp_2_2_2; + result3 += M4(0.013725179, -0.061932757, 0.045672245, 0.050379913, 0.0788672, -0.07998998, -0.016853781, -0.083918825, -0.15966989, 0.019984895, 0.0062870965, 0.28606316, 0.04915436, -0.011288526, 0.014948044, -0.07217862) * inp_2_0_0; + result3 += M4(0.099728964, 0.019777179, -0.05474517, 0.07847718, 0.08612672, -0.0842426, -0.060081817, 0.042335063, -0.08624977, 0.019552974, -0.09990619, 0.13993576, 0.2796346, -0.19697501, -0.035683982, -0.064266436) * inp_2_1_0; + result3 += M4(0.04046714, 0.044116072, -0.02477698, 0.046863623, -0.023625096, -0.05061273, 0.097901285, 0.04918668, 0.05531759, -0.0047716047, 0.03271952, 0.012900423, 0.010711064, -0.06245105, 0.038325533, -0.013503033) * inp_2_2_0; + result3 += M4(-0.016706655, -0.025500009, -0.002248052, -0.033774734, 
-0.079098985, -0.0051736236, -0.03546944, 0.07374924, -0.808723, -0.54684496, 0.05268168, 0.43765536, -0.08996461, 0.09093547, -0.0009905121, -0.0023711629) * inp_2_0_1; + result3 += M4(-0.14838111, -0.09827265, 0.2247343, -0.07767093, -0.08234698, 0.017499017, 0.048514254, 0.041478686, 0.20503302, -0.06761944, -0.26098138, 0.22514617, 0.19708426, 0.43080166, -0.17789333, -0.005553808) * inp_2_1_1; + result3 += M4(-0.09141383, -0.05565759, 0.052848406, 0.07877255, 0.092179105, 0.024564177, -0.010492621, 0.03952363, -0.011052075, -0.020905806, -0.014796553, -0.010458158, 0.16574955, 0.017756697, -0.112289995, -0.19061698) * inp_2_2_1; + result3 += M4(-0.012942791, -0.09701864, 0.039916683, 0.014046996, 0.02276102, -0.038104624, -0.05454621, -0.017268764, 0.14468248, 0.22772491, -0.13311438, 0.021296846, 0.018167509, 0.07592232, -0.043419812, 0.070708245) * inp_2_0_2; + result3 += M4(0.027744744, -0.04099133, -0.047819644, 0.0120844925, -0.033083685, -0.08534956, -0.07539677, -0.057747744, -0.0737084, -0.09107881, -0.0014842128, 0.4171075, -0.2807641, -0.14693853, 0.020089995, 0.12872282) * inp_2_1_2; + result3 += M4(-0.02645917, -0.036230065, 0.0013453881, -0.053119272, -0.04390945, -0.07620047, -0.061788194, 0.100186884, -0.021604344, 0.018383984, -0.006580493, 0.07360969, 0.06294429, 0.114074826, 0.0922581, 0.10860966) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.19773234, 0.0040025134, -0.19928102, 0.05982445, 
0.10238352, -0.04136469, -0.10717808, 0.11060676, -0.024479374, 0.006888121, -0.049817488, -0.032475132, 0.0005060402, 0.027150108, -0.01389521, 0.03011166) * inp_3_0_0; + result0 += M4(-0.10382486, 0.016261084, 0.10074889, -0.036058605, -0.28665686, -0.22176702, 0.16188395, 0.072151855, 0.16958801, 0.19100334, -0.07586979, -0.008691376, -0.15168019, -0.076181546, 0.10785355, -0.044232473) * inp_3_1_0; + result0 += M4(-0.034232676, 0.12174497, 0.12540244, -0.00615272, -0.104418986, -0.1441321, -0.061950747, -0.039816953, -0.020058908, 0.09946141, 0.06271718, 0.03362542, -0.081220925, -0.07135675, -0.09202891, 0.031732865) * inp_3_2_0; + result0 += M4(-0.019257972, 0.23448941, 0.2296378, -0.013084976, 0.14259407, -0.23327808, 0.18332508, -0.0981734, -0.13848236, 0.21527474, -0.18854348, 0.03302416, -0.11364098, -0.062779635, -0.0003776771, 0.056423634) * inp_3_0_1; + result0 += M4(0.39262342, -0.60916656, 0.11890576, 0.008154147, -0.25903428, -0.6944411, -0.30703035, -0.26949775, 0.33802876, 0.5117939, 0.30353963, 0.22217596, -0.3185454, -0.19438665, -0.38905796, 0.20958135) * inp_3_1_1; + result0 += M4(-0.31000933, -0.095929846, -0.09873588, 0.0526352, -0.13051024, -0.06996045, 0.05097093, 0.12195579, 0.16819753, 0.06406409, -0.037765402, -0.05460069, -0.025167787, -0.6610153, -0.1280548, -0.18461606) * inp_3_2_1; + result0 += M4(-0.07626507, -0.027585149, 0.16430154, -0.068786874, -0.11812134, -0.20239244, 0.20651695, 0.117651924, 0.103023574, 0.06551238, -0.17495835, -0.053802766, 0.02019847, 0.042211883, -0.0792073, 0.04661087) * inp_3_0_2; + result0 += M4(0.18774892, -0.22588675, 0.11697573, -0.02098111, -0.098473765, -0.12450782, -0.2092941, -0.0026268938, 0.19874147, 0.13118155, 0.1781314, -0.00842974, -0.031992726, -0.05670131, 0.20423128, -0.00074609526) * inp_3_1_2; + result0 += M4(-0.06835169, 0.016473854, 0.029923515, -0.008443641, 0.23226224, -0.08359965, 0.1304451, 0.040005654, -0.050561354, 0.048547532, 0.04456618, 0.016158111, 0.062703654, 
0.0092108315, -0.10469197, -0.06267775) * inp_3_2_2; + result1 += M4(0.15233582, 0.19007146, -0.041311294, 0.11373788, 0.11148112, 0.04161408, 0.022334483, 0.092816405, 0.028468959, 0.026755488, 0.008363913, 0.06473331, 0.0011780987, -0.019047763, 0.09523404, -0.08244701) * inp_3_0_0; + result1 += M4(-0.0098125795, -0.04201503, -0.1326031, -0.08045925, 0.20360228, 0.026760735, -0.26419288, 0.15499987, 0.056399953, 0.14250176, 0.028358502, -0.033754945, 0.12579347, -0.052264683, 0.2556933, 0.18257244) * inp_3_1_0; + result1 += M4(-0.095059596, 0.021393813, -0.026516682, -0.007583113, 0.048850205, -0.046467386, 0.030013174, 0.10140715, 0.05695302, 0.089559756, 0.021871507, -0.014836824, 0.1737422, 0.13004734, 0.20477152, 0.23618454) * inp_3_2_0; + result1 += M4(0.05689886, 0.1384205, 0.055440158, -0.2634709, 0.40263698, -0.018188346, -0.19718939, -0.021893239, -0.25167263, -0.0302215, 0.1494233, -0.060639318, 0.17440826, -0.005995121, 0.1752686, 0.08358246) * inp_3_0_1; + result1 += M4(-0.11837638, -0.27371556, 0.20988613, -0.92515045, 0.7948933, 0.19478232, 0.08756208, 0.09321127, -0.6920545, -0.11605966, -0.0602716, -0.47996294, 0.5221947, -0.036128834, -0.085451365, -0.52814066) * inp_3_1_1; + result1 += M4(0.09521452, -0.08006706, -0.08897774, -0.21125159, -0.03079481, 0.046952967, -0.026647106, -0.047232367, -0.124124646, 0.033768218, 0.052450426, -0.12203157, 0.47032583, -0.22275928, -0.102736816, 0.026622942) * inp_3_2_1; + result1 += M4(-0.07079185, 0.14451918, 0.17062652, 0.025385572, 0.22244516, 0.034709886, 0.17516658, -0.033176485, -0.19369905, -0.020304324, -0.14346293, 0.16571403, 0.049146105, 0.019382618, -0.058748543, 0.12871866) * inp_3_0_2; + result1 += M4(0.102248736, -0.0337236, 0.0071350574, -0.03248206, 0.06347463, -0.041544788, -0.1049145, 0.010971773, -0.085705966, 0.18427896, 0.17459114, 0.3247006, 0.20611103, 0.119550996, 0.08841569, 0.15119329) * inp_3_1_2; + result1 += M4(0.17931168, 0.16252843, -0.020840246, -0.08419524, -0.12440272, 
-0.006738672, 0.14970261, 0.157197, 0.039103635, 0.099136084, -0.07311536, 0.09651158, 0.05364095, -0.15176328, -0.13609104, -0.0833755) * inp_3_2_2; + result2 += M4(0.090288036, -0.055971667, 0.1480006, 0.04578793, 0.09695163, -0.03401928, -0.05294258, 0.07264915, 0.034997385, 0.033377692, -0.012243337, 0.006176055, 0.0420061, 0.0017590974, 0.059313867, 0.055868845) * inp_3_0_0; + result2 += M4(0.12215243, 0.049981244, 0.078155525, -0.03721692, 0.00081549905, 0.070513256, 0.023916868, -0.068173625, 0.21320094, -0.0793969, 0.12491556, 0.06683648, 0.12349867, 0.09697064, -0.19347167, 0.16261415) * inp_3_1_0; + result2 += M4(0.0036620256, -0.008251636, 0.16044019, 0.0038811674, 0.17711705, 0.056581743, -0.059190765, 0.00294404, 0.024791382, 0.013117927, 0.1321051, -0.023086015, 0.21306372, -0.060495336, -0.06985338, 0.12514174) * inp_3_2_0; + result2 += M4(0.0312112, -0.11488951, 0.31389415, -0.11953462, -0.068046354, -0.14420296, 0.12760502, -0.09679173, 0.08755888, 0.07094847, -0.095602505, -0.016698444, 0.012757536, 0.045577306, -0.10753733, -0.042271823) * inp_3_0_1; + result2 += M4(-0.49250764, -0.12012084, 0.2342404, -0.6256464, 0.367146, 0.14924204, 0.6591491, 0.048179522, -0.35884148, -0.1678469, -0.3900169, -0.30488762, -0.22384477, 0.004431448, -0.00562058, -0.24071592) * inp_3_1_1; + result2 += M4(0.12204024, 0.074117884, 0.12283045, -0.07810565, 0.13246378, 0.08325109, 0.22934341, -0.2973156, -0.043851215, -0.085699715, -0.25161895, 0.020704068, 0.21119992, 0.04622388, -0.055380527, 0.14471737) * inp_3_2_1; + result2 += M4(-0.074895434, -0.06270641, 0.060614184, 0.13333398, -0.035534456, -0.018466184, -0.10737744, 0.14484845, 0.12699716, 0.07270939, 0.10774756, 4.7753732e-05, 0.14590403, 0.03653374, -0.01690645, 0.05341992) * inp_3_0_2; + result2 += M4(0.165294, 0.12768765, 0.16723107, -0.12056439, 0.12686896, -0.030246196, -0.15657917, 0.07142477, -0.0709559, -0.008950173, -0.036407184, -0.078462794, 0.22401553, 0.11724086, -0.09732008, 0.26752585) * 
inp_3_1_2; + result2 += M4(0.05091784, -0.0036859773, -0.025390401, 0.22719525, -0.06461589, 0.036899187, 0.099762656, -0.20599271, 0.054967627, -0.008055024, -0.031206395, 0.106771916, 0.056380093, 0.058899213, -0.121471696, -0.055402637) * inp_3_2_2; + result3 += M4(-0.026850104, 0.032930214, -0.07506575, 0.029188028, 0.028521763, 0.099263564, -0.015998442, 0.15630326, 0.006329006, -0.053651378, 0.022603864, -0.027682748, 0.012513269, -0.03688965, 0.009188487, 0.066707715) * inp_3_0_0; + result3 += M4(0.13048565, 0.1046288, 0.059150916, 0.046943232, -0.12111611, -0.058344387, 0.06613853, 0.15171036, -0.026610931, 0.059549157, -0.0065440265, -0.030438675, -0.3000826, -0.10964842, -0.019215975, 0.042909347) * inp_3_1_0; + result3 += M4(-0.14147408, 0.020621499, -0.061839666, -0.0786287, 0.05444145, 0.09064469, 0.051645663, 0.02046913, -0.12140889, -0.06441972, -0.14962567, -0.07454032, -0.21723782, -0.12441716, 0.0063856477, 0.07751481) * inp_3_2_0; + result3 += M4(-0.15052302, 0.12364792, -0.07333968, -0.106281765, -0.26465237, 0.18124165, -0.15878557, -0.0863266, 0.28953597, -0.104721405, 0.010609605, 0.00013846748, 0.023336895, -0.09811715, -0.062712066, 0.15814303) * inp_3_0_1; + result3 += M4(-0.1505338, -0.25127456, -0.010185877, 0.10018608, -0.46148112, 0.7820113, -0.2994022, 0.16474903, 0.393985, -0.53803116, 0.2856222, -0.1782298, 0.10528467, -0.16190316, 0.018561272, 0.008876788) * inp_3_1_1; + result3 += M4(0.16577095, 0.07553432, 0.074692585, 0.05206232, -0.087388374, 0.090719454, -0.25296533, 0.09053648, 0.20446649, 0.0515907, 0.13263685, -0.122028425, -0.04356239, -0.15438107, 0.17627592, 0.03334808) * inp_3_2_1; + result3 += M4(0.038740914, 0.18525128, 0.04935017, -0.058124084, 0.054568756, 0.21678539, -0.08873143, 0.01656806, 0.026606297, -0.4565078, 0.09821042, 0.04551522, -0.059372384, -0.22013853, 0.015601125, 0.093543395) * inp_3_0_2; + result3 += M4(-0.0804898, 0.0008990494, -0.030963572, 0.12500906, -0.104006045, -0.014657448, 0.022204293, 
0.12654208, 0.06328144, -0.09054795, 0.096949615, -0.06529515, 0.06216197, -0.20189077, -0.014465873, -0.061704617) * inp_3_1_2; + result3 += M4(-0.16651894, -0.15619473, -0.038332544, 0.05948654, 0.04223932, 0.110509776, 0.015117032, 0.13600627, -0.161015, -0.1257106, -0.037504923, -0.059075683, 0.09092152, -0.022672275, 0.017996153, -0.10931976) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(2, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(0, 1), result2); + imageStore(out_image, output_base + ivec2(1, 1), result3); +} + +//!DESC ArtCNN C4F16 DS (Conv2D-6) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d +//!BIND conv2d_5 +//!SAVE conv2d_6 +//!WIDTH LUMA.w 1.0 * +//!HEIGHT LUMA.h 1.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[4][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(2, 2); + inp[0][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 
0)); + inp[2][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[3][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.07942048, 0.07821269, 0.082289174, 0.07892917); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.11636982, -0.059329264, -0.032452207, -0.05000699, 0.0027298967, -0.014784354, -0.018898953, -0.026387399, -0.04866522, -0.0034517667, -0.036040183, -0.015461949, 0.15003136, 0.1010024, 0.06595967, 0.08420603) * inp_0_0_0; + result0 += M4(-0.17095192, -0.23162094, -0.0027919277, 0.018584667, 0.0009346624, 0.006145241, -0.06807188, 0.005982439, -0.10259334, -0.23113409, 0.05056581, 0.015863553, 0.021340631, 0.13316575, 0.05575838, 0.008457389) * inp_0_1_0; + result0 += M4(-0.008553572, -0.054848403, -0.01347387, -0.04445713, -0.08472665, -0.08376867, -0.077503465, -0.10499659, -0.056032624, -0.013359254, -0.030728646, 0.043963596, 0.08870928, 0.045146573, 0.05971686, 0.03278427) * inp_0_2_0; + result0 += M4(0.19588293, -0.04648465, 0.027297234, 0.05453258, 0.06473069, -0.043464746, 0.223268, -0.02648231, 0.0062739355, 0.024977092, 0.08271271, -0.005075647, 0.17125973, 0.10962147, 0.1618092, 0.11265603) * inp_0_0_1; + result0 += M4(0.098922394, 0.26493427, -0.08755517, -0.13988777, 
-0.24570113, 0.14201127, -0.18969332, 0.32599792, -0.06624849, 0.08593866, -0.022810698, -0.05292953, 0.19407418, 0.19186307, 0.14618841, 0.22404681) * inp_0_1_1; + result0 += M4(0.0024095443, 0.09542953, 0.05893327, 0.04963878, 0.043981288, -0.09458787, 0.048440147, -0.13017173, 0.010817999, 0.009894588, -0.007898175, 0.11123364, 0.15274785, 0.18122944, 0.14603429, 0.21482544) * inp_0_2_1; + result0 += M4(-0.015920863, 0.0045611686, 0.030535664, -0.0011332423, -0.005275443, -0.0005943754, -0.025727643, -0.0031081287, 0.04642552, 0.018361727, 0.058243725, 0.029665668, 0.10241001, 0.02798229, 0.18251711, 0.004523951) * inp_0_0_2; + result0 += M4(-0.043556556, -0.065940246, 0.09670369, 0.07387089, 0.046474013, -0.00025676662, 0.04237812, -0.08965837, 0.037509654, 0.017891284, -0.09904582, 0.07562159, 0.038349077, 0.067137405, 0.06425105, 0.1743836) * inp_0_1_2; + result0 += M4(-0.019333778, -0.01060451, -0.0059877997, 0.06399235, 0.09297337, 0.07869079, 0.11191077, 0.041706722, 0.010740478, 0.011300985, -0.030533317, -0.109226234, 0.061926227, 0.124412335, 0.073686674, 0.10737882) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.07330701, -0.026571156, -0.043166053, -0.057155345, -0.06023793, -0.08201396, -0.017985104, 0.00259785, -0.046082836, 0.025884246, 0.015084661, -0.012299801, 0.07279219, 0.08398021, 0.01444768, 0.013628334) * inp_1_0_0; + result0 += M4(0.028485537, -0.13664272, -0.14637338, -0.03216143, 0.15768725, 
0.17180555, 0.22409278, 0.07486649, 0.054554522, -0.06476858, 0.029637309, 0.03151017, -0.031520635, -0.13686366, 0.0027829686, -0.0009537584) * inp_1_1_0; + result0 += M4(-0.07279511, 0.047922287, -0.039518423, -0.03210193, -0.001693885, 0.10270714, 0.011595117, 0.141228, -0.041493673, 0.068810634, -0.011981957, 0.05599499, 0.02523943, -0.058428146, 0.016682947, -0.020516759) * inp_1_2_0; + result0 += M4(-0.011101113, -0.09268024, 0.078101635, -0.06144573, -0.20039465, -0.10002031, -0.27066922, -0.23258542, 0.13703087, 0.015634691, -0.00731571, 0.06905305, 0.007901865, 0.06765415, 0.1434028, 0.09154159) * inp_1_0_1; + result0 += M4(0.20163926, 0.020502245, 0.22196925, 0.04834591, 0.14234507, 0.12385057, -0.14618975, 0.05025507, -0.08665632, 0.028551226, -0.03954753, -0.07490453, 0.08381951, -0.0992167, -0.122530974, 0.047114052) * inp_1_1_1; + result0 += M4(0.050744314, 0.12697436, 0.014369487, 0.062857516, -0.03313285, 0.013857357, -0.08860406, -0.14726935, 0.01688374, -0.078021325, 0.011625158, 0.01023778, 0.027463386, 0.046657313, 0.023117632, -0.013085234) * inp_1_2_1; + result0 += M4(-0.009447039, -0.0062994813, -0.030561144, 0.015915044, -0.09330408, -0.0530166, -0.12407174, -0.015852062, 0.0051147086, -0.007351941, 0.002542378, -0.008233577, -0.014825013, -0.0015592017, -0.05729564, -0.017423365) * inp_1_0_2; + result0 += M4(-0.004105685, 0.07282294, 0.069418795, -0.05498573, -0.00208156, -0.040487334, 0.1445179, 0.051521864, -0.025368946, -0.013219188, -0.006728517, -0.07625849, -0.024420908, -0.0044598207, -0.015377865, -0.13657852) * inp_1_1_2; + result0 += M4(0.03599884, -0.0105478745, 0.038746145, 0.0507682, -0.025521498, -0.024232486, 0.011020209, 0.10047172, 0.05457663, 0.006208522, 0.055378985, -0.08648434, -0.0041283113, -0.01650629, 0.004291274, 0.023595793) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 
0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.02625175, 0.044448208, 0.025820026, 0.042625286, -0.14325926, -0.07368913, -0.035370324, -0.0483055, 0.022411536, 0.07837778, 0.014711007, 0.0089601325, 0.14614141, -0.013843195, -0.00183343, 0.030992392) * inp_2_0_0; + result0 += M4(-0.13943392, -0.027668366, -0.00605077, -0.010792682, -0.13432038, -0.06360804, 0.023869146, 0.018617587, 0.010982281, -0.12519816, -0.01816795, -0.012343567, -0.14264211, 0.0608064, -0.057635155, -0.12452771) * inp_2_1_0; + result0 += M4(-0.0023510873, -0.10876355, -0.020073038, -0.06581549, 0.024724813, 0.02788125, 0.012666816, 0.0075549004, 0.05302175, 0.062297385, 0.05456386, 0.035653763, -0.023079487, 0.04906416, 0.003889142, 0.048161693) * inp_2_2_0; + result0 += M4(0.013490228, 0.07731822, 0.024770379, 0.07787996, -0.24148642, -0.060349345, -0.287201, -0.058063217, 0.022927651, 0.07323395, 0.052245375, 0.14675435, 0.13006328, -0.0066324794, 0.13043395, -0.049508587) * inp_2_0_1; + result0 += M4(-0.06425463, -0.22909608, -0.30965263, -0.26137868, -0.34838507, -0.29899263, -0.1757177, -0.14641738, 0.04428377, -0.120601766, -0.072301604, -0.20429672, -0.029560901, -0.09850866, -0.010453421, 0.10752421) * inp_2_1_1; + result0 += M4(-0.12946495, -0.026556134, -0.054903407, -0.053088266, 0.4175077, -0.0046152826, 0.4301187, 0.08127058, -0.07252503, -0.1153844, -0.047318444, -0.099470355, -0.041942548, -0.054621693, 0.0133567965, 0.042263526) * inp_2_2_1; + result0 += M4(0.025980724, 0.014801285, 0.072112806, 0.0075275926, -0.0875942, -0.0022423542, -0.13813959, 0.011640581, 0.0011581844, 0.010904438, 0.009565574, 0.025610453, 
-0.006016893, 0.008746938, 0.007246336, -0.0147160785) * inp_2_0_2; + result0 += M4(0.0027364742, -0.043662306, 0.12877765, 0.017689677, 0.068794884, 0.019460868, -0.15110509, -0.13969134, 0.029709235, 0.078996494, 0.09302569, -0.1334812, 0.0063821794, -0.04602352, -0.024196027, -0.041869137) * inp_2_1_2; + result0 += M4(0.0033705158, 0.023012036, 0.00072865334, -0.013672455, 0.122846015, 0.15923437, 0.16657215, 0.10410814, 0.004356331, 0.010504295, 0.022496942, 0.07418264, -0.012007829, 0.032746863, 0.0027330485, 0.046688467) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.051054563, -0.00456595, -0.042562753, -0.024147434, -0.00081743393, 0.013612098, 0.01936531, 0.002067961, 0.024665983, 0.012183512, 0.021107063, 0.009794894, -0.117395766, -0.0810702, -0.04262109, -0.062447358) * inp_3_0_0; + result0 += M4(-0.03957509, -0.09165404, 0.007803734, -0.0041818433, 0.03165929, 0.027758801, -0.029112441, -0.0097638285, -0.03506947, -0.05936886, -0.05541801, -0.042584933, -0.059623193, -0.078187235, 0.024642546, 0.025905272) * inp_3_1_0; + result0 += M4(0.020659385, 0.05987362, 0.019810732, 0.054049026, -0.11781507, 0.03852306, -0.06292107, 0.0017821233, 0.040627886, 0.060671348, 0.02914991, 0.040991165, -0.07832766, -0.089677714, -0.055762652, -0.051040996) * inp_3_2_0; + result0 += M4(-0.040154513, -0.05843724, 0.06427843, -0.017596226, -0.051048756, 0.02946234, -0.07376165, 0.0671994, 0.035830647, -0.025981605, 0.022482721, 
0.029612, -0.060820963, 0.005068918, -0.095560856, 0.030644644) * inp_3_0_1; + result0 += M4(0.24542196, 0.28494206, -0.21151958, -0.045248456, 0.14401782, -0.25568277, 0.1352637, -0.14852664, -0.48348254, -0.38713354, -0.39508206, -0.36013454, 0.35612994, 0.3228882, 0.34563643, 0.2669279) * inp_3_1_1; + result0 += M4(0.019076044, -0.0065221814, 0.03210429, -0.044332933, -0.06425407, 0.15088789, -0.10005643, 0.058653727, 0.026831932, -0.028788581, -0.019654373, -0.021367684, -0.11187411, -0.13136683, -0.10140025, -0.14363958) * inp_3_2_1; + result0 += M4(-0.03955165, -0.01919648, -0.06769437, -0.015274202, -0.012194205, 0.019330177, -0.0036170697, -0.0025878681, 0.1370301, 0.068571426, 0.18895936, 0.022519762, -0.032886382, 0.019316927, -0.05880236, 0.016897488) * inp_3_0_2; + result0 += M4(0.0019176262, -0.017462652, 0.126458, 0.06268182, 0.033145472, -0.025241157, 0.03292383, -0.102716744, 0.17617765, 0.16449314, -0.025039112, 0.07926759, 0.14934446, 0.055328105, 0.08959302, -0.0035233765) * inp_3_1_2; + result0 += M4(-0.03253326, -0.031951077, -0.018886896, -0.010784618, 0.009762149, 0.025690984, 0.034363244, 0.12997335, 0.10610043, 0.17722273, 0.09206027, 0.11330327, -0.018846225, 0.0020707906, -0.032037612, -0.03225054) * inp_3_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(1, 1); + imageStore(out_image, output_base + ivec2(0, 0), result0); +} + +//!DESC ArtCNN C4F16 DS (Depth-To-Space) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d_6 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +void hook() { + vec4 result = vec4(0.0, 0.0, 0.0, 1.0); + vec2 f0 = fract(conv2d_6_pos * conv2d_6_size); + ivec2 i0 = 
ivec2(f0 * vec2(2.0)); + result.x = conv2d_6_tex((vec2(0.5) - f0) * conv2d_6_pt + conv2d_6_pos)[i0.y * 2 + i0.x]; + imageStore(out_image, ivec2(gl_GlobalInvocationID), clamp(result, 0.0, 1.0)); +} diff --git a/shaders/ArtCNN_C4F32_DS.glsl b/shaders/ArtCNN_C4F32_DS.glsl new file mode 100644 index 0000000..70254f6 --- /dev/null +++ b/shaders/ArtCNN_C4F32_DS.glsl @@ -0,0 +1,3927 @@ +// MIT License + +// Copyright (c) 2024 Joao Chrisostomo, Kacper Michajłow + +// Permission is hereby granted, free of charge, to any person obtaining a copy +// of this software and associated documentation files (the "Software"), to deal +// in the Software without restriction, including without limitation the rights +// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +// copies of the Software, and to permit persons to whom the Software is +// furnished to do so, subject to the following conditions: + +// The above copyright notice and this permission notice shall be included in all +// copies or substantial portions of the Software. + +// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +// SOFTWARE. 
+ +//!DESC ArtCNN C4F32 DS (Conv2D) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND LUMA +//!SAVE conv2d +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared F inp[1][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(1, 1); + inp[0][y][x] = F(LUMA_mul * texelFetch(LUMA_raw, input_base + ivec2(0, 0), 0).x); + } + } + + barrier(); + V4 result0 = V4(0.00059421, -0.0026045588, -0.0006108253, -0.08492119); + V4 result1 = V4(-0.00035372374, -0.0003572344, -0.0013393819, 0.0005660144); + V4 result2 = V4(0.002993011, 0.0070888526, 0.0020018439, 0.002501177); + V4 result3 = V4(-0.0024211009, -0.05971874, -5.7197096e-05, 0.000981694); + V4 result4 = V4(-0.0008129696, 0.0007712776, 0.00034729243, -0.0001277347); + V4 result5 = V4(-0.00021367395, 9.3650204e-05, 0.0008922946, 0.0001584326); + V4 result6 = V4(-0.0030164458, -9.39177e-06, 0.029349048, 0.0389926); + V4 result7 = V4(-0.0009346589, -0.0003968174, 0.0067445743, -0.00035754472); + const F inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const F inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const F inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const F inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const F inp_0_1_1 = inp[0][local_xy.y + 
1][local_xy.x + 1]; + const F inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const F inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const F inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const F inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += V4(-0.05720956, -0.06903012, 0.068310924, -0.038781982) * inp_0_0_0; + result0 += V4(0.040161997, 0.2013884, -0.070959255, -0.00211659) * inp_0_1_0; + result0 += V4(-0.027866466, -0.1263024, 0.03945074, 0.03977398) * inp_0_2_0; + result0 += V4(0.09448115, -0.012722074, -0.017741358, -0.18534198) * inp_0_0_1; + result0 += V4(-0.025378618, -0.03839837, -0.04376362, 0.11720926) * inp_0_1_1; + result0 += V4(0.012214564, 0.039207757, 0.023578104, 0.12853287) * inp_0_2_1; + result0 += V4(-0.026298959, 0.08818499, -0.040490296, -0.0063463673) * inp_0_0_2; + result0 += V4(-0.033232253, -0.15830266, 0.089201175, 0.059763063) * inp_0_1_2; + result0 += V4(0.021248993, 0.078120664, -0.046352822, 0.08057135) * inp_0_2_2; + result1 += V4(0.0084586125, 0.06546896, 0.089953765, 0.09739724) * inp_0_0_0; + result1 += V4(0.07370753, -0.052235793, 0.06624783, -0.11533037) * inp_0_1_0; + result1 += V4(-0.058357798, 0.024528306, -0.13545036, -0.038999118) * inp_0_2_0; + result1 += V4(-0.008160546, -0.040027905, -0.10843342, -0.1526205) * inp_0_0_1; + result1 += V4(-0.086275786, 0.05316023, 0.049899112, 0.16811445) * inp_0_1_1; + result1 += V4(0.045399483, -0.07085666, 0.029709175, 0.07084875) * inp_0_2_1; + result1 += V4(-0.022196436, -0.056992456, 0.0076457784, 0.063735776) * inp_0_0_2; + result1 += V4(0.034277212, 0.017756267, -0.11179555, -0.055455405) * inp_0_1_2; + result1 += V4(0.013569325, 0.0612484, 0.11416159, -0.037677463) * inp_0_2_2; + result2 += V4(-0.018447109, 0.016015902, 0.0638154, -0.015687577) * inp_0_0_0; + result2 += V4(0.031911608, 0.08540334, -0.15331753, 0.003208568) * inp_0_1_0; + result2 += V4(-0.03360432, -0.01761468, 0.04523877, -0.025072247) * inp_0_2_0; + result2 += V4(-0.07640721, 
-0.20427635, -0.063998245, -0.07356574) * inp_0_0_1; + result2 += V4(-0.3287912, 0.5197998, 0.35349694, 0.09646598) * inp_0_1_1; + result2 += V4(-0.0007118964, -0.32668594, -0.21552823, 0.10529735) * inp_0_2_1; + result2 += V4(0.120177075, -0.06988313, 0.009631942, 0.011986648) * inp_0_0_2; + result2 += V4(0.25396907, 0.008469441, -0.16536789, -0.12251586) * inp_0_1_2; + result2 += V4(0.04895496, -0.011422383, 0.12547605, 0.015737237) * inp_0_2_2; + result3 += V4(-0.00071473006, 0.034433134, -0.007700647, -0.008681562) * inp_0_0_0; + result3 += V4(-0.039788723, 0.19000232, -0.0065628244, -0.024851965) * inp_0_1_0; + result3 += V4(0.03886775, 0.025879256, 0.04063019, 0.015064802) * inp_0_2_0; + result3 += V4(0.007172039, 0.10771867, -0.05134853, 0.017718824) * inp_0_0_1; + result3 += V4(-0.018345907, 0.23767412, 0.03607096, 0.08546286) * inp_0_1_1; + result3 += V4(0.052992802, 0.18220265, -0.040996663, -0.054348283) * inp_0_2_1; + result3 += V4(0.021435615, 0.11114274, 0.041500676, -0.015510711) * inp_0_0_2; + result3 += V4(-0.088456504, 0.014998645, -0.0077594114, -0.05686206) * inp_0_1_2; + result3 += V4(0.02980781, 0.08559099, -0.0027411773, 0.040014014) * inp_0_2_2; + result4 += V4(-0.010802783, 0.041537613, 0.013188507, -0.0100586405) * inp_0_0_0; + result4 += V4(0.02343228, -0.039955676, -0.064961195, -0.001099957) * inp_0_1_0; + result4 += V4(-0.030414548, 0.008641178, 0.0730152, 0.033116963) * inp_0_2_0; + result4 += V4(-0.00615819, -0.028239103, -0.008127953, -0.058925588) * inp_0_0_1; + result4 += V4(-0.05042115, 0.044934776, 0.10996656, -0.008548018) * inp_0_1_1; + result4 += V4(0.06839975, -0.010754858, -0.09766665, 0.019332128) * inp_0_2_1; + result4 += V4(0.025619071, -0.011547161, 0.011049605, 0.05791401) * inp_0_0_2; + result4 += V4(0.030315332, -0.01088887, -0.054349568, 0.033717196) * inp_0_1_2; + result4 += V4(-0.049095597, 0.0049878936, 0.018198276, -0.06530356) * inp_0_2_2; + result5 += V4(-0.01616407, 0.0008555966, 0.021815524, 0.0802821) * 
inp_0_0_0; + result5 += V4(0.008259966, -0.011062282, 0.03494704, -0.024195926) * inp_0_1_0; + result5 += V4(0.002716732, 0.008612918, -0.034620512, -0.08136076) * inp_0_2_0; + result5 += V4(-0.028693613, -0.005875763, 0.009658498, -0.09647011) * inp_0_0_1; + result5 += V4(0.01297196, 0.023385055, -0.06589606, -0.0076495893) * inp_0_1_1; + result5 += V4(0.020628722, -0.010835739, 0.0860356, 0.143927) * inp_0_2_1; + result5 += V4(0.03235066, 0.00762383, -0.035273455, 0.02806298) * inp_0_0_2; + result5 += V4(0.015449638, -0.012428944, 0.03868852, 0.029288178) * inp_0_1_2; + result5 += V4(-0.047466204, -0.00035494898, -0.05860554, -0.072583735) * inp_0_2_2; + result6 += V4(-0.041209485, 0.049689256, 0.03848615, -0.02230328) * inp_0_0_0; + result6 += V4(-0.015236934, -0.03890892, 0.24399142, -0.11847331) * inp_0_1_0; + result6 += V4(0.0753005, -0.004737102, 0.12888695, 0.007313608) * inp_0_2_0; + result6 += V4(-0.13407758, -0.032969758, -0.25555563, -0.013154287) * inp_0_0_1; + result6 += V4(0.18857452, 0.032050285, -0.354498, -0.18323424) * inp_0_1_1; + result6 += V4(-0.021725243, -0.0043262867, 0.19019929, 0.027484423) * inp_0_2_1; + result6 += V4(0.17300096, -0.0017002843, -0.05499701, 0.026156604) * inp_0_0_2; + result6 += V4(-0.17121573, -0.013974816, -0.003403842, 0.08982031) * inp_0_1_2; + result6 += V4(-0.049816374, 0.0146233495, -0.022609651, 0.111714736) * inp_0_2_2; + result7 += V4(0.012295933, -0.18987696, -0.046402045, -0.016141297) * inp_0_0_0; + result7 += V4(-0.0012115657, -0.19670378, -0.012887067, 0.06507453) * inp_0_1_0; + result7 += V4(0.029934919, -0.025932675, -0.025668262, -0.0581377) * inp_0_2_0; + result7 += V4(-0.016512442, -0.21443945, 0.01515749, 0.06466304) * inp_0_0_1; + result7 += V4(-0.076333076, 0.49315628, 0.08659942, -0.055057593) * inp_0_1_1; + result7 += V4(0.015373549, 0.115858175, 0.009898049, 0.02554801) * inp_0_2_1; + result7 += V4(-0.008511473, -0.0421585, -0.02655636, -0.052159943) * inp_0_0_2; + result7 += V4(0.07152557, 
0.09254572, -0.010450508, -0.003908911) * inp_0_1_2; + result7 += V4(-0.02420516, 0.0012162832, -0.0006933234, 0.029896354) * inp_0_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(2, 0), result2); + imageStore(out_image, output_base + ivec2(3, 0), result3); + imageStore(out_image, output_base + ivec2(0, 1), result4); + imageStore(out_image, output_base + ivec2(1, 1), result5); + imageStore(out_image, output_base + ivec2(2, 1), result6); + imageStore(out_image, output_base + ivec2(3, 1), result7); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-1-ReLU) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND conv2d +//!SAVE conv2d_1 +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_mul * 
texelFetch(conv2d_raw, input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(-0.042714596, 0.011591515, 0.07238511, 0.03595657); + V4 result1 = V4(0.010827413, -0.36382675, -0.014524071, -0.014273523); + V4 result2 = V4(-0.00071941706, 0.03461611, 0.03235031, 0.037781585); + V4 result3 = V4(-0.016128618, 0.036656387, -0.02016149, -0.010464984); + V4 result4 = V4(0.017564462, 0.00023234202, -0.006873899, -1.1628507); + V4 result5 = V4(0.019172806, 0.010472192, 0.009836619, 0.0031299193); + V4 result6 = V4(0.0018006279, 0.02388624, 0.00819407, -0.03491282); + V4 result7 = V4(0.025965977, -0.011213607, -0.0010511605, -0.00097063923); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.020268647, 0.14825523, 0.007372486, -0.045210518, 0.0061434456, 0.23509921, 0.06850672, 0.14130206, -0.04479972, -0.34290636, -0.029150475, 0.011045418, 0.08095481, 0.17917089, -0.12147151, -0.07294466) * inp_0_0_0; + result0 += M4(0.05458638, -0.048679367, 0.022237385, -0.14177488, -0.03144672, -0.04454854, 0.019220626, 0.013696505, 0.075617835, 0.12123587, -0.045615565, 0.11063499, -0.028505491, 
0.09205069, 0.07092868, 0.08160769) * inp_0_1_0; + result0 += M4(-0.07180649, -0.026103359, -0.027361687, 0.15016098, -0.050517555, 0.04939807, -0.034428593, 0.09034812, -0.031054338, 0.04080863, 0.060605668, -0.14733653, 0.06970039, -0.074839495, 0.031730924, -0.01834558) * inp_0_2_0; + result0 += M4(0.020511141, 0.19019808, 0.011577099, -0.018903792, 0.1428631, 0.20722544, 0.034837175, -0.05836752, -0.05286037, 0.008573406, -0.01266339, 0.023769394, -0.08835682, 0.21767567, 0.09204842, -0.014379353) * inp_0_0_1; + result0 += M4(-0.074524745, -0.27822876, 0.013350811, 0.03883656, 0.034003742, -0.12169725, -0.001302453, -0.15816908, 0.08625305, -0.04697309, 0.048174124, -0.014137186, -0.059876204, 0.22270301, -0.013324488, 0.2222257) * inp_0_1_1; + result0 += M4(0.026421938, 0.07146637, -0.014214964, 0.004115642, 0.097909145, 0.070237145, -0.105134584, -0.09889645, -0.04722841, 0.034669243, 0.0005260954, -0.008091203, -0.24982406, -0.07029222, 0.17892233, -0.08811164) * inp_0_2_1; + result0 += M4(-0.04663377, -0.27243048, 0.0391867, 0.11637642, -0.05228384, -0.5024352, 0.16150029, 0.020510964, 0.036365733, 0.39841992, -0.057961017, -0.07950254, -0.01859421, 0.20775238, -0.036983132, -0.13551942) * inp_0_0_2; + result0 += M4(0.011411134, 0.22569728, -0.0152920475, -0.022221385, -0.1562097, 0.05529353, -0.09342427, 0.053615596, -0.082741335, -0.16765948, 0.03603018, -0.005320681, 0.043266498, 0.083909445, 0.12812527, 0.030047817) * inp_0_1_2; + result0 += M4(0.078962885, -0.0071162875, -0.04424544, -0.07724012, -0.053223457, 0.009493869, 0.123284, 0.026991306, 0.049395826, -0.029972022, -0.059212867, 0.088321514, -0.009095844, -0.020606572, -0.015364895, -0.055298522) * inp_0_2_2; + result1 += M4(-0.06232669, -0.026769124, 0.021521335, -0.027186217, -0.054370288, -0.18382342, 0.03233994, 0.03575063, 0.03396374, 0.109278314, -0.08659539, 0.019022297, -0.16251917, 0.18142869, 0.006772278, 0.006308613) * inp_0_0_0; + result1 += M4(-0.06621316, 0.008242259, -0.02455648, 
0.041844133, 0.24871416, 0.19029002, 0.028239056, 0.038674828, -0.08053818, 0.009687939, -0.21889219, -0.0036235754, -0.07284282, 0.13503881, 0.0470514, -0.008415604) * inp_0_1_0; + result1 += M4(0.3297149, -0.027571684, 0.053300206, -0.05690302, 0.105289154, -0.10117306, 0.018809851, -0.024461899, -0.20733619, 0.031998433, 0.16168839, -0.0073598498, -0.18165122, 0.10275211, -0.16246904, 0.11249039) * inp_0_2_0; + result1 += M4(0.15595962, -0.116506785, -0.031276602, -0.01604919, -0.062258553, 0.066844955, -0.20105594, 0.07654626, 0.06442371, -0.063042715, 0.33330128, -0.05215178, 0.05460772, 0.17684814, 0.0145007055, 0.0033711654) * inp_0_0_1; + result1 += M4(-0.025682015, 0.22786757, 0.037356365, -0.22583298, -0.05409413, 0.09852505, 0.07245512, -0.06894147, -0.035620697, -0.047470212, -0.12066471, 0.19949281, -0.111082375, -0.0654596, 0.0113748815, -0.04759167) * inp_0_1_1; + result1 += M4(-0.35541508, -0.054041676, -0.10126022, 0.28670153, -0.38971886, 0.07401345, -0.278561, 0.30413467, 0.30421135, -0.07436365, 0.063763194, -0.1575792, -0.23363066, 0.019641457, -0.13043486, -0.3374282) * inp_0_2_1; + result1 += M4(-0.093819425, 0.14299177, -0.023607735, 0.015175345, -0.0017927431, 0.14492702, -0.034533955, -0.036500532, -0.035934616, -0.13721408, -0.087653875, -0.007531532, 0.017685894, 0.13622876, 0.061079826, -0.14280173) * inp_0_0_2; + result1 += M4(0.088514924, -0.26559612, 0.075079374, 0.18216874, 0.02842939, -0.14897862, 0.3180968, 0.17789103, -0.008417494, 0.09965723, -0.020617135, -0.1571512, -0.063983515, -0.015497844, -0.13906275, 0.18156528) * inp_0_1_2; + result1 += M4(0.055296432, 0.031179115, -0.032635134, -0.17856987, 0.1516071, -0.065819584, 0.0015008441, -0.37496942, -0.028610846, 0.09001752, 0.038358472, 0.12101329, 0.1332594, -0.055094093, 0.12954836, -0.12312948) * inp_0_2_2; + result2 += M4(0.04436205, 0.03272969, 0.082117066, -0.14897831, 0.02078067, 0.025371421, -0.030298583, 0.059800632, -0.17460795, -0.049655095, -0.09496556, 
0.23973551, 0.1732751, 0.05343574, 0.03247581, -0.13606766) * inp_0_0_0; + result2 += M4(-0.044836625, -0.084655724, -0.08816038, 0.20282699, -0.087223254, 0.018615223, 0.062091693, 0.12016283, 0.12447433, 0.017893136, -0.007466032, -0.12877573, -0.20169918, 0.07549086, 0.02625559, -0.014327254) * inp_0_1_0; + result2 += M4(0.000937708, -0.02372029, 0.020972041, -0.128782, 0.062136948, 0.17730762, 0.051112503, -0.23772344, -0.011192493, 0.020326655, 0.019522913, -0.030132089, 0.24831614, -0.05930657, 0.056801796, -0.041750364) * inp_0_2_0; + result2 += M4(0.15253678, 0.043978646, -0.089194424, -0.21455081, 0.052367248, 0.1811088, 0.017147724, -0.12380393, 0.09191318, -0.058358476, 0.06501043, 0.09066592, 0.0033466078, -0.009727251, 0.03180371, -0.055824853) * inp_0_0_1; + result2 += M4(-0.030182308, 0.13921423, 0.22085072, -0.044830274, 0.15198313, 0.026134778, 0.062357165, -0.236567, -0.22224993, -0.171287, -0.04902561, 0.039041862, -0.1989534, -0.03544617, 0.11422371, 0.28444847) * inp_0_1_1; + result2 += M4(-0.09683194, -0.06575642, -0.16387081, 0.24180213, -0.09752453, -0.08713728, -0.07650153, 0.07277323, 0.07279966, 0.08250263, 0.0554538, -0.05801922, 0.26159686, -0.041010123, 0.36876974, -0.0647169) * inp_0_2_1; + result2 += M4(-0.094095476, -0.11886874, 0.00802891, 0.3476756, -0.115224175, -0.37381357, -0.082234, 0.43452987, 0.08289792, 0.3091707, 0.033544444, -0.3748588, 0.22480658, 0.13475405, 0.009263132, -0.13467726) * inp_0_0_2; + result2 += M4(0.094794214, 0.026683906, -0.11798103, -0.06924625, -0.08918871, 0.17676891, -0.2580804, -0.026375275, 0.05834822, -0.14829479, 0.22193226, 0.08323461, -0.17417352, 0.06335608, 0.117469855, 0.066684686) * inp_0_1_2; + result2 += M4(-0.012913879, 0.08232436, 0.11017771, -0.1420779, 0.12082714, -0.11514996, 0.10867421, -0.0032127697, -0.06889167, -0.014451363, -0.19325945, 0.09126042, 0.03257303, 0.07660392, -0.009940959, -0.09966804) * inp_0_2_2; + result3 += M4(-0.03400627, -0.045000874, -0.0949746, 0.026569195, 
0.06374851, -0.17913724, -0.19537579, -0.03434123, -0.06285008, 0.15525737, 0.029252583, -0.07730218, 0.053348646, -0.028284214, 0.12554094, -0.03291163) * inp_0_0_0; + result3 += M4(-0.030196393, 0.0037547438, 0.115746655, 0.025105454, 0.07107014, 0.2682187, 0.05420887, 0.19181426, 0.17047271, -0.2724168, 0.04234023, -0.036664255, 0.054103628, -0.086841956, 0.09969301, 0.035592698) * inp_0_1_0; + result3 += M4(0.025260808, 0.10315893, 0.098687105, 0.16703038, -0.08844072, -0.16284281, 0.065202735, -0.07724701, -0.1090906, 0.038361132, -0.14185512, -0.13649403, -0.026836146, -0.16204, 0.045830395, 0.068950005) * inp_0_2_0; + result3 += M4(0.082908, 0.13440077, 0.077045225, 0.07258829, -0.12576218, 0.009103286, 0.14698924, -0.029685715, 0.006657362, -0.09412345, 0.016172243, -0.03407008, -0.023893334, 0.08817615, 0.010146429, -0.02195622) * inp_0_0_1; + result3 += M4(-0.088707946, -0.045973614, -0.24971655, -0.09218938, 0.08437918, 0.1120485, -0.02448813, -0.02257737, -0.13258657, 0.102566965, 0.018650232, 0.071094155, -0.11432819, -0.025290389, -0.08326027, -0.060312666) * inp_0_1_1; + result3 += M4(0.03387024, -0.10360934, -0.028582208, -0.07575261, -0.017623954, -0.11637099, -0.05440311, 0.0050957855, 0.031124162, 0.03894565, 0.10123033, -0.026114851, -0.20205021, 0.07022736, -0.18413247, 0.0194989) * inp_0_2_1; + result3 += M4(-0.108792946, -0.0476312, 0.023044622, -0.24801922, 0.09023104, -0.03946855, -0.0955286, -0.30579472, 0.07547969, -0.028301805, 0.01026302, 0.15100634, -0.06813315, -0.022987626, 0.1409446, 0.093881756) * inp_0_0_2; + result3 += M4(0.19563086, 0.073493905, 0.07173341, 0.122236766, 0.37825328, 0.06642939, 0.026379375, 0.16976514, -0.15878633, 0.008712973, -0.051333435, 0.04743582, -0.044011317, 0.026162548, -0.004637235, -0.07723268) * inp_0_1_2; + result3 += M4(-0.074678436, -0.04435617, -0.008446457, 0.009106448, -0.3312373, 0.020591788, 0.04238421, 0.058908988, 0.14680266, 0.043868694, 0.0080179935, 0.0635707, 0.22655982, 0.061260827, 
0.071055666, 0.04536601) * inp_0_2_2; + result4 += M4(0.0229897, 0.02600789, 0.04318227, 0.056938473, -0.013260426, 0.049922977, 0.107270665, -0.11426942, 0.008280311, -0.11023846, -0.15509868, -0.05803795, -0.15925965, 0.22990064, 0.14649814, 0.0013334672) * inp_0_0_0; + result4 += M4(-0.0022188416, 0.028027121, -0.04351062, -0.03842035, 0.17062525, -0.28407684, -0.43236062, 0.05971821, -0.23882908, 0.19171847, 0.25826785, -0.067961186, 0.14045641, -0.07047913, 0.12744413, 0.106645554) * inp_0_1_0; + result4 += M4(0.14434227, -0.15819654, -0.0059702517, -0.016392978, -0.024154976, 0.1443129, -0.07554423, -0.06573592, 0.012800963, 0.07304977, -6.6139386e-05, 0.11498108, 0.02571318, 0.12532328, 0.016042177, 0.3123708) * inp_0_2_0; + result4 += M4(0.18629986, 0.036145207, -0.108486876, -0.136735, -0.19689055, 0.055105306, 0.09007838, -0.016723143, -0.1460224, -0.019618722, 0.0543125, 0.07821289, 0.06944181, -0.09431772, -0.10837417, 0.007129244) * inp_0_0_1; + result4 += M4(-0.071403734, -0.018617045, 0.22160384, 0.1664269, 0.22846742, -0.10504693, 0.1437707, 0.074150465, -0.005945418, -0.052323215, -0.18881448, -0.03688276, -0.117976084, 0.15536022, -0.03742899, 0.20489633) * inp_0_1_1; + result4 += M4(-0.090433575, 0.078805365, -0.03887117, 0.021071453, -0.15162127, 0.05586981, 0.106780864, -0.016416641, 0.13776517, -0.07841334, -0.01674541, -0.07283049, -0.0008834937, -0.03916034, -0.16555677, 0.4699897) * inp_0_2_1; + result4 += M4(-0.25001028, -0.029027645, 0.09952708, 0.101661116, -0.2679267, 0.095195495, 0.09379947, 0.1216375, 0.29544395, 0.027807252, -0.101648994, -0.046678584, 0.09552274, -0.052846547, 0.039143153, -0.0690439) * inp_0_0_2; + result4 += M4(0.22638567, 0.016796492, -0.13556087, -0.19024307, 0.412845, -0.017504351, 0.10858891, -0.053032245, -0.19192916, -0.03050747, 0.013893807, 0.11865209, -0.116778165, 0.02883949, -0.09647645, 0.050611652) * inp_0_1_2; + result4 += M4(-0.16161689, 0.015135912, -0.033341687, 0.038444266, -0.1922627, 
-0.053408332, -0.16698006, -0.0020355517, 0.14271554, 0.020662053, 0.14828636, -0.034547646, 0.14668879, -0.090679035, 0.007595928, 0.18698914) * inp_0_2_2; + result5 += M4(-0.0038233844, -0.038643777, 0.117101975, -0.059352893, -0.012787684, 0.24478847, 0.043947425, 0.07901965, 0.0504098, -0.10846988, 0.032506287, 0.004304464, 0.045535903, -0.041623328, -0.09968747, -0.021789601) * inp_0_0_0; + result5 += M4(-0.04190915, -0.19893633, 0.055619072, -0.0012225655, -0.12322451, -0.47732323, -0.029736735, 0.09959535, 0.12064738, 0.46465406, -0.016973807, -0.13848215, -0.16638878, 0.10477461, 0.031585794, -0.10217614) * inp_0_1_0; + result5 += M4(0.045396797, 0.16388787, -0.16659987, 0.03792452, 0.15256222, 0.3771389, -0.16345283, 0.032161742, -0.15623413, -0.36288205, 0.064247295, 0.08032743, 0.03550602, 0.04714798, 0.030401254, -0.027422825) * inp_0_2_0; + result5 += M4(0.034030367, -0.009880312, -0.0606243, 0.0031811611, -0.053606708, -0.3738472, -0.24991377, 0.034458816, 0.08033743, 0.15036906, 0.21669243, 0.039792303, -0.013246069, 0.05664165, -0.111542955, -0.0656939) * inp_0_0_1; + result5 += M4(-0.08368354, 0.25769064, 0.17398253, -0.0627979, 0.07862928, -0.042130668, 0.33294833, 0.058403995, -0.11751697, -0.12091897, -0.27666116, 0.044058878, -0.02899958, 0.08770914, -0.114922404, -0.03758022) * inp_0_1_1; + result5 += M4(0.14295524, -0.25768724, -0.10228744, -0.09517184, 0.00926862, -0.3636604, -0.15237527, -0.046143975, -0.056292277, 0.35790715, 0.10204301, 0.07962385, -0.13975208, -0.063685015, 0.1364752, -0.09239288) * inp_0_2_1; + result5 += M4(-0.020055655, -0.11828783, -0.065835916, 0.02850138, 0.06953426, 0.49303243, 0.42563468, -0.04613442, -0.09335638, -0.29731086, -0.19983943, -0.04392246, 0.0021257664, -0.02911612, -0.15023233, -0.018344644) * inp_0_0_2; + result5 += M4(0.09818633, -0.18110804, -0.18017022, 0.069634296, 0.16736735, -0.36072952, -0.47928768, -0.292124, -0.107961655, 0.37833214, 0.2901414, 0.06649407, -0.13551697, 0.078865446, 
0.058791302, 0.041213896) * inp_0_1_2; + result5 += M4(-0.18019322, 0.33037, 0.20374258, 0.08476501, -0.25367123, 0.77855486, 0.21106005, 0.013510977, 0.26010516, -0.5287344, -0.19865678, -0.13735598, 0.0902484, 0.027938409, 0.12040936, -0.03467567) * inp_0_2_2; + result6 += M4(-0.20870009, -0.095222, -0.033454984, -0.065400735, 0.19313292, 0.0778578, 0.002091675, -0.39748082, 0.0069972547, -0.00045686567, -0.06270034, -0.115122885, 0.010889092, 0.093473785, 0.09048789, 0.050676074) * inp_0_0_0; + result6 += M4(0.035944436, -0.00023661536, 0.036038686, -0.09033171, -0.18661729, -0.13165267, -0.020340957, 0.03470277, 0.13611473, 0.077908404, 0.015176395, 0.38270426, -0.056219827, -0.009706887, -0.014937278, -0.06941049) * inp_0_1_0; + result6 += M4(0.061547503, 0.028232034, 0.015545255, 0.13273421, 0.23441736, -0.10307353, 0.1523606, 0.0034006871, -0.11043485, 0.0070839, 0.051696766, -0.119535744, 0.033249278, -0.030094182, -0.030192496, 0.22019497) * inp_0_2_0; + result6 += M4(0.30155244, 0.10360127, -0.04568099, 0.015849667, 0.08678474, 0.049520385, 0.01668733, 0.12139963, -0.28237268, -0.0009562847, 0.070742935, 0.2980231, 0.003981847, -0.030517148, 0.0048703533, 0.013675119) * inp_0_0_1; + result6 += M4(-0.02006746, 0.16300954, -0.017004231, 0.023949746, -0.08723611, 0.17485526, -0.048874076, 0.07336817, 0.012077663, -0.1714553, 0.048649255, -0.22175668, 0.036483366, -0.060560513, 0.13527189, -0.012682368) * inp_0_1_1; + result6 += M4(0.10679554, -0.20853277, 0.056777637, -0.010504056, 0.07880457, -0.043011382, 0.024917016, 0.29063034, 0.007874969, 0.13584907, -0.07431608, -0.10681921, -0.122501686, 0.13690814, -0.081902854, -0.022833277) * inp_0_2_1; + result6 += M4(-0.25533035, -0.019635295, 0.068325914, 0.22342893, -0.16536735, 0.07877552, -0.06696354, 0.04288555, 0.30344808, -0.06477599, 0.019130379, -0.38249543, -0.022517884, 0.049166884, -0.034824107, 0.3166459) * inp_0_0_2; + result6 += M4(0.008439721, -0.11620232, -0.0069008577, -0.037752226, 
-0.16271615, -0.3832438, 0.0734745, -0.032145612, 0.022684911, 0.13126016, -0.09333663, 0.11692364, 0.04440292, -0.08241177, -0.012808084, -0.06410111) * inp_0_1_2; + result6 += M4(-0.037885435, 0.13372825, -0.082009785, -0.17489593, -0.18538077, 0.23994179, -0.100767754, -0.012191402, -0.05329288, -0.11883949, 0.03176475, 0.09746631, 0.057389986, -0.052946683, 0.003021464, -0.251393) * inp_0_2_2; + result7 += M4(-0.05867251, 0.25848675, -0.1612531, -0.08174625, -0.021039482, 0.4373792, 0.060481038, -0.031800665, -0.007747895, -0.36429894, 0.14456034, 0.18798897, -0.048320886, -0.06578663, -0.08032537, 0.056976337) * inp_0_0_0; + result7 += M4(0.018457683, -0.19182694, -0.03582228, 0.15457691, -0.06334163, -0.13673481, 0.10631329, 0.05914127, 0.13031517, 0.15806162, 0.17825839, -0.10722788, 0.16217902, 0.033583954, -0.12307302, -0.03471117) * inp_0_1_0; + result7 += M4(-0.0049308287, -0.1278006, 0.17576715, 0.00090446474, -0.02590912, -0.22393094, 0.32716277, 0.064345494, -0.057403553, 0.068951264, -0.34291607, -0.03876382, -0.1171293, 0.085463725, 0.020035058, -0.06453559) * inp_0_2_0; + result7 += M4(-0.023636397, -0.33568785, -0.0004893112, 0.13354896, -0.0019806025, -0.36691913, -0.3346849, 0.22677845, -0.0026762953, 0.58283377, -0.0128265405, -0.2886498, -0.09229235, 0.06482395, -0.12154484, 0.20681357) * inp_0_0_1; + result7 += M4(-0.03378907, -0.063677326, 0.005017251, -0.10975505, 0.063447826, 0.13067761, 0.012144856, -0.12877822, -0.13016011, -0.1723573, -0.03400687, 0.07360175, -0.09057396, 0.020246202, 0.06956209, -0.028035002) * inp_0_1_1; + result7 += M4(0.1145418, 0.28175843, -0.18074696, -0.10356304, 0.049322665, 0.21088168, 0.08970878, -0.16297705, -0.062385745, -0.19887838, 0.06635873, 0.12842949, -0.12965013, -0.13581395, 0.091474965, 0.17882681) * inp_0_2_1; + result7 += M4(0.03414605, 0.05431703, 0.09918046, 0.09376892, -0.20312515, 0.33837643, -0.1967059, 0.02985413, 0.10720804, -0.36743656, -0.10219911, 0.07127951, 0.18000656, 0.08950406, 
0.05820729, 0.29237443) * inp_0_0_2; + result7 += M4(0.09274097, 0.3050205, 0.09827579, -0.12308496, 0.41528732, 0.06950069, -0.13905844, -0.24611962, -0.13515018, -0.06351798, 0.07261992, 0.10880329, 0.07941072, -0.22679578, -0.08862112, 0.11709439) * inp_0_1_2; + result7 += M4(-0.13006866, -0.1612075, 0.015155341, 0.051324762, -0.17869024, -0.2783368, 0.1851676, 0.17934461, 0.15468724, 0.30552292, -0.020170752, -0.111704215, 0.23055096, 0.09930267, -0.16835861, -0.007239737) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.08056164, 0.024221394, 0.01469956, -0.0018052512, 0.032743286, 0.19394612, 0.02556068, -0.005149667, 0.11348067, 0.33189735, 0.08544284, 0.03634659, -0.029906813, -0.11994978, -0.052395586, 7.1166514e-06) * inp_1_0_0; + result0 += M4(-0.047035396, 0.06665783, 0.013006395, 0.06069598, -0.10577905, -0.080583654, -0.060090564, 0.097482756, -0.07978745, -0.042081367, 0.10970377, 0.06696193, -0.043079987, -0.11010037, 0.089139275, 0.05448903) * inp_1_1_0; + result0 += M4(-0.0024540473, -0.0784394, -0.06775936, -0.0139979655, 0.082527906, -0.058007278, 0.005939752, -0.015822219, -0.053953923, 0.039333954, 0.022269873, -0.01603982, -0.023703689, -0.0076323156, 0.08039281, -0.04987313) * inp_1_2_0; + result0 += M4(-0.0384695, 0.46037552, -0.04974805, -0.030770607, 0.123112746, -0.43623227, 0.07064719, 0.032745123, 0.108739614, -0.026427317, -0.12740321, 0.08232159, -0.07402766, 0.07857299, -0.0047419285, 
0.03221524) * inp_1_0_1; + result0 += M4(0.111686476, -0.26939228, -0.01332168, -0.14614257, -0.08132169, 0.22978422, -0.120018594, -0.036263626, -0.10410683, 0.14793888, -0.06916599, -0.13419534, -0.09913267, 0.2571546, -0.009713434, 0.16305831) * inp_1_1_1; + result0 += M4(-0.034815054, -0.058604963, 0.01788539, -0.020877058, -0.0026703759, 0.016175224, 0.11238556, -0.016412891, 0.0396129, -0.10579109, -0.028854193, -0.09521144, 0.045456354, -0.12565531, -0.044188254, 0.012353671) * inp_1_2_1; + result0 += M4(0.0554219, -0.3841396, 0.07359661, -0.006964435, -0.09853514, 0.20009996, -0.13575329, -0.05170514, 0.28403568, -0.31017357, 0.12442697, 0.034799702, 0.20441908, -0.01245577, -0.037548214, 0.0032466718) * inp_1_0_2; + result0 += M4(-0.13931926, 0.20444494, -0.05902571, 0.10644682, 0.17043424, -0.03851538, 0.13023897, -0.071787, -0.1250542, -0.01450753, -0.14225888, -0.017005814, 0.12584496, 0.011672021, -0.028076801, -0.1728474) * inp_1_1_2; + result0 += M4(-0.0027912275, 0.039617404, 0.07478198, 0.039330017, -0.13748494, -0.032679155, -0.05495757, 0.061556093, -0.26208976, -0.05195373, 0.11226525, 0.048988525, -0.12599872, 0.011813674, 0.023555873, -0.015039726) * inp_1_2_2; + result1 += M4(0.025044475, 0.030789735, -0.03794999, 0.08355566, -0.037364226, -0.008631991, 0.047075126, 0.006358587, -0.016443051, -0.010585548, 0.05896397, -0.03327511, -0.012239931, 0.00022359488, 0.02688734, -0.037074383) * inp_1_0_0; + result1 += M4(-0.15739962, 0.016209977, -0.11209033, -0.018605288, -0.12759252, 0.0726407, 0.012900522, 0.08673423, -0.04963404, -0.0518699, 0.102750875, 0.12054366, 0.2524198, 0.19522701, 0.2270189, 0.05231933) * inp_1_1_0; + result1 += M4(0.065714635, -0.03201214, -0.0171613, -0.07176564, 0.08428725, -0.07058684, -0.08709468, -0.07990058, -0.11686441, -0.09357895, -0.046912536, -0.023992062, -0.346282, 0.018036636, 0.03106855, 0.004082807) * inp_1_2_0; + result1 += M4(-0.005530766, -0.030518299, -0.07603567, 0.03752808, -0.03442721, 
0.0029709316, 0.016444348, 0.07020296, -0.2016699, 0.21103077, -0.21100645, 0.119907945, 0.07548786, -0.103522554, 0.16498852, -0.012907791) * inp_1_0_1; + result1 += M4(-0.13843097, -0.061295003, 0.08772917, 0.0026598852, 0.119397156, -0.10213916, -0.035292555, -0.010960033, -0.01906532, -0.065163784, 0.027820924, -0.19135024, -0.09620281, 0.021738928, -0.28489172, -0.23192978) * inp_1_1_1; + result1 += M4(0.10790299, 0.027455572, 0.124303855, 0.011661894, 0.015253414, 0.054605566, 0.07886824, -0.019315444, 0.24176191, 0.034416646, 0.15283495, -0.33742723, 0.0823504, -0.14790276, 0.010342285, -0.22003831) * inp_1_2_1; + result1 += M4(-0.008874464, 0.12386641, -0.038760047, -0.016628882, -0.023460234, 0.018141951, 0.01832356, -0.05300698, 0.027816936, -0.029332621, -0.03777799, -0.002010302, -0.04299754, -0.096677415, -0.046877865, -0.019539319) * inp_1_0_2; + result1 += M4(0.17264172, -0.010743867, 0.11931309, 0.051326703, -0.009686467, -0.0062824595, -0.061936192, 0.12647447, 0.20229132, 0.21170805, 0.0062494637, 0.17988499, 0.0199236, 0.12213678, -0.21522295, 0.33548972) * inp_1_1_2; + result1 += M4(-0.072410546, -0.016178316, -0.027966136, -0.08857723, -0.005089261, 0.045857616, 0.046204444, -0.16591106, -0.0718399, -0.16617773, 0.0019136791, 0.15967074, 0.09774043, -0.0921577, 0.054268777, 0.092463665) * inp_1_2_2; + result2 += M4(0.14622211, 0.033930864, -0.020485567, -0.1412074, 0.14930843, 0.029972134, 0.121572874, -0.13651608, 0.30585966, 0.021851046, 0.07745108, -0.30486628, -0.13050433, -0.08180961, -0.027708324, 0.1253036) * inp_1_0_0; + result2 += M4(-0.022820612, -0.047209058, -0.12912439, 0.27083746, -0.18040411, -0.07130721, -0.048366297, 0.23729746, -0.23206307, 0.017609343, 0.019341638, 0.23706292, -0.22414765, 0.045835372, 0.012590579, -0.19633743) * inp_1_1_0; + result2 += M4(-0.013300152, 0.05599519, 0.051164817, -0.10179973, 0.02498066, 0.08604088, 0.11978064, -0.12570824, 0.08215409, -0.012000469, 0.038303167, -0.062917545, -0.012392567, 
-0.08683338, -0.09427509, 0.092526846) * inp_1_2_0; + result2 += M4(-0.05845668, 0.22507024, 0.0018911348, -0.03416973, -0.109933645, -0.15901743, -0.13169557, 0.2489902, -0.33019328, 0.15455498, -0.11574075, 0.18240502, 0.15918145, 0.04729387, -0.0056689186, -0.14884417) * inp_1_0_1; + result2 += M4(-0.09453401, -0.028965047, 0.20463869, -0.20698904, 0.32099605, 0.23075835, -0.049196653, -0.038442433, 0.26262686, 0.021751644, 0.055904813, -0.24745686, 0.1149247, -0.03805222, -0.11372666, 0.34570286) * inp_1_1_1; + result2 += M4(0.0062108114, -0.16136009, -0.123568416, 0.16272284, -0.034562103, -0.17603487, -0.110900074, 0.031481136, 0.12558918, -0.011668643, 0.027736813, -0.07511172, 0.21581094, 0.120602116, 0.33665705, -0.23707451) * inp_1_2_1; + result2 += M4(-0.003585816, -0.25195944, -0.056518134, 0.14234741, -0.06723524, 0.13331363, -0.07638646, -0.029029816, -0.006666353, -0.36124042, -0.06354365, 0.43837893, -0.11160402, 0.072009884, -0.06312557, 0.1011857) * inp_1_0_2; + result2 += M4(-0.03955385, 0.1990065, -0.018960109, 0.0051917713, -0.06469263, -0.123042256, 0.032065373, -0.17905955, -0.23264244, 0.10426899, -0.14723136, -0.15927729, -0.095671035, -0.26988465, 0.02837742, -0.013923805) * inp_1_1_2; + result2 += M4(0.112933464, -0.043436788, 0.091250494, -0.13463621, -0.031227566, -0.0042501013, 0.17211096, -0.061046902, 0.08391018, -0.0077616447, 0.07812146, -0.009916928, 0.07397046, 0.14718248, -0.04669793, 0.041616086) * inp_1_2_2; + result3 += M4(-0.012139267, -0.046823397, 0.055270605, -0.062974416, 0.011565813, -0.18060294, -0.0098689515, -0.22953819, 0.024000261, -0.23664816, 0.029873438, 0.00925146, 0.13210218, 0.10714866, 0.041282352, 0.054962005) * inp_1_0_0; + result3 += M4(-0.00425852, 0.022288367, -0.00839515, -0.024816163, -0.05498923, 0.14509243, 0.005224275, 0.026971063, -0.12811832, 0.30412883, -0.22113481, -0.12445393, 0.044661216, 0.19499756, -0.16970544, 0.09098386) * inp_1_1_0; + result3 += M4(-0.049442146, -0.02676701, 
0.0037601877, -0.19303954, -0.06461184, 0.03424987, 0.033616573, -0.058749903, -0.0767509, -0.02933055, -0.11261291, 0.029727368, -0.047365442, -0.14790945, -0.04035033, -0.030160617) * inp_1_2_0; + result3 += M4(0.0010656733, -0.02668284, 0.19471397, -0.077152856, -0.1119675, 0.16642164, -0.3056485, 0.09701516, -0.032464765, -0.1422366, 0.19361593, -0.022385882, 0.10217149, -0.017202012, 0.26548624, 0.24587213) * inp_1_0_1; + result3 += M4(-0.10229535, -0.048520923, -0.25836796, -0.18611394, 0.20844075, -0.21864392, 0.18385902, -0.012027308, 0.298919, 0.09894794, 0.21712577, -0.16338934, 0.067203484, -0.12321382, 0.42670172, 0.18046945) * inp_1_1_1; + result3 += M4(0.09465788, 0.026927982, 0.0634101, 0.094085574, 0.028902758, 0.026592772, -0.0062900553, -0.069339275, -0.16002378, -0.0043187323, 0.19384632, 0.35121834, -0.46105996, 0.061926972, -0.031174311, 0.16591823) * inp_1_2_1; + result3 += M4(0.021849016, 0.024172232, 0.027865706, -0.024844088, 0.11537251, -0.0017808388, 0.3383794, 0.095728055, -0.03370364, 0.042807557, 0.054379217, 0.016522884, -0.14881603, 0.024019856, -0.14619574, 0.13468431) * inp_1_0_2; + result3 += M4(0.26974118, -0.03020653, 0.0467989, 0.09997283, -0.225319, 0.03123994, -0.18730874, -0.06313059, 0.28838465, -0.021311061, -0.032295976, -0.5687233, -0.19154316, -0.023533309, -0.23153263, -0.6694247) * inp_1_1_2; + result3 += M4(-0.20564198, 0.08846197, -0.08741238, 0.38190806, 0.097369835, -0.020990869, -0.04059183, 0.23045994, -0.08535688, 0.021872237, -0.3087969, 0.44408107, 0.5135046, 0.00416095, -0.1617329, -0.2927917) * inp_1_2_2; + result4 += M4(-0.092348225, -4.899312e-05, 0.03408428, 0.023627887, -0.09361741, 0.16219872, 0.1223944, -0.111906864, -0.10880166, 0.07419288, 0.11647858, -0.037658542, 0.002272355, -0.24778526, -0.13656938, 0.00033563402) * inp_1_0_0; + result4 += M4(-0.11030891, 0.16916846, 0.039946288, 0.03924557, 0.13571824, -0.022200687, -0.051298134, 0.22357553, 0.17479928, -0.12342663, -0.3123425, 0.15854663, 
0.101564355, -0.13469937, -0.01255922, 0.0003415467) * inp_1_1_0; + result4 += M4(-0.039500963, -0.13591114, -0.015334244, -0.03921458, -0.18489632, -0.01989155, -0.038351458, -0.046835713, 0.03292734, -0.018222192, 0.028025731, -0.12396908, 0.12390516, 0.25767827, 0.040885437, 0.01972028) * inp_1_2_0; + result4 += M4(0.083130196, 0.06320318, -0.0065529994, -0.05116796, -0.036242407, -0.10908108, -0.07056251, 0.071343794, 0.006586246, 0.010524152, -0.097992346, 0.034147367, 0.3068846, 0.08153612, -0.05943433, -0.06644572) * inp_1_0_1; + result4 += M4(-0.015684007, -0.2458967, -0.02259713, 0.12468715, -0.15357973, -0.021078438, -0.044963464, -0.21710123, -0.110970125, -0.035599485, 0.008899505, -0.102642685, -0.12679641, 0.20587976, -0.1199974, -0.019224681) * inp_1_1_1; + result4 += M4(-0.034645144, 0.09334104, 0.012576891, -0.057651788, 0.1513382, 0.020500252, 0.11296834, 0.10840535, 0.13800332, 0.021486238, 0.08097467, 0.064888544, 0.01159645, -0.049670298, -0.03630892, 0.23323674) * inp_1_2_1; + result4 += M4(-0.16977705, 0.0045283246, 0.007889421, 0.040079966, 0.13847128, 0.0013577606, -0.042398177, 0.0013113774, -0.2161196, 0.13272226, 0.01906356, -0.011640492, -0.061170332, 0.00032892992, -0.009517682, 0.06042073) * inp_1_0_2; + result4 += M4(0.22956204, 0.07805039, 0.05952152, -0.15416096, -0.079069436, -0.042201176, 0.07723746, 0.03249371, 0.022645092, -0.073189326, 0.19537999, -0.06800382, -0.48296648, -0.091830455, -0.072290905, -0.09205237) * inp_1_1_2; + result4 += M4(0.15360396, -0.034861278, -0.09555026, 0.069429584, 0.15559883, 0.036359265, -0.041642964, -0.06434541, 0.09091873, -0.037409402, -0.0210764, 0.06874098, 0.063656576, -0.018393736, 0.37723267, -0.1220581) * inp_1_2_2; + result5 += M4(0.009315057, -0.039793894, -0.039893407, 0.0025300442, 0.04252286, 0.018308887, -0.053301472, -0.15878326, -0.019864243, 0.113979325, -0.07052441, 0.012375545, -0.072993726, 0.11117269, -0.015672868, 0.19543935) * inp_1_0_0; + result5 += M4(0.10393496, 
0.04860575, -0.036490183, 0.009639758, -0.036475956, -0.11311589, -0.09545132, 0.1937704, -0.20127577, -0.3004165, 0.01927337, 0.09949358, 0.011086824, 0.07412309, -0.11477256, 0.00016277973) * inp_1_1_0; + result5 += M4(-0.15286039, 0.024039598, 0.060999203, 0.0032689837, -0.10542675, 0.049775787, 0.10901487, 0.023451982, 0.003536342, 0.08355868, 0.026118478, 0.038982097, 0.07624663, -0.19437374, 0.10103605, -0.20783526) * inp_1_2_0; + result5 += M4(0.046537817, -0.067554325, -0.104323365, 0.019169385, -0.09484351, -0.112971164, 0.002150195, 0.1475723, -0.13917124, -0.3035873, -0.3067636, 0.00963338, 0.14426696, -0.23026484, -0.02267922, -0.2867485) * inp_1_0_1; + result5 += M4(-0.22787493, 0.08626521, 0.037516505, 0.052527238, 0.062326893, 0.03717344, -0.036514126, -0.13794681, 0.17301907, 0.018499771, 0.10670954, 0.09111631, 0.07034519, 0.16229908, -0.06396752, 0.020276068) * inp_1_1_1; + result5 += M4(0.20937552, -0.112115905, 0.07686836, 0.048358228, 0.041537207, 0.042966317, 0.05794905, 0.08860813, 0.0010343207, -0.16032727, 0.16665968, 0.06552188, -0.2985938, 0.26402467, -0.04158525, 0.17088705) * inp_1_2_1; + result5 += M4(0.0025579182, 0.024243172, 0.10205318, -0.04828209, 0.0150477905, 0.161029, -0.120338276, -0.06609394, 0.08371926, 0.74200994, 0.30742526, 0.008071951, -0.022323387, 0.39530528, 0.0062952586, 0.3320767) * inp_1_0_2; + result5 += M4(0.11514749, -0.119992435, -0.19644433, -0.076094754, -0.005266124, -0.015505989, 0.108957216, -0.013609759, 0.0806063, -0.6925446, -0.17420325, -0.16026042, -0.096812725, -0.17777766, 0.33779812, 0.05635807) * inp_1_1_2; + result5 += M4(-0.088664286, 0.19366497, 0.10373365, -0.046089854, 0.08397202, -0.081216104, 0.04968403, -0.07730271, 0.0080527365, 0.637737, -0.10831294, -0.25297433, 0.20753402, -0.45137322, -0.178694, -0.23293279) * inp_1_2_2; + result6 += M4(0.08850388, -0.0207107, 0.04370057, 0.36592868, -0.001342386, 0.08674775, -0.063615225, 0.09765095, 0.36543256, 0.07968661, -0.020770753, 0.874285, 
0.3238145, -0.016411122, -0.07228315, 0.024823766) * inp_1_0_0; + result6 += M4(0.088917665, 0.029564336, 0.024139253, 0.0076451465, -0.0016998065, -0.12345348, 0.18237911, -0.062208608, -0.1746227, -0.110413626, 0.07799642, -0.3398364, 0.019212412, 0.056892037, -0.0986248, 0.07186395) * inp_1_1_0; + result6 += M4(-0.21642865, 0.041386344, -0.06339776, -0.032001905, 0.19339882, 0.03231188, -0.10204557, -0.13758013, -0.14904295, -0.01914844, -0.122796305, -0.2899267, -0.016563937, -0.04511764, 0.07832353, 0.04315966) * inp_1_2_0; + result6 += M4(0.116379075, 0.0008428704, -0.024717761, -0.20803684, -0.17048179, -0.13372083, 0.043566026, -0.046027888, -0.009384611, -0.07614973, 0.06241372, -0.6883269, -0.41987732, 0.15585467, 0.006527491, -0.08820382) * inp_1_0_1; + result6 += M4(-0.09509065, 0.03147108, -0.06814291, -0.053576887, -0.031626772, 0.12722825, -0.11581037, 0.17612085, 0.10111232, 0.0444588, -0.18220901, -0.053302433, 0.018732227, -0.14842227, 0.080189824, -0.04557651) * inp_1_1_1; + result6 += M4(0.27167615, 0.026115578, 0.056058075, -0.21269938, -0.13086309, 0.061571274, 0.009969623, -0.20542078, -0.20713961, 0.14651333, 0.07305179, -0.041693557, -0.12575068, -0.004305788, -0.0960623, -0.065216325) * inp_1_2_1; + result6 += M4(-0.070646174, -0.061003357, -0.06869981, 0.094543554, 0.083361164, -0.006915605, 0.016996851, -0.05128535, 0.050152298, 0.14309838, -0.09049835, 0.657594, 0.25067973, -0.07734688, -0.0031592245, -0.10498131) * inp_1_0_2; + result6 += M4(-0.11258726, -0.09268773, 0.10271882, -0.21289156, 0.07725714, -0.024649115, -0.0081682205, -0.089328445, -0.023620116, -0.14418346, 0.046693396, -0.69523656, -0.014066392, 0.09000784, -0.07501272, -0.08271815) * inp_1_1_2; + result6 += M4(-0.12243556, 0.029113041, 0.020471686, 0.2813676, 0.010630583, -0.007916172, 0.02552108, 0.32475835, -0.11740228, -0.112512216, 0.16220617, 0.7037821, -0.053055238, 0.018653948, 0.12827374, 0.15126385) * inp_1_2_2; + result7 += M4(-0.068574496, 0.16661608, 
0.09277685, -0.10065855, -0.026894188, 0.24174578, -0.0015142026, 0.06333797, -0.03589406, 0.19774821, 0.22234689, -0.3098714, -0.030794185, -0.4666243, 0.119494334, 0.06997651) * inp_1_0_0; + result7 += M4(0.06763326, 0.04033184, 0.05536772, -0.057854787, 0.0012180824, -0.15242608, 0.06596476, -0.1705138, -0.12524039, -0.10267546, -0.25720495, -0.00084344787, 0.0015356123, 0.042152084, 0.12603982, -0.04137867) * inp_1_1_0; + result7 += M4(0.01939239, -0.0051865047, -0.02208035, 0.052681167, 0.032672696, 0.09629823, -0.017163428, 0.0006626341, 0.008928037, 0.40452057, 0.4547712, -0.11422701, -0.034344185, 0.089008346, 0.2120114, -0.107786134) * inp_1_2_0; + result7 += M4(0.12871139, -0.13950281, -0.065428756, 0.3491906, -0.11650786, -0.13134636, 0.13280089, -0.029576441, -0.0059103365, -0.5508263, -0.22791469, 0.6133408, 0.025263406, 0.051196218, -0.16464914, -0.08928937) * inp_1_0_1; + result7 += M4(-0.33673334, -0.26939452, 0.169822, -0.18601708, 0.13333264, -0.008554966, -0.16594854, 0.23139794, 0.11931796, -0.040443167, 0.01947117, -0.07756305, 0.3151091, 0.48643693, -0.1501797, 0.20290323) * inp_1_1_1; + result7 += M4(0.0037983016, 0.15611055, 0.031716086, -0.059497457, -0.083625734, 0.10151506, -0.036348563, -0.12573546, -0.04825114, -0.20393659, 0.12873755, 0.13184042, 0.016729718, -0.09499213, -0.016527524, -0.051121287) * inp_1_2_1; + result7 += M4(-0.16464926, -0.05180886, -0.13005428, 0.1214983, 0.21278372, -0.1711272, -0.060071763, -0.11382805, -0.2974423, 0.49421692, 0.061519757, -0.14829051, -0.009842123, 0.03393404, -0.17658482, -0.21789874) * inp_1_0_2; + result7 += M4(0.41086602, 0.17370336, -0.19637585, -0.0014512275, -0.21273008, 0.20512007, -0.032933477, -0.0783052, 0.16782628, 0.09549614, -0.21877618, 0.07099654, -0.6722047, -0.18026075, 0.20123404, 0.1915319) * inp_1_1_2; + result7 += M4(-0.05910126, -0.04967091, 0.07895229, -0.08397946, 0.05595711, -0.21496674, 0.11178259, 0.20505239, 0.22368243, -0.26222184, -0.045761608, -0.20781557, 
0.34694645, 0.033016797, -0.08783061, -0.026765328) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.04006396, -0.093271196, -0.0096289655, -0.11205657, -0.013179008, -0.4888647, 0.04780535, 0.016062947, 0.006696561, 0.41703635, -0.026678808, 0.21811746, -0.10373398, 0.22838922, -0.042051118, 0.062496066) * inp_2_0_0; + result0 += M4(0.029921327, -0.13498737, -0.21944141, 0.036896, -0.008876765, 0.10946289, 0.027396487, -0.020041306, -0.05376922, -0.07171024, 0.14145331, -0.12944715, -0.11785168, -0.05215759, 0.19542274, 0.045778714) * inp_2_1_0; + result0 += M4(0.010232067, 0.009027865, 0.06280113, -0.005551291, 0.061293773, -0.018812973, 0.07981425, -0.00823472, -0.097053416, -0.016432412, -0.00866586, 0.0040405495, -0.101947494, -0.10372762, -0.055717018, 0.18776363) * inp_2_2_0; + result0 += M4(0.084877305, 0.36530042, 0.04482282, -0.025205128, -0.052687638, -1.4062189, 0.2331636, 0.20114876, 0.17389625, -1.097782, 0.009419999, 0.05726068, 0.005323745, 0.34690902, -0.0043693217, -0.15299302) * inp_2_0_1; + result0 += M4(0.24011506, -0.2369298, 0.12749569, -0.09491782, -0.30143183, 0.50683093, -0.114192486, 0.22762431, -0.27143052, 0.5292441, -0.07288178, 0.15642613, -0.09021754, 0.17313053, -0.0075788074, 0.176452) * inp_2_1_1; + result0 += M4(0.009803549, -0.20905402, -0.02659497, -0.003000505, 0.007216942, -0.014926389, 0.2527909, -0.060462914, -0.034895502, -0.08333173, 0.024605725, -0.008002653, -0.06315284, 
0.067963235, 0.07755725, 0.059077345) * inp_2_2_1; + result0 += M4(0.075668044, -0.043190833, 0.0088273985, 0.05178253, -0.2121789, -0.19092418, -0.048636794, 0.07709776, -0.026524719, 0.25015098, -0.098095335, 0.07913606, 0.076073155, -0.011904691, -0.00997183, -0.1295254) * inp_2_0_2; + result0 += M4(-0.32758933, 0.0030028427, -0.015581309, -0.051850066, 0.20927404, 0.18228866, -0.023237212, 0.08565571, 0.33623222, -0.0012938008, 0.050019436, -0.2070059, 0.119549364, 0.09375155, 0.034198433, 0.0281211) * inp_2_1_2; + result0 += M4(0.025983714, -0.02273698, -0.00834317, 0.09938862, -0.06958064, 0.04463224, -0.011163134, -0.00744886, -0.09676307, 0.0104306955, 0.043315828, -0.13753454, 0.06448966, -0.024151303, -0.027766991, 0.041412592) * inp_2_2_2; + result1 += M4(-0.25290313, 0.19666754, -0.09577112, -0.037330758, -0.12433887, -0.10995768, -0.20430726, 0.0113121215, -0.13665694, -0.035303738, 0.09452789, 0.010197449, 0.068448514, -0.2187964, 0.12905982, 0.05560437) * inp_2_0_0; + result1 += M4(-0.87789756, 0.32822713, -0.54594296, 0.066028394, 0.08900635, -0.13787487, 0.2355097, 0.026656104, 0.051272012, 0.0007108152, 0.3357397, -0.041287974, 0.3000717, -0.11498494, 0.24920359, 0.116323985) * inp_2_1_0; + result1 += M4(-0.8281388, -0.05207503, -0.22037, 0.06782141, -0.368362, 0.02836894, -0.24745329, -0.12641783, 0.109644875, -0.056541838, -0.059078168, 0.052099805, 0.30368358, 0.08141452, -0.04582999, -0.058582276) * inp_2_2_0; + result1 += M4(0.049841173, -0.09109075, 0.055836778, -0.012549697, -0.048306625, 0.3592706, -0.08224678, -0.07649658, -0.1710119, 0.08557986, -0.10904593, -0.056076586, -0.028904108, 0.12440374, 0.012864014, 0.08310742) * inp_2_0_1; + result1 += M4(-0.035251543, -0.20624669, 0.06317375, 0.4335416, 0.3559351, -0.12239683, 0.060257185, 0.032789163, 0.29632062, -0.06737258, 0.019616304, -0.122070186, -0.107673295, -0.05875411, -0.08953578, -0.21576707) * inp_2_1_1; + result1 += M4(0.031954102, 0.042747285, -0.1693705, 0.49983233, 
-0.30091783, 0.033248916, -0.24386583, -0.75089025, 0.032218333, -0.021452343, 0.07603394, -0.38572457, -0.3042465, 0.047610722, -0.21036297, -0.51623404) * inp_2_2_1; + result1 += M4(0.010616683, 0.080342054, 0.015937759, -0.0072870483, -0.059890237, -0.053708665, -0.15250191, 0.06853063, -0.079073265, -0.029861968, 0.06857587, -0.08221009, -0.032185487, -0.015071679, 0.12374374, 0.14812705) * inp_2_0_2; + result1 += M4(-0.016411439, 0.08448781, 0.040359493, -0.08547065, 0.102580406, -0.043145485, -0.019781213, 0.09795827, 0.014702368, 0.046223257, -0.33862883, 0.35797995, -0.0065781316, 0.07393134, -0.067422196, 0.29117906) * inp_2_1_2; + result1 += M4(0.02807433, -0.01187277, 0.07435808, -0.20751515, 0.061271455, 0.05244012, -0.046069704, -0.46324798, -0.081953414, -0.034002166, -0.07702094, 0.24715763, 0.08846798, 0.07901789, 0.06372052, -0.2204595) * inp_2_2_2; + result2 += M4(0.079209946, 0.024314685, 0.06825805, -0.19656268, -0.18495592, -0.22297944, -0.027041707, -0.0039204457, 0.010487721, 0.026769398, 0.27211088, -0.044124667, 0.0708275, 0.13799185, -0.0909649, -0.16712058) * inp_2_0_0; + result2 += M4(0.04129076, -0.034979448, -0.016573476, -0.12149206, 0.06150161, -0.08209856, -0.1905845, 0.0974782, -0.064913124, -0.033978187, 0.042167306, -0.12530461, -0.21253434, -0.072775096, 0.0860898, 0.021017795) * inp_2_1_0; + result2 += M4(0.38701406, -0.036220368, 0.053439543, -0.43865678, 0.07939769, -0.08243855, 0.17258961, -0.22275402, 0.062249318, -0.0686973, 0.2565318, -0.0683011, -0.08728593, -0.0028681478, 0.061261933, 0.18323076) * inp_2_2_0; + result2 += M4(-0.039497472, -0.15987717, 0.09388128, -0.03861348, -0.44152698, -0.37033457, -0.21767667, 0.28547382, -0.26163006, -0.25115827, -0.30968404, 0.26306158, 0.03804344, 0.19295283, 0.12113197, -0.11471205) * inp_2_0_1; + result2 += M4(-0.30163613, -0.26301563, -0.034511514, -0.45088667, 0.30495808, 0.31131884, -0.31674165, 0.4868328, 0.49399623, 0.3275035, -0.36139163, 0.26530102, -0.10982368, 
0.21751544, 0.07969837, 0.29188502) * inp_2_1_1; + result2 += M4(0.23773795, -0.36192465, -0.05976584, -0.19862168, 0.36314234, -0.08991466, 0.35342932, -0.02457932, 0.10577849, 0.037139118, 0.1183281, 0.01917593, -0.09016436, 0.0890603, 0.36950955, -0.08724207) * inp_2_2_1; + result2 += M4(-0.07765637, -0.07627282, -0.011678986, 0.08661498, -0.2874765, -0.2616753, -0.08173318, 0.091032155, -0.03560941, -0.046116207, -0.033399954, 0.16050923, 0.2213573, 0.040242396, -0.1254936, -0.040743522) * inp_2_0_2; + result2 += M4(-0.011835813, 0.1610244, -0.060223717, 0.026901042, 0.027034983, -0.039814804, -0.2395877, 0.039017636, -0.06570181, -0.22634281, -0.013846767, -0.3682364, -0.06921134, 0.004998505, -0.055614, 0.1219175) * inp_2_1_2; + result2 += M4(0.26495653, 0.00018914929, -0.096524045, -0.070989974, 0.3021856, -0.1294938, 0.31535223, -0.16457504, -0.156344, 0.10761199, -0.0054053986, -0.0012636378, 0.103739135, 0.020149903, 0.24023418, 0.12121273) * inp_2_2_2; + result3 += M4(-0.031075776, -0.4635887, -0.47420534, -0.07199863, 0.07125954, -0.12359186, -0.491971, -0.008747496, -0.00752531, -0.33726844, 0.041804176, -0.027972763, -0.020819692, 0.12383843, 0.36148933, 0.07167745) * inp_2_0_0; + result3 += M4(0.037511352, -0.9477205, 0.17954215, 0.03551973, 0.1667754, 0.050922755, 0.019038, 0.021886162, -0.070391804, 0.49917763, -0.14287363, -0.12820308, 0.0030683058, 0.49931148, -0.10055244, 0.177764) * inp_2_1_0; + result3 += M4(-0.024921156, -0.4117021, 0.09828512, -0.06818989, -0.013338524, 0.06989925, -0.089514956, 0.02602123, 0.07610413, -0.059325233, -0.13381743, 0.06674027, -0.0043520755, 0.16602825, -0.02947413, 0.0313993) * inp_2_2_0; + result3 += M4(-0.04545174, 0.044156343, 0.20290965, 0.08909125, 0.014040267, -0.047601722, -0.75170505, -0.104715414, -0.039344367, 0.17603794, -0.35120603, 0.23853277, 0.053033274, -0.17841052, 0.1820609, -0.058806483) * inp_2_0_1; + result3 += M4(-0.40018386, 0.123856135, -0.16877863, -0.116433814, 0.39704683, 
-0.026472786, 0.1411099, 0.18997066, 0.5697698, -0.19037497, 0.42247203, 0.07268722, 0.020476446, -0.039052613, 0.07832102, 0.048717983) * inp_2_1_1; + result3 += M4(0.2724097, -0.06511224, -0.13722713, -0.00060539367, -0.20470375, 0.00876838, -0.050319098, 0.18581828, -0.18101513, 0.006082236, -0.02139074, 0.19804642, -0.31850263, -0.0954505, -0.30005115, 0.08748218) * inp_2_2_1; + result3 += M4(-0.0954268, 0.00050760794, -0.26310194, -0.012543817, -0.03426465, -0.03957793, -0.1720142, 0.17730446, 0.13332754, 0.004262412, 0.09753719, 0.16221963, 0.073697865, -0.050598513, 0.41145912, -0.10411897) * inp_2_0_2; + result3 += M4(0.3464752, -0.021848112, -0.10102162, 0.12555195, -0.36431295, -0.06230273, -0.055010866, 0.064280584, -0.71468693, -0.0010118448, 0.05051672, -0.60622525, 0.15103918, 0.14874057, -0.034544896, -0.23608753) * inp_2_1_2; + result3 += M4(-0.18470794, 0.0020429478, 0.092647046, 0.001578774, 0.07782735, -0.056376178, -0.04893872, 0.14143008, 0.2539951, 0.005463176, -0.07962956, -0.03562753, 0.23646769, -0.16915001, -0.11215036, -0.13418357) * inp_2_2_2; + result4 += M4(-0.4048387, 0.2746327, 0.29115272, 0.014415946, 0.027654655, 0.061988186, -0.05398835, 0.015199468, -0.022000216, 0.3168487, 0.2148722, 0.13543734, 0.1928623, -0.17625928, -0.084206864, -0.0791183) * inp_2_0_0; + result4 += M4(-0.6260922, 0.85466826, 0.77320504, 0.10223002, 0.2373547, -0.34480003, -0.06116979, 0.0547156, 0.30961192, -0.4166198, -0.32632014, 0.06924924, 0.36943367, -0.5072109, -0.481058, -0.031789046) * inp_2_1_0; + result4 += M4(-0.10124026, 0.3977555, 0.34342486, 0.25692475, -0.024685882, -0.015863132, -0.25324908, 0.07294063, 0.037476826, 0.027836466, 0.02573071, -0.15145361, 0.044554383, -0.038837407, -0.31043664, -0.21714881) * inp_2_2_0; + result4 += M4(0.046663757, 0.014939641, 0.06879724, -0.04942035, -0.045889072, -0.11144033, -0.19458978, 0.021895248, 0.03571556, -0.17301705, -0.24958733, -0.023675848, -0.037575014, 0.066391654, 0.13448313, -0.089484215) * 
inp_2_0_1; + result4 += M4(-0.048059803, -0.21505676, -0.118837744, -0.13431357, 0.04294499, 0.22801062, 0.17858784, -0.28958902, -0.2126441, 0.21744238, 0.059451975, -0.23975925, -0.0014333368, 0.088576786, 0.10778986, 0.31530976) * inp_2_1_1; + result4 += M4(0.049664397, -0.016129503, -0.11917058, -0.39864028, 0.14846401, 0.020106375, -0.18104424, 0.30159464, 0.00887667, 0.052817456, 0.014414665, 0.20041718, -0.112646736, 0.22074835, 0.023366554, 0.37090588) * inp_2_2_1; + result4 += M4(-0.037570477, 0.059925936, 0.0005708728, 0.04009829, -0.10829278, 0.062199626, 0.0501179, -0.014424939, 0.2726312, -0.028666759, 0.013104774, -0.026145717, -0.113269396, -0.021442631, 0.16822442, -0.062231436) * inp_2_0_2; + result4 += M4(0.23156382, 0.04554089, 0.09250202, -0.07079888, -0.15285629, 0.059867956, -0.0085961195, -0.05141432, -0.49627265, 0.04150607, 0.025709234, 0.016941035, -0.064730234, -0.08857849, -0.04150067, 0.022848075) * inp_2_1_2; + result4 += M4(-0.05030157, 0.057781357, -0.08614188, 0.06977365, 0.052806154, 0.087339506, -0.08356403, 0.07599338, 0.08267073, -0.022146773, 0.24039426, 0.019475978, -0.18833315, -0.005756401, 0.00854118, 0.009617167) * inp_2_2_2; + result5 += M4(0.06307451, 0.14723757, 0.0039552962, -0.46614376, 0.07030183, 0.2916851, 0.106686614, -0.14141798, 0.007910899, 0.06727706, -0.15440355, -0.10023372, -0.10300651, 0.026727919, -0.21182077, 0.23669715) * inp_2_0_0; + result5 += M4(0.13375978, 0.1353753, 0.08232549, -0.7362596, 0.11077691, 0.013017048, 0.043357693, -0.031101087, -0.13479967, -0.36879787, -0.08803066, 0.20864883, -0.10869737, -0.36136195, -0.15707602, 0.37448788) * inp_2_1_0; + result5 += M4(-0.095676385, 0.23106195, -0.02147711, -0.2541901, -0.08606613, 0.10505495, 0.11301647, 0.043804143, -0.006948173, -0.1263802, -0.04224032, -0.0042616166, -0.11794068, 0.22114182, 0.027413925, 0.14881836) * inp_2_2_0; + result5 += M4(0.011850981, -0.07968426, -0.1710306, 0.08712769, -0.10804343, 0.27625656, 0.46241727, 0.023772454, 
-0.08796408, 0.24824676, -0.06773852, -0.15036978, 0.05319369, -0.20618536, -0.1458318, -0.12122452) * inp_2_0_1; + result5 += M4(-0.23144136, 0.06455041, 0.01652961, -0.11405431, 0.5178468, 0.179509, 0.041685622, -0.15093309, 0.49060193, -0.15313472, 0.054447133, -0.087239854, -0.06193237, -0.009340936, 0.07510365, -0.020017758) * inp_2_1_1; + result5 += M4(0.18669872, 0.07155456, -0.11710658, 0.004780165, -0.45215398, -0.183132, 0.42877966, -0.043604154, -0.2451027, 0.04137121, 0.06478309, -0.07089735, -0.2714047, -0.061828386, 0.120099574, -0.18344322) * inp_2_2_1; + result5 += M4(0.035631984, 0.38638332, 0.05854191, -0.023932468, 0.010584838, 0.11353454, 0.3659448, -0.07387023, -0.0034249292, 0.9132789, -0.11330348, 0.02410176, -0.06093434, 0.0474977, -0.120164394, 0.1047797) * inp_2_0_2; + result5 += M4(-0.0998373, -0.024269396, 0.046595313, -0.17640395, 0.17191735, 0.06510432, -0.14431018, -0.10624873, -0.13430345, -0.47117662, 0.3615993, 0.2840675, -0.08423247, -0.14638855, -0.026378112, 0.06795413) * inp_2_1_2; + result5 += M4(0.035158098, 0.34198627, -0.007857903, -0.041475654, -0.1796877, 0.14854921, 0.22959937, -0.07888798, 0.14298303, -0.2011923, 0.023641603, -0.04346798, -0.12600255, 0.30773756, 0.14908876, 0.030534623) * inp_2_2_2; + result6 += M4(0.13131043, 0.15043007, 0.020211749, 0.4891068, 0.45132312, -0.010635054, 0.0011205637, -0.3122684, 0.050189145, 0.236809, 0.008488413, 0.32962832, -0.15746759, -0.19045612, 0.10334398, -0.3065638) * inp_2_0_0; + result6 += M4(-0.10746205, 0.184805, 0.019237475, 0.69931763, -0.26008403, 0.049077857, -0.13350248, -0.10074571, -0.12030742, -0.21424854, 0.029700996, -0.5003061, -0.07593551, -0.006682179, 0.036656495, -0.31372914) * inp_2_1_0; + result6 += M4(-0.021457711, -0.0019900585, 0.05084926, 0.081936136, 0.3753494, 0.09493894, -0.18673326, -0.11794002, 0.25595453, 0.08400333, -0.018064985, -0.048310984, 0.16797653, -0.060853757, 0.06483727, 0.011189334) * inp_2_2_0; + result6 += M4(0.13941164, 
-0.063394785, -0.0034332005, 0.17111054, -0.3990753, 0.02632524, -0.06816667, -0.21834038, -0.4288934, -0.22325225, 0.037174102, -0.5405136, 0.010273852, -0.0105224075, 0.013248547, 0.40732837) * inp_2_0_1; + result6 += M4(-0.08962223, -0.2226498, -0.1872196, -0.10598174, 0.3465477, 0.18969187, 0.053831596, 0.14565082, 0.123044804, 0.06839405, -0.1236372, 0.10534083, -0.038496677, -0.025535641, 0.04961797, -0.050057862) * inp_2_1_1; + result6 += M4(-0.086797, 0.042154882, -0.014092746, -0.044417284, -0.44362223, 0.13151413, -0.12720887, 0.10942756, -0.41959015, -0.036553595, -0.17896748, -0.06546312, 0.1287178, 0.06980131, 0.047464374, -0.04425047) * inp_2_2_1; + result6 += M4(0.058752462, -0.046499122, -0.06560196, 0.076821715, 0.065221585, -0.06323381, 0.075904384, -0.2815891, 0.10167673, 0.085431844, 0.0006833184, 0.19864999, -0.003908989, 0.014096975, 0.061565712, 0.18922071) * inp_2_0_2; + result6 += M4(-0.023859497, -0.04909467, 0.10589662, -0.1687173, -0.10612011, 0.036622375, 0.0424893, -0.035365675, 0.27256072, 0.17770343, -0.01699957, 0.044754315, -0.016159957, 0.050832182, 0.011317852, 0.08291619) * inp_2_1_2; + result6 += M4(-0.100903265, 0.040046252, -0.006190383, 0.12496574, -0.08680196, 0.116084926, -0.008635489, 0.05128598, 0.18719034, -0.08555466, 0.16260944, 0.41563207, -0.17537746, 0.03593093, -0.08937214, -0.11530117) * inp_2_2_2; + result7 += M4(-0.01982062, 0.19227089, 0.07580118, -0.01564463, -0.015477902, -0.06434723, -0.04389325, -0.26967463, -0.032943662, -0.087399565, 0.045613937, -0.26502544, -0.059663635, 0.07896823, -0.13964859, -0.07113337) * inp_2_0_0; + result7 += M4(0.015122787, 0.057662565, -0.07610588, -0.10633816, 0.19621149, 0.114655145, 0.0044023055, -0.11868959, -0.087640546, -0.09909117, -0.30400592, 0.087860994, -0.1193111, -0.07933329, 0.09902344, 0.08256956) * inp_2_1_0; + result7 += M4(-0.11638451, -0.075316876, -0.3201672, 0.004718106, -0.0046146857, 0.14694384, 0.21839611, -0.07057222, -0.027985927, 0.2378717, 
0.12468581, 0.04222978, 0.0016323507, -0.024048518, 0.59261656, -0.16611645) * inp_2_2_0; + result7 += M4(-0.22592212, 0.31972498, -0.08404233, 0.25021684, 0.008496462, -0.28084508, 0.06923707, -0.504983, -0.23233496, -0.29443064, 0.030090403, -0.43786904, 0.15586951, -0.1291383, -0.20086162, 0.35093188) * inp_2_0_1; + result7 += M4(-0.6406366, -0.2729402, 0.051681057, -0.18627988, 0.20781448, 0.29175138, -0.11135165, 0.13569482, 0.64130014, 0.37666848, -0.13812494, 0.23377776, 0.33473015, 0.36425686, -0.1265133, 0.15076241) * inp_2_1_1; + result7 += M4(-0.21743536, -0.000865273, -0.040638417, -0.03576051, 0.07567566, -0.18737459, -0.0038226645, 0.16512613, -0.025816003, -0.06373682, -0.14041999, 0.31136355, 0.18746994, 0.03762397, 0.34165812, -0.09347466) * inp_2_2_1; + result7 += M4(0.08801469, -0.26115394, -0.23565757, 0.15650904, -0.071703225, 0.15424898, 0.47631714, -0.5078269, 0.2222719, 0.07514514, 0.30085883, -0.46507084, -0.3119526, 0.11053857, -0.19479504, 0.33909222) * inp_2_0_2; + result7 += M4(0.25041574, 0.11308088, 0.081072845, -0.12108119, -0.11785, -0.19794494, 0.06143605, -0.20587383, -0.72203565, -0.028817391, 0.20734191, 0.25097057, 0.05389864, -0.21997295, -0.37290296, -0.07274896) * inp_2_1_2; + result7 += M4(0.16635342, -0.0983293, 0.041527614, -0.01580731, -0.05419251, -0.30510548, 0.022088433, -0.005240212, 0.23356004, -0.10731173, -0.039573394, 0.08254777, -0.05703987, -0.21068281, -0.06326769, 0.13715531) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = 
inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.14220184, 0.29581806, -0.1050509, 0.043722827, -0.022809098, 0.014713366, 0.014747514, -0.0151712205, -0.043942932, 0.008298421, 0.04066298, 0.033041958, -0.018717512, 0.23739426, 0.022260787, -0.046938676) * inp_3_0_0; + result0 += M4(-0.11163785, -0.23318845, 0.18948416, -0.03891877, -0.10855645, -0.07921256, 0.055309527, -0.116694175, 0.008841264, -0.0031489702, 0.022865087, -0.053723924, -0.024241634, -0.06823317, 0.00038335618, -0.025687473) * inp_3_1_0; + result0 += M4(0.002644073, -0.045697205, -0.03577432, 0.123700306, 0.012543277, 0.048040003, -0.025159027, -0.023060577, 0.027704353, -0.013723579, -0.04032055, 0.0072777257, 0.049085204, -0.0488234, 0.013184984, 0.08190091) * inp_3_2_0; + result0 += M4(0.11121829, 0.5713805, -0.098629035, -0.023255708, 0.08053442, -0.041370448, -0.05503379, -0.045689344, -0.0048542405, -0.044403378, -0.023725266, -0.10501844, 0.053676195, -0.37625402, -0.0012022955, 0.05435941) * inp_3_0_1; + result0 += M4(-0.079213396, -0.29827237, -0.0061785034, -0.06528836, -0.08570464, -0.0123205725, -0.09306517, 0.040397964, 0.09289772, 0.07834141, -0.0033718874, 0.10375401, -0.00702443, 0.11942383, 0.017393963, 0.053092834) * inp_3_1_1; + result0 += M4(0.12211842, -0.15758839, -0.10383393, 0.036095593, 0.124916494, 0.10678813, -0.039751172, 0.012379173, 0.041472487, -0.06389625, 0.04722299, -0.04202216, -0.059994843, 0.11173252, -0.004779031, -0.03157209) * inp_3_2_1; + result0 += M4(0.059037857, 0.23064092, -0.07214555, -0.17619008, -0.025874231, -0.11362508, 0.028976435, 0.03689161, -0.0012436241, 0.039338402, -0.028161326, -0.015724905, -0.0072414353, -0.03485324, -0.057183366, 0.054221116) * inp_3_0_2; + result0 += M4(0.014086952, -0.16905811, 0.11196831, -0.042952076, -0.023245735, -0.043856297, -0.0698888, -0.011209277, -0.044448152, 0.055338155, -0.028425442, 0.052961417, 0.01909251, 0.09022248, -0.0002994758, -0.11610538) * inp_3_1_2; + result0 += M4(0.047645338, 
-0.02096107, -0.050075144, -0.019411907, 0.046437737, 0.10304194, 0.040795293, 0.052342955, -0.05327969, -0.05934678, 0.025403949, 0.014482732, 0.008135477, -0.039806854, 0.009638727, -0.0019236362) * inp_3_2_2; + result1 += M4(0.030199047, -0.20870818, 0.107358895, -0.032064687, -0.02958267, -0.0196711, -0.026792657, -0.031558525, -0.07817445, 0.01813162, 0.009675942, 0.012233323, -0.015329561, -0.16804257, 0.05125411, -0.0046946756) * inp_3_0_0; + result1 += M4(0.034792785, -0.07371596, -0.011460319, 0.10177153, -0.075484, 0.054401577, 0.0646406, -0.17295581, 0.03523714, -0.0014632451, 0.01590928, -0.023483954, 0.015525324, 0.15043561, 0.14282876, -0.047376197) * inp_3_1_0; + result1 += M4(0.25155142, 0.08308516, -0.040026754, -0.05491031, 0.022805769, 0.0011284436, 0.0027504563, -0.021688981, -0.110222556, -0.041732293, -0.1316083, 0.06754725, 0.14578243, -0.08555171, -0.027260132, 0.060346637) * inp_3_2_0; + result1 += M4(-0.05066411, -0.10231594, 0.11965813, -0.072973646, 0.056161065, 0.10944876, 0.017292485, 0.13306467, 0.048061624, 0.0010493994, 0.02265206, 0.018558223, -0.04680016, 0.032021124, -0.061369233, -0.03628745) * inp_3_0_1; + result1 += M4(-0.1643362, 0.023754412, -0.04421771, 0.051398635, 0.08111207, 0.1028633, -0.00028525895, -0.11980875, 0.009836645, -0.09633457, -0.0001076693, 0.10617298, 0.19398087, -0.011596129, 0.0011294374, -0.09799514) * inp_3_1_1; + result1 += M4(0.10975527, 0.064917125, 0.011518881, 0.0023385242, 0.08232439, -0.03420218, 0.005478659, 0.040814776, 0.08117036, 0.117313966, 0.03403432, -0.044782173, -0.25941944, 0.13522075, -0.11086715, 0.07043135) * inp_3_2_1; + result1 += M4(-0.016384318, 0.009222316, 0.050930314, 0.0040175584, 0.0076967096, 0.027830876, 0.043031912, 0.119638085, 0.014207303, 0.0099121835, 0.026899142, -0.019493736, -0.012690073, 0.09567006, 0.024153594, 0.04894755) * inp_3_0_2; + result1 += M4(-0.090977706, 0.013185333, 0.033491775, 0.09460563, -0.07065113, 0.05860558, -0.0001504292, 0.0417031, 
0.025144998, 0.08045827, 0.04922298, -0.06822206, -0.14287035, -0.18531598, -0.04301882, 0.2223528) * inp_3_1_2; + result1 += M4(0.0094115315, 0.007858021, -0.05448468, 0.089828864, -0.07290204, 0.0018030866, 0.0012039106, 0.06237634, -0.050015524, 0.0108173685, -0.007279163, -0.053459134, 0.13459387, -0.029871335, 0.025917185, -0.22171456) * inp_3_2_2; + result2 += M4(0.11647479, 0.10076411, 0.11930618, -0.5001232, 0.040037896, -0.0004366756, -0.020107023, -0.090618476, 0.0030575655, 0.050145853, 0.0317201, 0.083271354, 0.09702204, 0.017685521, 0.14457823, -0.10257005) * inp_3_0_0; + result2 += M4(-0.13331696, -0.07726072, -0.029039314, 0.22883713, -0.01739428, 0.0469286, 0.03554923, 0.003434962, -0.009423783, -0.023191646, -0.014845551, -0.032700337, -0.079510346, -0.043419976, 0.0156192, 0.107626915) * inp_3_1_0; + result2 += M4(-0.15507331, -0.068423375, -0.041539546, 0.24189207, -0.09052856, -0.03045898, -0.0594716, -0.06372859, 0.044895723, -0.011765843, 0.01841326, -0.012792601, -0.03711853, -0.030372167, 0.02337175, -0.14652345) * inp_3_2_0; + result2 += M4(0.15467784, 0.35823032, 0.09850777, -0.15597041, 0.11420279, 0.075547986, 0.032267794, -0.14880848, -0.090415016, -0.017048024, -0.053521473, -0.11122125, -0.058699213, -0.03621905, -0.15886551, -0.061645642) * inp_3_0_1; + result2 += M4(-0.16869839, -0.04382488, 0.10822959, -0.076615535, 0.028365385, 0.16310996, 0.013281907, 0.14903001, 0.015622588, 0.011959068, -0.021492178, 0.1770453, 0.3412857, 0.14367792, -0.04293763, 0.00018098926) * inp_3_1_1; + result2 += M4(-0.05968951, 0.007490492, -0.10713938, 0.025387928, -0.15001795, 0.06333462, -0.013492463, 0.08956875, 0.019784143, -0.0657527, 0.055030365, -0.06502322, -0.0992953, -0.045847125, -0.015561308, 0.19500968) * inp_3_2_1; + result2 += M4(0.34842512, 0.17871244, -0.03964059, -0.27120742, 0.022584952, -0.13696362, -0.02976433, -0.07317687, 0.031326186, 0.0064884964, -0.044022623, 0.037614394, -0.0705752, -0.10642723, 0.058439463, 0.2230188) * 
inp_3_0_2; + result2 += M4(-0.059847344, -0.01139373, 0.13806899, 0.08948678, 0.01390379, -0.097241, 0.02743823, 0.016725708, -0.010654057, 0.025405332, -0.0010878934, -0.08476517, -0.08760278, 0.05094644, -0.19358766, -0.14211519) * inp_3_1_2; + result2 += M4(-0.17474808, -0.22108728, -0.21780892, 0.35220462, 0.009163019, -0.06104532, -0.053446397, -0.04392871, 0.0015393725, -0.00069702463, 0.03886848, -0.02923031, 0.00527017, 0.034089398, 0.16028263, -0.055244535) * inp_3_2_2; + result3 += M4(-0.018567495, 0.0026103545, 0.36512035, -0.018511413, 0.042726085, -0.121779025, -0.0759674, -0.027829297, 0.040537566, 0.032802176, -0.032742567, 0.01259471, 0.022687757, -0.14804396, -0.33376685, -0.033556912) * inp_3_0_0; + result3 += M4(-0.116059996, 0.12173986, -0.18802345, 0.13156602, -0.07677582, 0.06166233, -0.055367634, -0.043565907, -0.045016497, -0.056485992, -0.0025054468, 0.062424377, -0.11418986, 0.19949088, 0.16542612, 0.05149701) * inp_3_1_0; + result3 += M4(0.028589878, 0.08787085, -0.15834384, 0.008276506, 0.055699687, 0.0517054, -0.035402454, 0.022119103, 0.013805701, -0.07114713, -0.012704838, -0.095399395, 0.058038633, 0.020338465, 0.19678909, 0.13581684) * inp_3_2_0; + result3 += M4(-0.055346105, -0.022346426, 0.28103238, 0.06451777, -0.012666116, 0.049827963, 0.052170645, -0.009899708, -0.0043233866, -0.008591818, -0.002752428, -0.12905397, -0.04443095, 0.13801019, -0.030456353, 0.17349862) * inp_3_0_1; + result3 += M4(0.021500591, -0.04334728, -0.09889436, -0.0042085215, -0.027597575, 0.11979061, 0.09731146, 0.056554627, 0.03162167, 0.08822394, 0.056181837, -0.09152388, 0.13347569, -0.059502367, 0.043407016, -0.0048634615) * inp_3_1_1; + result3 += M4(0.051889032, -0.13060205, -0.053255986, 0.047219437, -0.036587156, -0.00361318, 0.11671864, -0.0060794465, -0.006730907, -0.01520898, 0.005964793, 0.040629286, 0.043768957, -0.052364953, -0.09406933, -0.09536944) * inp_3_2_1; + result3 += M4(0.048058864, 0.03373609, 0.28471413, -0.11747176, 0.03439936, 
-0.13080667, 0.030491013, 0.027022334, -0.0003300306, -0.039328486, 0.010704635, 0.21759433, 0.00070556474, 0.018552786, 0.168483, -0.176763) * inp_3_0_2; + result3 += M4(0.09441553, -0.015840568, -0.079968214, -0.21781057, 0.07723678, -0.046124, -0.07330958, 0.09381263, -0.01420818, -0.009802088, -0.0352734, 0.055251617, -0.028345533, -0.10139458, -0.08185518, 0.06420966) * inp_3_1_2; + result3 += M4(-0.065675996, -0.03485548, -0.1351602, 0.04892821, -0.02004268, -0.0053299735, 0.028146671, 0.008350671, -0.016548887, 0.07172998, -0.0016435798, -0.07355486, -0.06291693, 0.0022400378, -0.04194968, -0.100256324) * inp_3_2_2; + result4 += M4(0.10275624, -0.050601494, 0.055006552, -0.100944854, -0.047467656, 0.004118076, 0.054911327, 0.11621958, 0.0030265562, 0.029584533, 0.077024624, -0.017295482, 0.09255058, 0.12823223, 0.10996005, -0.006581182) * inp_3_0_0; + result4 += M4(-0.023460632, -0.07407528, -0.23225261, 0.01596762, 0.035419896, -0.102963164, -0.057545274, 0.21702328, 0.013119259, -0.019170007, 0.017791761, 0.0027059524, 0.14498927, -0.2147906, -0.1968048, 0.12059705) * inp_3_1_0; + result4 += M4(0.09735267, -0.008516496, 0.10029414, -0.12141932, -0.08180664, -0.010001622, -0.040972203, 0.17372316, -0.18491365, 0.103480205, -0.031467967, -0.068326965, 0.018889373, -0.0072864112, -0.010454968, -0.049856994) * inp_3_2_0; + result4 += M4(-0.14227402, 0.048893057, 0.15169342, 0.0589829, -0.0111398725, -0.0007021414, -0.021915037, 0.0072053983, 0.013556308, -0.06439848, -0.026270576, 0.02535592, -0.025688693, -0.03547005, -0.11827166, 0.008322918) * inp_3_0_1; + result4 += M4(0.015891457, -0.017897032, 0.007903984, 0.047343597, 0.09363182, 0.024844792, -0.05830995, 0.17132264, -0.06561783, 0.06570166, -0.015288811, 0.09247123, -0.0013438858, 0.11100324, 0.16285086, -0.082568325) * inp_3_1_1; + result4 += M4(-0.17172615, 0.11925204, 0.109492764, 0.016225312, 0.010063468, -0.025177682, 0.026810376, 0.17247847, 0.0182892, -0.08003335, -0.032131247, -0.04426509, 
0.027547639, 0.0038644287, 0.0622444, 0.026596734) * inp_3_2_1; + result4 += M4(0.18723038, -0.06356827, -0.09350727, 0.010388782, -0.03361306, -0.0015997153, 0.053034473, -0.068830036, 0.028943738, -0.033172213, 0.0083861165, 0.025625488, -0.101140805, 0.006527277, 0.14642856, -0.020703917) * inp_3_0_2; + result4 += M4(0.054269917, 0.035792064, -0.050312504, 0.08075724, 0.06187946, 0.021648116, 0.05535476, 0.15620534, 0.11397159, -0.0029014526, -0.019254057, -0.10412736, 0.079952665, -0.019412525, -0.06043989, -0.0028609503) * inp_3_1_2; + result4 += M4(-0.02539215, 0.01437164, 0.020025266, -0.059849497, 0.0072748433, 0.042192727, 0.06783724, 0.05773892, 0.06520988, -0.0026089048, 0.01743468, 0.08910741, -0.20436613, 0.026470054, -0.098164715, 0.011565031) * inp_3_2_2; + result5 += M4(-0.10841221, -0.0363878, -0.231216, -0.17400073, -0.022624917, -0.0694818, -0.092000924, -0.083555214, 0.0055065965, 0.09846925, 0.030156685, 0.01904306, -0.020952217, 0.059327304, 0.030406477, -0.1143399) * inp_3_0_0; + result5 += M4(-0.13173077, -0.26147693, 0.14895892, 0.15694575, 0.035660498, -0.0038643396, 0.10676744, -0.060635388, 0.037966434, -0.04905565, -0.0766657, -0.008407624, -0.16902927, -0.29815325, 0.014726095, 0.076710515) * inp_3_1_0; + result5 += M4(0.102596186, -0.05005975, -0.048240762, 0.04147368, -0.102371044, -0.044269536, -0.083829276, -0.017138937, -0.02299257, -0.04585765, 0.047417827, -0.052792363, 0.16407567, 0.2157907, -0.10534021, 0.07732776) * inp_3_2_0; + result5 += M4(0.11040525, -0.09375575, -0.2989762, 0.09015296, 0.009494491, -0.018460311, -0.0009432192, 0.10526945, -0.043539457, -0.059871405, -0.020558301, -0.023958672, -0.14667718, -0.09243026, -0.107162826, 0.11911795) * inp_3_0_1; + result5 += M4(-0.1350197, -0.13791439, 0.06368997, 0.0135857, 0.13447742, 0.109225266, 0.16954204, 0.026523715, 0.059673406, 0.031501997, -0.017856803, 0.07762521, 0.17063937, 0.086128615, 0.12133009, -0.03999287) * inp_3_1_1; + result5 += M4(0.21358466, 
0.010802508, 0.030539487, -0.100231655, -0.0720297, -0.024601962, 0.019359145, 0.23460163, -0.01684153, 0.045131125, 0.019434633, 0.059938397, -0.010893166, -0.23570989, -0.040062375, -0.21358533) * inp_3_2_1; + result5 += M4(-0.053052325, 0.7387682, -0.17492625, 0.017032824, 0.0071524233, -0.013409763, -0.057646163, -0.023101417, 0.0070181526, 0.088075995, -0.073717274, -0.009228015, 0.089969486, 0.17503998, -0.017464302, -0.033747226) * inp_3_0_2; + result5 += M4(-0.060896996, -0.20927513, 0.14395653, 0.055566028, 0.057375714, 0.023686128, -0.09188384, -0.14255336, -0.041927703, -0.104409404, 0.056969125, -0.049685113, 0.04641332, -0.26447034, -0.025084667, 0.05080997) * inp_3_1_2; + result5 += M4(0.10447019, 0.0021664004, 0.03300909, 0.013241151, -0.06567862, 0.019394988, -0.055819668, -0.09805172, 0.02324118, 0.033387065, 0.054767907, -0.00011540235, -0.1324057, 0.30173886, 0.126969, 0.103199705) * inp_3_2_2; + result6 += M4(-0.36202443, 0.17659415, 0.049923707, 0.15764862, 0.012453831, -0.0056842333, -0.003600969, 0.0120022455, 0.09898221, 0.052056625, 0.03754402, 0.14247002, -0.06303877, 0.020438142, -0.03389578, -0.27174982) * inp_3_0_0; + result6 += M4(-0.07228018, -0.031460524, 0.019936912, -0.18113697, -0.02745625, 0.04275978, -0.0007969192, -0.07990229, -0.16646542, 0.025946287, -0.020801041, -0.0667422, -0.20107456, -0.08823643, -0.012090548, -0.028368922) * inp_3_1_0; + result6 += M4(0.015523248, -0.043354906, -0.023148216, -0.19232436, 0.04778691, 0.060575824, -0.07492828, -0.007404456, 0.11407589, -0.013511919, -0.0016491567, -0.020163843, 0.45946974, -0.031038936, 0.020621896, -0.032983396) * inp_3_2_0; + result6 += M4(0.073867336, -0.1483454, 0.07699858, 0.30727065, 0.0850781, 0.05013866, -0.012111206, 0.0920334, -0.06709266, -0.025296757, -0.028023398, -0.200641, 0.09505046, -0.032021288, 0.09732993, 0.107672535) * inp_3_0_1; + result6 += M4(0.011917727, -0.18573129, -0.039482113, -0.10653897, -0.010152601, 0.033033486, 0.12093644, 0.014134082, 
0.12168461, -0.046516348, 0.022690218, 0.12506135, -0.036886904, 0.21988527, -0.016690405, 0.09360803) * inp_3_1_1; + result6 += M4(0.09410977, 0.057722185, 0.045246158, -0.070580885, -0.035504244, -0.08016729, 0.02729342, 0.06084015, -0.22293359, 0.06739874, -0.032340545, 0.09744865, -0.24910265, -0.14061959, -0.06767582, 0.1866403) * inp_3_2_1; + result6 += M4(0.20498458, 0.19927391, 0.107652985, -0.064823136, -0.014122271, 0.019808032, 0.035629053, -0.006818886, 0.003651494, -0.050823458, 0.013990394, 0.052466553, -0.14694835, 0.056151833, -0.026632998, 0.09014523) * inp_3_0_2; + result6 += M4(0.032013252, -0.045949485, -0.13705537, 0.061154846, -0.026881302, 0.00795819, 0.003864972, -0.02222533, 0.00807324, 0.025598124, 0.00879293, -0.029155701, 0.16247916, -0.11350233, 0.04666391, -0.027355118) * inp_3_1_2; + result6 += M4(-0.09051523, -0.11054118, -0.03317729, 0.19976345, -0.048919074, 0.028446138, 0.006867744, 0.06268193, 0.14603335, -0.011673084, 0.0077291573, -0.104334645, 0.019944651, 0.123291865, -0.035155844, -0.121591695) * inp_3_2_2; + result7 += M4(-0.05570162, -0.04828354, 0.025604865, 0.022930326, -0.006984085, -0.02662257, -0.11230645, -0.043253038, 0.052033827, -0.039332032, 0.007263562, -0.026950626, -0.03708213, 0.29722342, -0.104873344, -0.10744328) * inp_3_0_0; + result7 += M4(-0.13841997, -0.09366951, 0.057500567, -0.027023107, 0.08486296, 0.013217785, 0.010380215, -0.007562276, -0.0484528, 0.050976504, -0.1337574, -0.0021196397, -0.040356092, -0.24493831, -0.16932893, 0.061209347) * inp_3_1_0; + result7 += M4(0.0021701625, -0.10160458, -0.15599388, -0.1465994, 0.040690985, 0.025823733, 0.02045705, -0.0101641165, 0.017131211, -0.003134739, 0.110624395, -0.006075952, 0.02849226, -0.023113988, 0.27202505, 0.058406536) * inp_3_2_0; + result7 += M4(0.044703823, 0.15965404, -0.011037147, 0.5109806, 0.10312813, -0.022608232, 0.01945682, 0.1116657, -0.046794675, -0.107846156, -0.0085611185, 0.033983912, 0.056398768, -0.36921877, 0.047346402, 
-0.044937726) * inp_3_0_1; + result7 += M4(0.09941285, 0.19292344, 0.026810154, -0.21716522, 0.1708566, 0.009213916, 0.042141065, 0.049008094, 0.011651048, 0.16956031, 0.06624104, -0.02835029, 0.065781936, 0.19285975, -0.13246283, 0.18810649) * inp_3_1_1; + result7 += M4(0.04972977, 0.22763842, 0.28708026, -0.18241341, 0.05483751, 0.0013328108, 0.032350052, 0.07145266, -0.049057122, -0.044888075, -0.052508757, -0.018042825, 0.0497444, 0.16587968, -0.13421802, -0.118445605) * inp_3_2_1; + result7 += M4(0.0046838266, -0.4409666, -0.2597612, 0.41250828, -0.18498208, 0.04249205, -0.013993952, -0.038135, 0.03919663, 0.108871385, -0.041990787, -0.015019912, 0.032063566, 0.24547447, 0.10318247, -0.014512095) * inp_3_0_2; + result7 += M4(0.08283574, 0.18859686, -0.0856765, 0.03837081, -0.15208305, 0.09135492, 0.06807662, -0.08459724, -0.009910099, -0.13344067, 0.011595474, -0.008545678, -0.05208831, 0.00376925, 0.11690895, -0.21521091) * inp_3_1_2; + result7 += M4(-0.034031004, 0.020283002, 0.16722825, -0.2274462, -0.10500842, -0.106952816, -0.09739804, -0.043050934, 0.0352815, -0.021185046, 0.014114931, 0.056368798, -0.10320414, -0.2784876, -0.0018532448, 0.16714536) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.015347963, -0.068664856, 0.04645804, -0.112937756, -0.06175871, -0.1433821, 0.0025176874, 0.069849715, 0.086089835, 0.0019525258, -0.12190901, 0.10086868, 0.025729029, -0.093065195, 0.03597414, -0.08442831) * inp_4_0_0; + 
result0 += M4(-0.022431038, -0.03091568, -0.037138887, 0.09393001, -0.084375724, 0.06609799, 0.011646566, -0.05158206, -0.07297696, 0.021687489, 0.060903136, -0.07121508, -0.020559458, 0.0127250785, -0.024569467, 0.13495246) * inp_4_1_0; + result0 += M4(-0.0018076265, 0.01161834, -0.07099824, 0.023369938, 0.18064553, 0.047237743, 0.029539233, -0.09658718, -0.04571645, 0.06547593, 0.096877344, -0.040239953, -0.027432956, -0.005315208, -0.003156292, -0.07669967) * inp_4_2_0; + result0 += M4(-0.054001864, 0.20098436, -0.075695276, 0.012816671, -0.034243528, 0.0369853, 0.0294349, 0.014773263, 0.09470427, -0.5302787, 0.12485596, 0.052819043, -0.0327127, -0.16616333, -0.08262571, 0.020234514) * inp_4_0_1; + result0 += M4(0.016046144, -0.024816377, 0.03831941, -0.04718623, 0.08795951, 0.046626084, -0.0014814431, 0.14859195, -0.08441955, 0.23019505, -0.08293948, -0.02791357, -0.048614882, 0.19230148, 0.008847433, -0.11809789) * inp_4_1_1; + result0 += M4(0.055004288, -0.02935283, 0.001169136, -0.016408088, -0.17689867, -0.08972158, -0.04804486, -0.020838732, 0.0470175, 0.01945906, 0.059018467, 0.0671052, 0.1538387, -0.0051397923, 0.059761774, 0.079815395) * inp_4_2_1; + result0 += M4(0.052666795, -0.047520895, 0.11395038, 0.020103414, 0.12042282, 0.09387562, -0.07250865, -0.092701346, -0.213393, 0.37187365, -0.12505738, -0.08431384, -0.03445421, 0.1239568, 0.01918598, 0.015214686) * inp_4_0_2; + result0 += M4(-0.007434616, -0.001700406, 0.020891687, 0.019420985, -0.025226265, -0.09403224, -0.053130418, -0.03489649, 0.20018843, -0.22188586, 0.14417626, -0.021490153, 0.14246203, -0.046728626, 0.03610042, 0.07541829) * inp_4_1_2; + result0 += M4(-0.028029917, -0.0024124293, -0.033305515, 0.034131464, -0.05318704, 0.026769286, 0.08884552, 0.04889907, -0.017540498, 0.043866806, -0.14486933, 0.028184127, -0.13232058, -0.014637747, -0.030744046, -0.017228112) * inp_4_2_2; + result1 += M4(0.062242445, 0.003806714, 0.020724425, -0.024530057, -0.012798401, 0.068941124, -0.023947805, 
-0.0113810925, -0.047811907, -0.15170345, 0.028711537, 0.007991358, 0.04701127, 0.025249818, 0.0047800844, 0.0761221) * inp_4_0_0; + result1 += M4(-0.016507741, 0.0010444475, -0.10129273, 0.024638347, 0.2018351, 0.031926427, 0.05961932, -0.07143418, -0.06696651, 0.02543501, 0.0574603, 0.15273589, -0.043569755, 0.03250557, -0.011830026, 0.0005050185) * inp_4_1_0; + result1 += M4(-0.11386541, 0.010085473, 0.039012723, -0.008058504, -0.27889687, 0.0074400264, 0.027503373, 0.088229984, 0.13352963, 0.02258644, 0.009098703, -0.116981216, -0.18986647, -0.0058585242, -0.0305771, -0.05416138) * inp_4_2_0; + result1 += M4(0.014168622, -0.05011436, -0.08866536, -0.046353772, -0.06601335, 0.07485206, 0.005486981, 0.10850929, -0.020481676, 0.14530374, 0.2014894, -0.08188897, -0.01661501, -0.027097693, 0.042672105, -0.15946302) * inp_4_0_1; + result1 += M4(-0.07654896, 0.016076213, 0.09259981, -0.04827227, -0.12736493, -0.20943747, -0.12114548, 0.14080308, 0.23179926, -0.021129597, -0.08774192, 0.026381092, 0.14526787, -0.024885917, 0.04497208, 0.08400469) * inp_4_1_1; + result1 += M4(0.02684115, -0.14352526, -0.020265132, 0.15845658, 0.32814395, 0.10192891, 0.14333038, -0.45814818, -0.08770206, -0.02511608, -0.12954372, 0.07361434, -0.009698944, 0.010982917, -0.026692523, 0.15227987) * inp_4_2_1; + result1 += M4(0.016972719, 0.057248022, -0.006755407, 0.06422271, 0.060040038, -0.17989522, 0.0419648, -0.08762649, -0.0043210527, -0.04547064, -0.0063789706, -0.031473164, 0.021232963, 0.11072973, 0.035959743, 0.06449844) * inp_4_0_2; + result1 += M4(0.11196047, 0.052243356, 0.024443861, -0.060018744, -0.097404055, 0.20103906, -0.055618595, -0.017013773, -0.07736854, -0.033415396, -0.058290437, -0.10571163, -0.015254149, 0.030456558, -0.035810467, -0.08826208) * inp_4_1_2; + result1 += M4(-0.017307289, 0.08638532, -0.02579791, -0.053784084, 0.008788286, -0.12661941, -0.042239256, 0.26640934, -0.06532419, 0.07678242, 0.017023697, 0.07988674, -0.0010988557, -0.0037944408, 
-0.012944977, -0.10235324) * inp_4_2_2; + result2 += M4(-0.034974206, 0.06794813, 0.0035073175, -0.13393807, -0.061614662, -0.06021737, -0.074327454, 0.28772807, -0.06250681, -0.10218942, 0.12662503, 0.022742214, -0.10975214, -0.0063361567, -0.003025205, -0.085636094) * inp_4_0_0; + result2 += M4(0.016527109, -0.057549138, -0.06709942, 0.09974007, 0.030098781, 0.10552096, 0.14710502, -0.4480764, -0.0112706125, 0.01515357, 0.04363119, -0.014222173, 0.07512766, 0.03233325, -0.02863624, 0.19654723) * inp_4_1_0; + result2 += M4(0.043013055, 0.041099627, -0.123709075, 0.07187111, -0.07306719, -0.09428668, -0.04394538, 0.10755012, 0.02070349, 0.0828876, 0.13716455, 0.019693887, 0.063882254, 0.008052695, -0.013758167, -0.048417274) * inp_4_2_0; + result2 += M4(-0.009172881, 0.051556833, 0.060726427, 0.054615013, 0.03054924, 0.07875937, -0.008581751, -0.23570366, -0.019702753, -0.1866054, -0.015674567, 0.3555879, -0.06266117, -0.050504964, 0.01076697, 0.16294156) * inp_4_0_1; + result2 += M4(-0.10031015, -0.04609069, 0.18867433, -0.055574246, -0.10392824, -0.16170603, -0.20977044, 0.35697988, 0.35071892, 0.14930168, -0.18897198, -0.07844448, -0.055208653, -0.012442662, -0.012745678, -0.22062813) * inp_4_1_1; + result2 += M4(-0.034917817, -0.016817078, -0.04597928, -0.06561386, 0.24788813, 0.110733375, 0.2607216, -0.12861831, -0.15483572, 0.0019037564, -0.14894713, -0.08121656, -0.025103018, -0.007391733, 0.09671456, -0.004736849) * inp_4_2_1; + result2 += M4(0.019239163, -0.061022103, -0.02641717, -0.02905679, 0.04629351, 0.051416274, 0.07986066, -0.028329363, -0.02207861, 0.25481695, -0.079589345, -0.31572682, -0.0018124239, 0.08753095, 0.006467953, -0.20358352) * inp_4_0_2; + result2 += M4(-0.010853391, 0.009191581, 0.0020763124, 0.00044691635, 0.014615017, -0.059548005, 0.08654007, 0.0050915014, -0.04509479, -0.18360062, 0.06771911, -0.00044550904, 0.027544696, -0.07103817, -0.027311513, 0.11955296) * inp_4_1_2; + result2 += M4(0.13112625, 0.026925191, 0.016991375, 
0.10075743, -0.14101198, 0.022351323, -0.22590432, 0.06986497, -0.08234276, -0.0381189, 0.048623137, 0.1010553, 0.07715705, -0.008273326, -0.0035380786, 0.032877263) * inp_4_2_2; + result3 += M4(0.049718, -0.0606453, -0.0944228, -0.0024191968, -0.008600836, 0.1367621, 0.16765337, 0.047311954, 0.029113218, -0.14446715, 0.033425666, -0.10763291, 0.05308789, 0.021063123, -0.1392104, 0.06417157) * inp_4_0_0; + result3 += M4(-0.0403097, 0.001017961, 0.01609335, -0.123920076, 0.036830857, 0.08942833, -0.20540363, 0.19357881, 0.06437233, 0.1803794, -0.03597348, -0.003695139, 0.01393767, -0.09938359, 0.07078445, -0.17746519) * inp_4_1_0; + result3 += M4(0.008557043, 0.02948618, -0.041898903, 0.12602842, -0.059987336, -0.20075257, -0.13947296, -0.31092528, -0.1132687, -0.005653307, 0.028461065, 0.078161046, 0.028711727, -0.02853606, 0.02708031, 0.11947079) * inp_4_2_0; + result3 += M4(0.034526832, 0.020657927, 0.059900936, 0.007056605, -0.030451095, -0.12218506, 0.2213549, -0.04818652, -0.22491327, 0.10216525, -0.40150827, 0.13270788, -0.04383447, -0.043958217, -0.13285235, -0.025379898) * inp_4_0_1; + result3 += M4(-0.06988003, 0.034596894, -0.0026508719, 0.04078883, 0.027662968, -0.035777435, 0.13871337, 0.14527074, 0.23947015, -0.10171578, 0.29536808, -0.027721278, -0.000103672144, 0.060061257, 0.12627032, 0.009035187) * inp_4_1_1; + result3 += M4(-0.031302888, -0.0895872, -0.035844233, -0.14865923, 0.008552225, 0.23973386, 0.09681701, 0.30540127, 0.101203315, -0.0079374565, -0.012015204, -0.08439947, -0.013489955, -0.045119133, -0.07636911, -0.13508363) * inp_4_2_1; + result3 += M4(-0.09356465, 0.059054006, 0.10897642, 0.006153388, 0.07690732, -0.0763855, -0.34810522, 0.15194388, 0.2304762, 0.024355706, 0.21850228, 0.12032501, 0.021008208, 0.0115743885, 0.11795112, 0.065826215) * inp_4_0_2; + result3 += M4(0.20204175, -0.024561848, -0.069184594, 0.10076785, -0.17356102, -0.058159776, 0.08010355, -0.45695424, -0.45804262, -0.0034749857, -0.19004934, 0.1519923, 
-0.03731987, 0.0048805373, -0.041497987, 0.28867304) * inp_4_1_2; + result3 += M4(-0.048924565, 0.044160094, 0.059675954, -0.028196245, 0.11724903, 0.031242423, -0.03143809, -0.016586293, 0.12866212, -0.046329815, 0.03429844, -0.24092107, -0.029159248, 0.07122084, 0.01537091, -0.1994948) * inp_4_2_2; + result4 += M4(-0.07022611, -0.1489489, -0.049414024, -0.026796605, 0.044553045, 0.029765077, -0.10146301, 0.11443817, -0.027537528, 0.17826001, 0.058376607, -0.035831317, -0.021918504, -0.11589114, -0.06050097, -0.05082394) * inp_4_0_0; + result4 += M4(-0.04688623, 0.19128789, 0.043254264, -0.07466518, 0.21171208, -0.19197467, 0.050670788, -0.086094186, 0.08168199, -0.09633471, -0.08804017, 0.04045423, -0.12381782, 0.14991587, 0.08327295, -0.011405639) * inp_4_1_0; + result4 += M4(0.054191362, -0.029317293, 0.027033674, 0.03895992, -0.18602686, 0.19731207, 0.09325744, 0.03494674, 0.041359335, -0.07043728, -0.032838073, -0.03673499, 0.06255654, -0.01031302, -0.041171655, -0.017683838) * inp_4_2_0; + result4 += M4(0.097610936, 0.051053572, 0.026763389, 0.05238207, -0.1972272, -0.013619113, 0.077562205, -0.11514781, -0.16075905, -0.12547234, -0.032063875, 0.13928266, -0.023862006, 0.019713186, 0.052911054, 0.11128267) * inp_4_0_1; + result4 += M4(-0.028301813, -0.0837762, -0.020459857, 0.08439594, -0.08888771, 0.12981653, -0.119595625, 0.0062344214, 0.078405134, 0.033431035, -0.034099188, -0.29706937, 0.13518852, -0.08675123, -0.09147663, -0.020852897) * inp_4_1_1; + result4 += M4(-0.12631403, -0.00073663425, 0.013419659, -0.015249826, 0.36151773, -0.08041647, -0.058474917, 0.0053324434, -0.09226296, 0.057632837, 0.049839847, 0.0831306, -0.15372884, 0.0042750374, 0.0017865851, -0.11391898) * inp_4_2_1; + result4 += M4(-0.07926971, -0.027371088, -0.01110064, -0.017107418, 0.17038901, 0.06714438, -0.08350233, -0.031930126, 0.31153667, -0.05438068, -0.048561644, -0.07731436, 0.09884543, -0.007631899, -0.0013403071, -0.035442516) * inp_4_0_2; + result4 += M4(0.14012894, 
0.0028412007, -0.062296163, -0.08842521, -0.34216368, -0.028954593, 0.089838505, 0.10713954, -0.20487824, 0.024797026, 0.016134374, 0.22162604, 0.04851766, 0.042203438, 0.00096152845, 0.062135063) * inp_4_1_2; + result4 += M4(-0.025321418, 0.0444421, 0.009977276, 0.051531363, 0.08019694, -0.09846713, 0.056881953, -0.038393106, 0.013713512, 0.04312247, 0.11063409, -0.03899735, -0.044035774, 0.019130269, 0.036256697, 0.08657744) * inp_4_2_2; + result5 += M4(0.030981408, 0.08781324, 0.0465234, 0.028900536, -0.08502707, 0.047651898, 0.051460773, 0.11776715, 0.008373296, -0.059764728, -0.0953337, -0.122322835, 0.052956562, -0.044707738, 0.008952465, -0.045302067) * inp_4_0_0; + result5 += M4(0.07303235, 0.036684416, -0.013709382, -0.015096143, -0.009532191, 0.23011005, -0.11166426, -0.08966601, -0.058177434, -0.14690246, 0.111598514, 0.20627128, 0.056426786, 0.05660523, 0.0047775772, 0.017691562) * inp_4_1_0; + result5 += M4(-0.0065977685, -0.020389399, -0.04035871, -0.056656703, -0.001296415, -0.28594384, 0.13048528, 1.6333655e-05, 0.036310315, 0.08479238, -0.0068808305, -0.041508738, -0.03145242, 0.0749781, -0.06828677, -0.040379528) * inp_4_2_0; + result5 += M4(0.03188623, -0.11244197, 0.13534582, -0.008461294, 0.08006386, -0.025378594, -0.016635874, -0.20673247, -0.11248133, 0.0967427, -0.007489057, 0.17561181, -0.005050758, -0.01930356, 0.1797711, 0.11191476) * inp_4_0_1; + result5 += M4(-0.15243255, 0.018820502, -0.008216767, -0.026068626, 0.10426205, -0.18403246, -0.08314527, 0.22374412, 0.15961742, -0.21690856, -0.0077303206, -0.21131787, -0.039587844, -0.17945555, -0.07393377, -0.12739745) * inp_4_1_1; + result5 += M4(0.04706311, 0.026824584, -0.081707716, 0.062018704, -0.17168696, 0.30135295, 0.040612355, -0.0057184286, -0.070350975, 0.13984181, -0.058176886, 0.07217856, -0.04006961, 0.12129718, -0.069553226, 0.0813602) * inp_4_2_1; + result5 += M4(0.036619246, 0.14100142, 0.023282213, 0.051742148, -0.016604811, -0.12804525, -0.09562551, 0.07746391, 
-0.06442569, 0.17474443, 0.09775942, -0.15528885, -0.06495131, 0.22383533, -0.039015647, -0.02622935) * inp_4_0_2; + result5 += M4(0.022782035, -0.11527496, -0.06607121, -0.022222778, -0.109326735, 0.2814242, 0.27344614, -0.077948414, -0.0309022, 0.13699773, 0.11074792, 0.13306884, 0.08793571, 0.078675315, -0.0011466475, 0.079729445) * inp_4_1_2; + result5 += M4(-0.072083555, -0.023365624, 0.0013773862, -0.023897903, 0.1909737, -0.27293402, -0.1859008, -0.050656065, 0.1253508, -0.22552036, -0.13976125, -0.037139904, -0.007087417, -0.2299057, 0.111989535, -0.06787896) * inp_4_2_2; + result6 += M4(0.05125755, 0.020197475, 0.051851336, -0.04044587, 0.123426095, 0.04441016, -0.014034072, 0.12893628, -0.16182423, 0.10722033, -0.0011704656, -0.3681144, 0.10618148, 0.07166449, 0.035273563, -0.109781794) * inp_4_0_0; + result6 += M4(0.02106569, -0.040576797, -0.049933493, 0.00552437, -0.08974453, 0.1483031, -0.034924146, -0.0021361308, 0.04079294, -0.11598749, -0.003729837, 0.06637196, -0.0458319, -0.13152426, -0.06391264, 0.19713907) * inp_4_1_0; + result6 += M4(-0.21092935, 0.02182073, 0.03705599, 0.09195985, 0.11813646, -0.17102215, 0.00767189, -0.17389582, 0.2084574, -0.0021891808, -0.019679487, -0.030480323, -0.14351867, 0.08145486, 0.018724296, 0.10749066) * inp_4_2_0; + result6 += M4(0.07340585, 0.029559419, -0.041336842, 0.0030860824, -0.21102114, -0.08455312, 0.03509718, -0.14093173, -0.24958752, -0.069229946, 0.09697096, 0.46258098, -0.18969557, -0.039852537, -0.061017238, 0.0780439) * inp_4_0_1; + result6 += M4(-0.049350746, -0.06178836, -0.046902917, 0.11307912, 0.0908593, -0.24150716, 0.14461373, -0.054369617, -0.0010273365, 0.084890105, -0.09785255, -0.002330616, -0.004343787, 0.091098666, -0.03035586, -0.05609253) * inp_4_1_1; + result6 += M4(0.1906352, 0.03562363, 0.05633377, -0.24253497, -0.22601411, 0.2752202, -0.16600806, 0.2319767, -0.19106264, -0.0181399, 0.032506607, -0.12824795, 0.13629645, -0.073911026, 0.08124848, -0.14383006) * inp_4_2_1; + 
result6 += M4(0.00283909, 0.005476308, -0.007212551, -0.051652085, 0.21574217, 0.007472785, -0.06870259, -0.005254144, 0.1919404, 0.018648757, 0.04264531, -0.3499618, 0.1969271, -0.038681425, 0.075780615, -0.22787845) * inp_4_0_2; + result6 += M4(0.044691067, 0.008617043, -0.01647189, -0.051183738, -0.05136751, 0.14447081, -0.07357494, -0.08821368, 0.06784491, 0.037806783, 0.015042085, 0.20493537, 0.07330816, 0.011998123, 0.0027163553, 0.13485123) * inp_4_1_2; + result6 += M4(-0.16050476, -0.008769032, 0.015945897, 0.14171965, 0.040322777, -0.14308958, 0.17062505, 0.07755573, 0.13424328, -0.028520895, -0.076917514, 0.13208783, -0.07813255, 0.064059675, -0.05208738, -0.022037482) * inp_4_2_2; + result7 += M4(-0.027150644, 0.015814956, -0.05754513, -0.04873897, 0.11025416, -0.435392, 0.19333814, 0.1508991, -0.024739647, 0.235516, 0.008029071, 0.16134943, -0.028440928, 0.11872575, 0.005241932, 0.052433252) * inp_4_0_0; + result7 += M4(0.05012264, 0.04066345, 0.16703197, 0.07589541, -0.1270166, 0.22868992, -0.17756659, -0.25659922, -0.08701758, -0.23962207, 0.12861854, -0.005225858, 0.046291653, -0.067466155, 0.18713556, 0.10580186) * inp_4_1_0; + result7 += M4(0.03803395, 0.044674866, -0.14320253, -0.060602285, -0.01924285, 0.18292303, 0.058129393, 0.07757843, 0.027198482, -0.102262065, -0.27906904, -0.0512138, 0.035892766, -0.10657082, -0.28256884, -0.09792226) * inp_4_2_0; + result7 += M4(-0.012270241, 0.053292412, 0.016127117, 0.19542322, 0.057889953, 0.16662508, -0.03501168, -0.11492125, -0.090744615, 0.09574408, 0.11650677, -0.41509, -0.013611491, 0.23077895, 0.07481661, -0.20365353) * inp_4_0_1; + result7 += M4(-0.050340824, -0.054458, 0.06925373, -0.015471931, 0.20114389, 0.2039917, -0.030549502, 0.015708799, 0.18677916, 0.118704855, -0.21017921, 0.2957251, -0.117368944, -0.09008227, -0.08263792, 0.026435705) * inp_4_1_1; + result7 += M4(-0.054188915, 0.029804207, -0.009779273, -0.081521824, -0.15916476, -0.36768237, 0.075100474, 0.0754138, 0.0321642, 
0.12112747, 0.029604962, 0.065914765, 0.0464749, 0.075301185, 0.1676729, 0.18092157) * inp_4_2_1; + result7 += M4(-0.05563333, -0.12616087, 0.012166298, -0.04718368, -0.104780555, 0.29519585, -0.16578898, -0.07897049, 0.27093765, -0.37851065, -0.006221345, -0.16941196, 0.07149533, -0.3072529, -0.006891178, 0.0058584786) * inp_4_0_2; + result7 += M4(0.08174425, 0.0066998987, -0.1545479, -0.045850534, -0.21832131, -0.36911124, 0.2271025, 0.24205635, -0.25416878, 0.21453868, -0.0020685422, -0.076271765, 0.027678948, 0.06828489, -0.16908534, -0.028928304) * inp_4_1_2; + result7 += M4(0.020836782, -0.004165595, 0.09501674, 0.050931085, 0.25541326, 0.04736341, -0.15443301, -0.12439448, -0.053851433, -0.07920274, 0.19243084, 0.17072554, -0.06956967, 0.036722843, 0.03300749, -0.030620713) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.12003355, -0.16197917, 0.059405312, 0.07180529, -0.05629396, 0.013290857, -0.0052766665, 0.09455482, 0.01543527, 0.011780181, 0.057772804, -0.13602418, -0.061191246, -0.16955279, 0.124109864, -0.1183837) * inp_5_0_0; + result0 += M4(0.05955308, 0.053755064, -0.05912226, 0.059642237, -0.0071855322, -0.029552229, 0.03535187, -0.15141864, -0.009641184, -0.026793739, -0.050860763, 0.11444209, 0.08226794, -0.07105464, -0.042521194, 0.07108895) * inp_5_1_0; + result0 += M4(-0.013662906, 0.015743596, -0.014923373, -0.093593605, 0.03436503, 0.041070525, 0.059213225, 0.02759247, 0.02458038, -0.031689767, 
-0.009155178, 0.044973597, 0.07871554, -0.00091928855, -0.032794576, -0.061289173) * inp_5_2_0; + result0 += M4(-0.04006067, 0.033175442, -0.03350228, -0.034955546, 0.08868477, -0.3529098, 0.026085868, 0.01780157, -0.070186034, 0.14003612, -0.09421042, 0.029189141, -0.22171648, 0.48245174, -0.08523667, -0.048465196) * inp_5_0_1; + result0 += M4(-0.031620048, 0.048981346, 0.119027406, -0.053538505, -0.10466223, 0.20030582, 0.0031505707, 0.18679461, -0.0039542615, -0.1092992, -0.030247496, -0.081444435, 0.090862796, -0.09707826, 0.04802185, 0.1843612) * inp_5_1_1; + result0 += M4(0.025353258, -0.08440316, -0.071790025, 0.0939602, -0.02492188, -0.010279576, -0.0085374415, -0.07879575, -0.05467549, 0.10885414, 0.06744527, -0.038631376, -0.005260795, 0.0062984955, -0.011207649, 0.0042925635) * inp_5_2_1; + result0 += M4(0.04318823, 0.017087901, 0.015507152, -0.0399064, -0.05217652, 0.18274924, -0.024354495, -0.018944124, 0.14000441, -0.16249917, 0.06768747, 0.034056284, 0.33973533, -0.24633941, 0.06325992, 0.051955324) * inp_5_0_2; + result0 += M4(0.090544865, 0.03812243, -0.04685882, 0.07921033, 0.13163239, -0.08538402, 0.047212694, -0.10792595, -0.10553096, 0.11198856, 0.01893768, -0.002910181, -0.22805168, 0.09493717, -0.1350254, -0.028514877) * inp_5_1_2; + result0 += M4(-0.0020659876, 0.02641642, 0.050112758, -0.056890834, -0.028001526, 0.0004420334, -0.08067158, 0.030398091, 0.030433327, -0.033877548, -0.034929655, 0.02662399, -0.10773558, -0.006818527, 0.056062534, -0.04896137) * inp_5_2_2; + result1 += M4(0.03258047, -0.052619673, 0.05270988, 0.040191118, -0.09071488, -0.06996327, 0.16471885, -0.06737587, 0.052756038, -0.0022453472, 0.092932105, -0.010896488, 0.04580427, 0.085039, -0.07618685, 0.064979956) * inp_5_0_0; + result1 += M4(0.1951554, 0.036085036, -0.009290518, 0.069995, 0.14538154, 0.063646965, 0.092518404, 0.059114642, 0.063923776, -0.06806279, -0.09183431, 0.05754977, 0.35395905, 0.19334923, 0.10200411, -0.02997106) * inp_5_1_0; + result1 += 
M4(-0.24828573, -0.004792883, 0.022715965, -0.09860157, 0.025934624, -0.023228055, -0.05306074, 0.06148609, 0.061106965, 0.08510779, 0.0964113, -0.060335647, -0.5500463, -0.015466951, 0.0038261348, 0.029761259) * inp_5_2_0; + result1 += M4(-0.05167719, 0.029057823, -0.014516638, -0.116867214, -0.030308379, 0.09485954, -0.063914984, 0.05470092, 0.041646264, -0.0063661053, -0.116822705, -0.105100274, -0.019247223, -0.0832243, -0.12425487, -0.0118761435) * inp_5_0_1; + result1 += M4(-0.021092294, -0.029194383, -0.050390244, 0.00158418, 0.16306238, -0.13986772, 0.005240572, -0.10477794, -0.16051888, 0.063361645, 0.0143055245, -0.039061237, -0.20482795, -0.17144455, -0.057555333, -0.08863986) * inp_5_1_1; + result1 += M4(-0.015010751, -0.011550606, -0.11363092, 0.118543334, -0.10496344, 0.04566546, -0.038451992, -0.06844769, -0.02229933, -0.15297353, 0.044718236, 0.04278037, 0.30405974, 0.074570045, 0.15799953, -0.19066344) * inp_5_2_1; + result1 += M4(0.04853332, -0.032755524, 0.0049538394, 0.031706464, 0.0047149574, -0.07018417, 0.01809364, -0.031045804, -0.017443474, 0.00020574062, -0.08245773, 0.1705651, 0.06239835, -0.024232745, 0.065580495, -0.02700926) * inp_5_0_2; + result1 += M4(0.08792307, 0.11839337, 0.15449655, -0.019440375, -0.10750216, 0.14731896, -0.095238104, 0.033393282, 0.015933257, -0.044214644, 0.080685206, 0.07126956, -0.07176213, 0.14139394, -0.09018208, 0.08857924) * inp_5_1_2; + result1 += M4(-0.03942989, -0.0033529664, -0.045179617, -0.046639547, 0.0153619535, -0.045801118, 0.0061453776, 0.08117962, 0.0061470335, 0.08383105, 0.008545463, -0.1630509, 0.11137197, -0.22180216, -0.007165417, 0.13725665) * inp_5_2_2; + result2 += M4(-0.07162368, 0.008320469, -0.016239693, 0.07078737, 0.023477828, -0.047015175, 0.07388938, -0.0029179566, 0.09491361, 0.03563946, 0.011633351, -0.25174063, -0.059890006, -0.018932959, -0.18780632, 0.2579437) * inp_5_0_0; + result2 += M4(0.028248543, 0.019484054, -0.027846083, 0.041749362, -0.08646284, -0.030927047, 
0.09021006, -0.09275915, -0.08607313, -0.10149054, -0.1400739, 0.2731593, -0.13838679, 0.021160038, 0.034722634, -0.057621293) * inp_5_1_0; + result2 += M4(-0.03982442, 0.026836047, -0.03613328, -0.04447033, -0.0022374494, 0.052297074, -0.036316257, 0.05577091, -0.008493564, 0.031058041, -0.043638617, -0.11503755, -0.0076658786, -0.058363948, -0.2052407, -0.025714977) * inp_5_2_0; + result2 += M4(-0.095139764, 0.0247599, -0.011542132, -0.07359805, -0.13077253, -0.063271865, -0.07238107, 0.069741495, -0.0064015957, 0.083768986, 0.017574271, 0.011000743, 0.12050844, 0.3159717, 0.0133289695, -0.5839281) * inp_5_0_1; + result2 += M4(0.0070453915, -0.18619055, -0.05005009, 0.050016135, 0.3226143, 0.05727172, -0.16433138, 0.21040182, -0.026514474, 0.09263667, 0.2196227, -0.18017212, -0.25222498, -0.3095673, 0.0573257, 0.1467147) * inp_5_1_1; + result2 += M4(0.111105636, 0.05933965, 0.19296558, -0.059382055, -0.0032696927, 0.01649373, 0.120798446, -0.13421486, 0.063438565, -0.05486111, -0.086723626, 0.23265551, 0.28463507, 0.10272014, 0.43203583, -0.019537918) * inp_5_2_1; + result2 += M4(0.026049253, -0.004973095, 0.08159644, -0.03636471, 0.011969807, 0.06550089, 0.062204897, -0.00113211, -0.0769578, -0.11944113, 0.051923975, 0.039290503, 0.021110805, -0.22022353, 0.07161828, 0.38350755) * inp_5_0_2; + result2 += M4(0.02627604, 0.053603858, -0.124548875, 0.013245878, -0.03297196, -0.06992905, -0.10844409, -0.14215866, 0.035372898, 0.035923637, -0.11074343, 0.03117478, -0.04783038, -0.029917013, -0.034464158, 0.030497307) * inp_5_1_2; + result2 += M4(0.0071609905, -0.03536496, 0.00039634493, 0.034345772, -0.07917082, -0.012948089, -0.021412505, 0.09780846, 0.015765065, -0.0051242504, 0.085272364, -0.04523213, 0.07473343, 0.1924517, -0.1613756, -0.0695631) * inp_5_2_2; + result3 += M4(0.0936764, 0.0727645, -0.09191257, 0.028542265, -0.004242984, -0.12925819, -0.05965603, -0.0916298, 0.044130825, 0.055520903, -0.11651543, 0.05937713, 0.02960808, 0.20339587, -0.04215195, 
0.105516575) * inp_5_0_0; + result3 += M4(-0.00086285215, -0.0053421725, 0.09163141, -0.02215397, 0.017044332, 0.18502776, -0.052835803, 0.14749831, -0.09115981, -0.020195, 0.08422582, -0.047440406, 0.0036308488, -0.08399501, -0.14179623, 0.2076642) * inp_5_1_0; + result3 += M4(0.065958485, -0.05092897, -0.12486665, -0.01591939, -0.026933705, -0.00034600915, -0.04012294, 0.01835805, 0.025524888, 0.11017898, 0.051572528, 0.0050430587, -0.0061673275, -0.14830218, -0.070066296, -0.17512442) * inp_5_2_0; + result3 += M4(-0.006322129, -0.05130162, -0.10250846, 0.078147486, 0.010313552, 0.09160393, -0.19518466, 0.10126341, 0.08569675, -0.02202771, 0.10800954, 0.09647128, 0.14175075, -0.21591015, 0.42399246, -0.009744689) * inp_5_0_1; + result3 += M4(-0.08427477, 0.035397388, 0.04334003, 0.11795246, 0.17240937, -0.07412815, 0.2852057, 0.03035263, -0.1237582, -0.045732386, -0.23397751, -0.021895723, -0.282495, 0.10910523, 0.18405761, 0.02430514) * inp_5_1_1; + result3 += M4(-0.055420503, -0.035713453, -0.05819, -0.034817934, -0.07711311, 0.0031517823, 0.0824834, 0.03513442, 0.037209656, -0.02826138, 0.019423742, -0.048010595, -0.1830242, 0.19548298, 0.18720385, 0.25826752) * inp_5_2_1; + result3 += M4(-0.012711321, -0.014773102, 0.08445789, -0.0011040412, -0.03532163, 0.03572516, 0.095552124, 0.16370453, -0.16713002, 0.0035945307, 0.13715753, -0.2738259, -0.17380354, 0.05297608, -0.28510606, -0.06673679) * inp_5_0_2; + result3 += M4(0.065061085, -0.002477947, 0.06363547, 0.14726545, -0.19244426, 0.011858805, -0.17093466, -0.2225141, 0.29929358, -0.025185632, 0.06759338, 0.06628545, 0.4007033, -0.08818937, 0.025526904, -0.34851858) * inp_5_1_2; + result3 += M4(-0.056808334, 0.04388231, 0.092988245, -0.32249317, 0.14241633, -0.09635709, -0.028627941, -0.24672635, -0.12270784, -0.010564661, -0.08020065, 0.19258168, 0.074817345, 0.0062310006, -0.2813075, -0.05714053) * inp_5_2_2; + result4 += M4(0.14351599, -0.23870468, -0.026942117, 0.01242863, -0.0042657256, 0.11563464, 
0.08670423, -0.051678367, 0.14876002, -0.11070847, -0.11774867, -0.064385824, 0.06939922, -0.16355611, -0.1529536, 0.05954419) * inp_5_0_0; + result4 += M4(-0.12006971, 0.20102823, -0.083869666, -0.09750756, 0.27393854, -0.302599, -0.23688407, 0.08711506, -0.07741656, 0.096549965, -0.014315022, 0.04604538, 0.05278051, -0.09231464, 0.042200197, -0.15771396) * inp_5_1_0; + result4 += M4(0.07737635, 0.012567092, -0.004091606, -0.029619686, -0.11469922, 0.12536775, 0.06810136, -0.06348559, 0.140911, -0.113748066, 0.015589228, 0.0025230474, -0.07012043, 0.22377232, 0.113108814, 0.08852651) * inp_5_2_0; + result4 += M4(0.0056582396, 0.078882545, 0.0077623185, 0.032017227, -0.055795144, -0.13769925, -0.054563537, 0.032173645, 0.029430533, 0.0018932626, -0.013880744, -0.041406777, 0.07825584, 0.1353202, 0.007053003, -0.21357124) * inp_5_0_1; + result4 += M4(0.031096337, -0.06709735, 0.042306617, 0.08148489, -0.099168226, 0.26118174, 0.027319256, -0.15638678, -0.075788885, -0.05370201, 0.13126755, 0.07045495, -0.22505215, 0.13080864, -0.036012262, 0.3554495) * inp_5_1_1; + result4 += M4(-0.091560796, 0.043158796, -0.035778236, -0.08161522, 0.09801841, -0.055962037, 0.0025960545, 0.082062796, -0.010049943, 0.08080348, 0.05516002, -0.05857115, 0.31706148, -0.091393486, -0.11543547, 0.014303345) * inp_5_2_1; + result4 += M4(0.033979546, -0.016973428, 0.021975696, -0.06751869, 0.11583836, 0.01712324, -0.029094141, -0.015134157, -0.29137477, 0.07932426, 0.10633309, 0.042257246, -0.29559028, 0.05290787, 0.009760574, 0.06686467) * inp_5_0_2; + result4 += M4(0.024116596, 0.010916278, -0.0033806204, 0.035124186, -0.12094391, -0.015575345, 0.071325466, 0.05094787, 0.21398658, -0.03600775, -0.119391106, -0.018717255, 0.080642305, -0.13165694, -0.05458357, -0.17661105) * inp_5_1_2; + result4 += M4(-0.11885578, -0.02852532, 0.05854512, 0.11888104, -0.07900621, -0.015379971, 0.029345816, 0.032982536, -0.038481638, 0.038634837, -0.055058125, 0.024901068, -0.07451205, -0.060470708, 
0.16448991, -0.03274605) * inp_5_2_2; + result5 += M4(0.0062863613, 0.094014004, 0.06838872, 0.017027162, -0.0066087837, 0.109006256, 0.009656355, -0.12624873, 0.039297182, 0.055420354, 0.010825974, 0.024931299, -0.038787495, 0.25810665, 0.19611731, 0.21545151) * inp_5_0_0; + result5 += M4(0.07559675, -0.0463294, -0.037242327, 0.035878398, -0.038687695, -0.1375315, -0.025202958, 0.16201124, 0.013408605, 0.014355783, -0.096680835, 0.022255216, 0.03341664, 0.21360716, -0.19629255, -0.080730826) * inp_5_1_0; + result5 += M4(0.05780671, 0.03151051, -0.09533458, -0.036138754, 0.085325405, 0.079871885, -0.05447282, -0.015572637, -0.038760122, 0.0092937825, 0.050205197, 0.044981916, 0.070406854, -0.21447529, 0.086107105, -0.1265078) * inp_5_2_0; + result5 += M4(-0.038627252, -0.083129525, 0.17659403, -0.00029304123, -0.05110783, -0.11466111, 0.041817386, 0.08996499, 0.0058902204, -0.101673685, -0.097280845, 0.016377315, 0.123583294, -0.37882477, 0.18708384, -0.21274601) * inp_5_0_1; + result5 += M4(0.017891554, -0.0924529, -0.11230249, -0.04422683, 0.19535036, -0.07621418, -0.015419963, -0.052413005, -0.12729426, 0.25029254, 0.109996825, -0.03906445, -0.15298806, 0.20329486, -0.15516731, 0.16511911) * inp_5_1_1; + result5 += M4(-0.116612375, 0.08374208, -0.053796217, -0.06865302, -0.13067329, 0.0070271594, 0.0050101983, -0.036871094, 0.045488104, -0.20447975, 0.019111462, -0.009512405, -0.11449201, 0.08815275, -0.0013520175, -0.04141479) * inp_5_2_1; + result5 += M4(0.012299937, 0.040253855, -0.020103863, 0.014504533, 0.0070058526, 0.34766734, -0.011668727, 0.011997763, 0.05332768, -0.12484089, 0.1411861, 0.017044658, 0.07146129, -0.17852463, -0.046510007, 0.261115) * inp_5_0_2; + result5 += M4(0.013000854, 0.01427056, 0.06157069, 0.034582317, -0.06337898, -0.1682466, 0.1966991, 0.033848155, 0.081196725, -0.09845173, -0.17626299, -0.04258284, 0.040944576, 0.01767872, 0.096687, -0.13569689) * inp_5_1_2; + result5 += M4(0.0011596079, -0.02902239, 0.039856132, 0.06654238, 
0.06272485, -0.040144224, -0.14967823, -0.011194731, -0.08152785, 0.17720066, 0.02770775, -0.029510932, -0.015763372, -0.008295878, -0.17469892, -0.06197967) * inp_5_2_2; + result6 += M4(0.12634937, 0.0047176755, -0.0023666045, -0.17185715, 0.041995194, 0.08580433, -0.019855058, -0.16372326, 0.0005703018, -0.051382005, 0.09084429, -0.0923641, 0.5026688, -0.13673092, -0.041429102, 0.2305102) * inp_5_0_0; + result6 += M4(-0.17184043, -0.046707463, -0.09629054, 0.17896427, -0.14317074, -0.034042265, -0.028564677, -0.09288513, -0.04052649, -0.103569254, -0.11988994, -0.016139982, -0.2713395, 0.21981595, -0.13325606, 0.13163035) * inp_5_1_0; + result6 += M4(0.17869763, 0.04220423, 0.020358948, 0.0024650232, 0.24445039, -0.09796552, 0.030105257, -0.017725293, -0.083676815, 0.10193483, -0.007315185, 0.041317523, -0.058383707, -0.1376982, 0.0880252, -0.056816675) * inp_5_2_0; + result6 += M4(-0.099820845, 0.03825947, 0.02760095, 0.12253293, -0.15873304, -0.03239704, 0.12766914, 0.076064214, 0.12373115, 0.028318314, -0.05778652, 0.000201399, -0.03422849, 0.14859863, -0.07394239, -0.45415223) * inp_5_0_1; + result6 += M4(0.0046086614, -0.029323088, 0.0037501832, 0.027988294, 0.03323502, -0.051436786, -0.05228498, 0.044276025, 0.034207437, 0.16238986, 0.010878247, 0.08464746, 0.1487494, -0.26896262, 0.20652126, -0.18100755) * inp_5_1_1; + result6 += M4(-0.035197876, -0.04366502, 0.035339285, 0.050565384, -0.29892582, 0.072769985, -0.1155187, 0.13084127, 0.20492572, -0.10352106, 0.05120397, -0.16049863, -0.16324668, 0.18290119, -0.10591192, 0.4367685) * inp_5_2_1; + result6 += M4(0.06542644, -0.014019163, 0.049701963, -0.17240004, 0.05597519, 0.061345052, -0.050692916, -0.055611074, 0.015141942, 0.019591434, -0.02537892, 0.16448306, 0.10904281, 0.019480957, -0.057452843, 0.29781646) * inp_5_0_2; + result6 += M4(0.02090635, 0.048748102, -0.0068986276, 0.07381991, 0.12719898, 0.06750788, -0.011535723, 0.03762042, -0.08301663, -0.14192106, 0.064508125, -0.18024893, -0.19493704, 
0.038035985, -0.10094456, -0.37358606) * inp_5_1_2; + result6 += M4(-0.061400414, 0.034934737, -0.03841873, -0.13124485, 0.12522037, -0.020985782, 0.077340946, -0.02178773, -0.20025279, 0.067012675, 0.0019786628, 0.14482464, -0.09902924, -0.08181926, 0.19886817, -0.0876146) * inp_5_2_2; + result7 += M4(0.005649079, -0.059613556, 0.02964755, -0.008253926, -0.032677952, 0.0048968527, -0.05435635, 0.037290543, 0.005426379, 0.14760187, -0.13819705, -0.20871899, 0.05374583, -0.60471654, 0.12308755, 0.09233771) * inp_5_0_0; + result7 += M4(0.008553421, -0.0645067, 0.038095362, 0.13192508, -0.05705614, -0.03130014, -0.05336549, -0.004368372, -0.020328974, 0.056116655, 0.16079322, 0.080766626, 0.03758701, 0.27084115, -0.19478312, -0.11305778) * inp_5_1_0; + result7 += M4(0.025759513, -0.11544007, -0.13009948, -0.09325596, 0.031546887, 0.009393887, 0.10479527, -0.010015455, 0.021379417, 0.02588358, 0.09822233, 0.013954054, 0.006573289, 0.28000477, 0.47753495, -0.035638705) * inp_5_2_0; + result7 += M4(0.0641764, 0.13217968, 0.039280195, -0.16454938, -0.025768677, -0.022151973, 0.05872212, -0.23989552, 0.085176446, -0.17971896, -0.09992917, 0.27695453, 0.15325901, 0.043672174, -0.09613854, 0.21809594) * inp_5_0_1; + result7 += M4(0.0074359905, 0.1685519, -0.09009094, 0.08143212, 0.17212771, 0.2637319, -0.08570341, 0.16874231, -0.11409092, -0.17448346, 0.046117924, -0.05846929, -0.06711896, 0.17457324, 0.10569317, -0.16965592) * inp_5_1_1; + result7 += M4(0.024910688, 0.02056893, -0.012128357, 0.040595967, 0.031881515, -0.038413577, -0.04442754, 0.06732903, 0.07553692, 0.11135082, 0.034813605, -0.05207529, -0.12512033, -0.3301706, -0.12434907, -0.04464195) * inp_5_2_1; + result7 += M4(-0.05928546, -0.033062376, 0.030242398, -0.051686622, 0.10269837, -0.053202778, 0.031299736, -0.19218338, -0.16345605, 0.08292737, 0.21957637, 0.13657396, -0.3350501, 0.51627177, -0.172988, 0.0145964045) * inp_5_0_2; + result7 += M4(-0.01876092, -0.030428665, -0.021914767, -0.04481331, 
-0.24269202, 0.023109574, 0.02617615, 0.024787918, 0.19887243, 0.08684815, -0.20336089, -0.14958073, -0.037786152, -0.34368092, 0.090763696, 0.18229406) * inp_5_1_2; + result7 += M4(-0.072768904, -0.041036393, 0.10446251, 0.07985334, 0.006942449, -0.14677073, 0.026783535, 0.07301252, -0.09170757, -0.15814917, -0.097314164, -0.02838477, 0.29388687, -0.03887368, -0.18596645, -0.14245121) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.012106466, -0.15345298, -0.08378939, 0.12622406, 0.012718541, -0.008613582, 0.033625353, 0.025256662, -0.044943176, 0.1857792, -0.029300677, -0.03670613, 0.039346103, 0.111817226, 0.01024991, -0.0119714085) * inp_6_0_0; + result0 += M4(-0.037384275, -0.14414127, 0.0962, -0.046945114, -0.0671494, -0.039485455, 0.012243028, -0.0028543829, 0.008464603, 0.08692771, -0.03990161, 0.13193013, -0.04097, -0.04636373, -0.19106796, 0.0985175) * inp_6_1_0; + result0 += M4(-0.018671004, -0.017943678, 0.04398808, 0.094916835, 0.07654241, 0.033742562, -0.039423797, -0.045341562, -0.0029132208, -0.0017163929, 0.011742977, -0.0020405827, 0.06202555, 0.1921562, 0.021508468, -0.09311479) * inp_6_2_0; + result0 += M4(0.08258628, -0.15739617, 0.032765172, -0.054458193, -0.059486303, 0.03932351, 0.00085268443, -0.018396974, -0.045281533, 0.8353495, -0.19662504, -0.14061503, 0.092955, 0.43550152, -0.17532475, -0.011303331) * inp_6_0_1; + result0 += M4(-0.21856928, 0.08050352, 0.03677221, 0.0651133, 0.06932937, 
0.0042430065, -0.042399313, 0.03919132, 0.18629305, 0.08669851, 0.05961686, -0.27594873, 0.18094176, -0.21195422, -0.028879004, -0.07385303) * inp_6_1_1; + result0 += M4(0.036994472, 0.01662979, -0.054696392, -0.10013999, -0.086165935, -0.028104296, 0.012374445, 0.030374156, 0.04777046, -0.09116055, 0.10015607, -0.17447135, 0.20724836, -0.09685017, -0.046217337, 0.014567777) * inp_6_2_1; + result0 += M4(-0.18870883, 0.24891973, -0.058342047, -0.102999404, 0.06289564, -0.04927099, -0.035229925, -0.027459668, -0.11389219, 0.281945, -0.042358447, -0.08145434, 0.09102512, 0.18765716, -0.03359404, -0.12243276) * inp_6_0_2; + result0 += M4(0.2887588, 0.06335172, 0.05468212, 0.10598921, -0.02554402, 0.006700232, 0.008271227, -0.046788972, -0.6011407, 0.043958507, -0.12628426, 0.022061458, -0.08201852, -0.053557277, -0.12616639, -0.11289462) * inp_6_1_2; + result0 += M4(-0.0662575, 0.025483217, 0.06843246, -0.057116106, -0.010014512, 0.03863418, 0.047006205, 0.038808186, -0.32513607, 0.028112732, 0.061865132, 0.052737467, 0.12510483, 0.06065424, 0.0061625503, -0.08212802) * inp_6_2_2; + result1 += M4(-0.05537547, -0.10584454, 0.17445882, 0.039320838, 0.029352712, 0.10009384, 0.018403254, -0.008451422, -0.010438245, -0.049993772, 0.013073953, 0.0012875921, -0.14018881, -0.16595082, 0.0052606612, -0.002602665) * inp_6_0_0; + result1 += M4(0.5974986, 0.38695624, 0.16659424, 0.21760575, 0.16671526, -0.064696155, 0.14363948, -0.07474475, -0.041908372, -0.08203296, -0.118649796, -0.017634304, -0.41561303, 0.008651487, -0.25636798, -0.017652659) * inp_6_1_0; + result1 += M4(-0.14412911, -0.007872712, 0.015968226, -0.014418979, -0.20120674, 0.023706729, -0.09115236, 0.07184485, -0.31529373, -0.09372805, -0.093335286, -0.07609914, -0.3186875, 0.028608622, -0.04111354, -0.05754573) * inp_6_2_0; + result1 += M4(-0.039024632, -0.04611198, 0.056130063, -0.0019070219, -0.09471824, 0.04971225, -0.11604436, 0.034022447, -0.012728234, -0.18483748, 0.12125591, 0.07499227, 0.02772473, 
-0.2146635, 0.09928117, -0.010939701) * inp_6_0_1; + result1 += M4(-0.14313851, -0.26408833, -0.12528805, -0.2300533, -0.12326439, -0.056244265, -0.0924131, 0.0392229, -0.29384363, -0.31348163, 0.330936, 0.025901005, -0.19144477, -0.08315651, 0.044882346, 0.40910354) * inp_6_1_1; + result1 += M4(-0.13263476, 0.09399424, -0.18401755, 0.060563993, 0.20146129, 0.012537847, 0.19415396, -0.17056547, -0.036495067, -0.09367358, -0.025172954, -0.29933095, 0.13618505, 0.026404368, -0.046856225, 0.18194523) * inp_6_2_1; + result1 += M4(-0.10728768, -0.040524904, -0.0256625, -0.026695987, 0.037023287, -0.15622687, 0.029011453, -0.069045186, 0.018591557, 0.048545625, 0.10051945, 0.07578343, 0.006115621, -0.26347432, -0.13156949, -0.012525573) * inp_6_0_2; + result1 += M4(-0.036134083, 0.029875446, 0.0019903486, -0.06975292, -0.023380252, 0.07665267, -0.07290828, 0.09365051, -0.07313285, 0.09349326, 0.37566623, -0.46782276, -0.0868402, -0.0695731, 0.035579726, 0.17563824) * inp_6_1_2; + result1 += M4(0.0058661443, -0.05787653, -0.0070689344, 0.057756037, 0.016281847, 0.000754575, -0.01613972, 0.09095201, 0.010673997, 0.07296203, 0.06352837, -0.46791345, 0.05497706, 0.073918924, -0.10419392, 0.06697151) * inp_6_2_2; + result2 += M4(-0.30791253, 0.054929286, -0.11619131, 0.20885357, -0.003551234, -0.011490099, 0.010738854, -0.0023565886, -0.04622841, 0.117540166, -0.020852482, -0.05393148, 0.26176038, 0.10078302, 0.019561853, -0.41914457) * inp_6_0_0; + result2 += M4(-0.19308683, -0.05961244, 0.14863037, -0.06427681, -0.07715048, -0.03101713, 0.005530758, -0.14717019, -0.17455803, 0.012907689, 0.09311841, 0.13581964, -0.044078086, 0.053658266, -0.15522219, -0.013672103) * inp_6_1_0; + result2 += M4(0.04293136, 0.029523639, -0.071078524, -0.26523545, 0.094132036, 0.032061774, -0.037358224, 0.09966991, 0.111482225, -0.02270647, 0.12524423, -0.11504007, -0.0038967214, 0.06406252, 0.11020652, -0.11673919) * inp_6_2_0; + result2 += M4(0.15995932, 0.01628486, -0.10748732, -0.08356608, 
0.021173634, 0.064193584, 0.008848415, -0.072128735, 0.044811167, 0.24923256, 0.2170841, -0.13928747, 0.15425721, -0.02810852, 0.04772339, -0.051768236) * inp_6_0_1; + result2 += M4(0.17703275, -0.10982029, -0.115383305, 0.44708803, -0.004119606, 0.025502378, 0.032340597, 0.17390364, -0.41836554, -0.08544096, 0.19394878, -0.2471876, -0.20595935, -0.2773386, 0.005247382, -0.19914868) * inp_6_1_1; + result2 += M4(0.24976474, 0.22905642, 0.24719793, -0.14712569, 0.020671936, -0.02012602, 0.009262729, -0.09029471, 0.4186103, -0.086724505, 0.25843936, -0.17639849, 0.0411741, -0.052974965, -0.007161358, -0.07557877) * inp_6_2_1; + result2 += M4(-0.08693387, 0.088292375, -0.010787665, -0.05368293, -0.0497267, -0.054036945, 0.03659949, 0.01648016, 0.2731276, 0.20715119, 0.084664635, -0.4510117, 0.12420691, 0.1324471, 0.024092857, -0.015220077) * inp_6_0_2; + result2 += M4(0.004188181, -0.07960533, -0.012280582, 0.014133065, -0.00037244317, -0.0054945317, -0.0008293582, -0.08630114, -0.17743078, 0.3379718, 0.0042328853, 0.11659004, -0.0779983, -0.036052812, 0.06280147, -0.07078268) * inp_6_1_2; + result2 += M4(-0.12103991, -0.13086842, -0.0691693, 0.02434762, -0.014101179, 0.016723646, -0.06618713, 0.11079065, 0.36945522, 0.08123133, 0.059545223, -0.16160169, -0.18173711, -0.1070442, 0.08762668, 0.07940788) * inp_6_2_2; + result3 += M4(0.0038555262, -0.035539962, -0.15305716, -0.040686075, -0.001395411, -0.006230044, 0.08067099, 0.02537404, 0.020188874, 0.037195217, -0.0063610673, 0.018840492, 0.04581549, -0.2953481, 0.16795851, 0.018277468) * inp_6_0_0; + result3 += M4(0.044500068, 0.48384443, -0.251938, 0.31228992, -0.054366183, 0.09986723, -0.13791041, 0.12415033, 0.03818242, -0.075632244, 0.16462453, 0.05111858, -0.08858612, -0.32170576, 0.06191775, 0.017193083) * inp_6_1_0; + result3 += M4(0.06857752, -0.33082834, -0.13673152, -0.19575082, 0.039417002, -0.08244813, 0.0009284936, -0.11823014, -0.059374202, 0.026232705, -0.0029804094, 0.008301534, 0.096700616, 
0.046536308, 0.002709834, -0.029206563) * inp_6_2_0; + result3 += M4(-0.0071823034, 0.08439951, 0.18662809, 0.123422585, 0.07848613, -0.013321786, 0.08114353, 0.049146492, -0.014172599, -0.106093876, 0.43698654, 0.08134191, -0.1051863, 0.0103056645, 0.16959958, 0.101134695) * inp_6_0_1; + result3 += M4(0.2656892, -0.18195593, 0.5030563, 0.050045732, 0.029901233, -0.031708173, 0.06740759, 0.066785894, -0.21847509, 0.038321655, -0.059498433, 0.038515206, -0.03182428, 0.048759192, 0.025033671, -0.06781109) * inp_6_1_1; + result3 += M4(-0.24185222, -0.10268158, 0.059367534, -0.042547498, -0.10144291, 0.0710651, -0.041285533, 0.0139204, -0.06819188, -0.00238278, 0.014819355, 0.076350845, 0.32023802, 0.020679062, 0.09375915, -0.09526196) * inp_6_2_1; + result3 += M4(0.08537252, 0.0057462896, -0.12523384, 0.13038383, -0.017883396, -0.02239685, -0.098460004, 0.002886984, 0.10167507, 0.0015704846, -0.017546427, 0.060097456, -0.022908391, 0.027439581, 0.29503915, -0.043815017) * inp_6_0_2; + result3 += M4(-0.051369827, 0.040966537, -0.26092237, 0.101121426, -0.035460584, -0.05978096, 0.03460531, -0.24298002, 0.53973204, -0.07241015, 0.07205192, 0.5240865, -0.05638357, -0.02844116, 0.008436423, -0.23450613) * inp_6_1_2; + result3 += M4(-0.10621907, 0.027842356, -0.049255498, -0.42702007, 0.06065241, 0.037673924, 0.015880253, 0.092496835, -0.28590575, 0.028880058, 0.023324812, 0.5276617, -0.08194627, -0.040459733, 0.009024029, -0.16347758) * inp_6_2_2; + result4 += M4(-0.0036340184, -0.19224647, 0.122025914, 0.044550303, -0.03944944, 0.00025841105, -0.034183946, 0.030966835, -0.036516797, -0.13000216, 0.0123277595, -0.041757237, -0.11440482, 0.06848479, 0.014669274, -0.0016524862) * inp_6_0_0; + result4 += M4(0.3280191, -0.28087407, -0.53217494, -0.14237612, 0.10763859, -0.0402313, -0.017866354, 0.036505796, 0.043750647, 0.06835897, -0.036990255, -0.06274793, -0.40183654, 0.4600486, 0.4631865, -0.0560154) * inp_6_1_0; + result4 += M4(-0.0034581015, 0.25419223, 0.13969666, 
-0.024186742, -0.036613047, 0.014686457, 0.03856947, -0.051897224, 0.049743965, 0.024846803, -0.07048087, -0.061835982, -0.016084349, 0.031234695, 0.051300075, -0.16437761) * inp_6_2_0; + result4 += M4(-0.034397483, 0.0024732144, -0.08201674, -0.019793672, 0.06486806, -0.022493416, -0.06811711, -0.13785273, -0.1567208, -0.05678462, 0.20837055, 0.046358436, -0.018036349, 0.18258855, 0.16738671, 0.05476182) * inp_6_0_1; + result4 += M4(-0.092339724, 0.18858752, 0.034547217, 0.11541137, -0.11787786, 0.07035984, 0.06415264, 0.07906819, 0.06359256, -0.2824897, -0.14351916, -0.0854402, -0.17815758, 0.063458644, -0.072746515, -0.096280366) * inp_6_1_1; + result4 += M4(-0.0557854, 0.020173848, -0.003971126, 0.056449562, 0.082830966, -0.024724817, 0.015091682, 0.025925938, 0.13794515, -0.12205794, -0.08458665, -0.34304833, 0.09521836, 0.10625166, -0.07884946, -0.3412227) * inp_6_2_1; + result4 += M4(0.18805267, -0.038490828, -0.025904175, -0.008483034, -0.047314472, 0.06923969, 0.040638484, 0.029876344, 0.1917949, 0.0509993, 0.081868425, 0.02926477, -0.09164984, -0.011828185, -0.10790521, 0.080319576) * inp_6_0_2; + result4 += M4(-0.05598666, 0.072711565, 0.10128454, 0.016907338, -0.059954006, -0.105596386, -0.06877422, -0.05849031, 0.5586191, 0.02948197, 0.08816101, 0.09812052, -0.11868488, -0.28614712, 0.15188959, -0.11080101) * inp_6_1_2; + result4 += M4(-0.17027429, -0.025383769, 0.1169771, -0.012234105, 0.054236878, 0.041374665, 0.041269615, 0.04356989, 0.23114279, -0.02649456, -0.17426552, -0.080268, -0.18888266, -0.03767309, 0.033702627, -0.2538175) * inp_6_2_2; + result5 += M4(-0.004918348, 0.19905144, 0.05262634, 0.069202065, -0.039908826, 0.0833353, 0.026864378, 0.10965801, 0.005247605, 0.0055892146, -0.11265625, 0.016843623, 0.023402216, -0.07743773, -0.22316042, -0.35602027) * inp_6_0_0; + result5 += M4(-0.040287238, -0.33916506, -0.16253309, 0.2871137, 0.008959897, 0.12299351, -0.043768045, -0.003122143, -0.11948717, 0.14991072, -0.006827206, -0.08529128, 
-0.10718264, 0.06527513, 0.09372023, -0.38260207) * inp_6_1_0; + result5 += M4(0.20020314, -0.008048079, -0.18600494, -0.08164018, -0.02846727, -0.1514154, 0.022539655, -0.061827984, -0.050332196, -0.029327614, 0.17235793, 0.017677268, -0.16149905, -0.07287796, -0.06718061, -0.01375314) * inp_6_2_0; + result5 += M4(0.118015416, -0.086825274, 0.07507014, -0.11611629, -0.011043244, -0.17142507, 0.029793518, -0.17836748, -0.0017105595, -0.110007964, -0.17448409, 0.04322612, 0.026848376, -0.2228803, -0.23631029, 0.23014198) * inp_6_0_1; + result5 += M4(0.109121315, -0.30629945, 0.044800602, 0.00031975657, -0.003881907, -0.05468688, 0.008386701, -0.00925419, -0.38520077, 0.14721003, 0.019947473, 0.021119498, -0.1846955, -0.09388212, -0.107238755, -0.007386925) * inp_6_1_1; + result5 += M4(-0.2803955, 0.07304927, -0.08881065, -0.13521475, -0.03575965, 0.12258199, -0.042164072, 0.16698818, -0.05332283, 0.0064989896, 0.19709145, -0.061822847, 0.09997842, 0.11037973, -0.082862906, 0.021769479) * inp_6_2_1; + result5 += M4(-0.017753689, 0.7216013, -0.040688187, -0.0039997245, 0.02397351, 0.1162306, 0.008456707, 0.06458571, 0.098280385, -0.01937478, -0.3917561, -0.248364, -0.026535183, 0.40029076, -0.08676536, 0.10481424) * inp_6_0_2; + result5 += M4(0.038752086, -0.19745655, 0.07278577, 0.10173609, -0.0028424757, -0.02649189, 0.056131862, 0.050097574, -0.13234589, 0.15139034, -0.07750276, -0.4894782, -0.0868365, -0.16052026, 0.08192918, 0.11276872) * inp_6_1_2; + result5 += M4(-0.13758172, 0.18617037, 0.21518631, -0.043789245, 0.07482252, -0.04646531, -0.072005406, -0.14747803, -0.19270235, 0.05757941, 0.033084534, -0.19923544, 0.0076074735, -0.13343146, 0.04625468, 0.16586748) * inp_6_2_2; + result6 += M4(0.3692552, 0.18700288, 0.046469208, -0.83745253, 0.16609484, -0.023618586, 0.047567476, 0.25111392, -0.052940432, 0.020116925, -0.035472732, 0.12248557, -0.15619072, 0.07367641, -0.014206049, 0.35193592) * inp_6_0_0; + result6 += M4(-0.17344889, -0.035080187, 0.016237963, 
0.24028131, -0.061824355, 0.020947462, -0.013190794, -0.1326595, 0.13987835, -0.061027236, 0.044086207, 0.13641013, 0.012129531, 0.03541953, 0.18398593, 0.25241706) * inp_6_1_0; + result6 += M4(0.45027927, -0.13119091, 0.14480837, -0.3900522, -0.039011486, -0.032457303, -0.041927848, -0.1141818, -0.048385255, 0.036863778, -0.09468647, -0.14622603, -0.017622251, 0.055058237, -0.07404342, -0.08019119) * inp_6_2_0; + result6 += M4(-0.5126082, 0.0250307, 0.05720017, 0.34627405, -0.08955548, 0.07276102, -0.06251175, -0.3268237, 0.067469105, 0.123653635, 0.03377985, 0.48476285, 0.05552931, -0.053781208, -0.0002798505, 0.2947853) * inp_6_0_1; + result6 += M4(-0.015389773, -0.031241164, -0.13403958, 0.048113085, 0.0054829135, -0.115541756, 0.04782047, 0.12844259, 0.010296193, -0.17678712, -0.071923204, -0.07861362, 0.007796647, -0.21490929, -0.08351756, -0.02593395) * inp_6_1_1; + result6 += M4(-0.44125608, 0.17373408, -0.07024419, 0.53966373, -0.028802782, 0.059344836, 0.021555273, 0.15413366, -0.100253135, 0.10107631, -0.05112034, 0.076062314, -0.012534987, -0.017741298, -0.07552009, -0.024660543) * inp_6_2_1; + result6 += M4(0.2836132, -0.01932003, -0.0136915445, -0.5124644, 0.044597175, -0.033958435, 0.007405325, 0.11399435, 0.01970318, -0.028952098, 0.02431384, -0.03813878, 0.092619576, 0.17260937, 0.06430765, 0.00641455) * inp_6_0_2; + result6 += M4(-0.11700236, -0.12621722, 0.0036962251, 0.340042, 0.009588825, 0.059699494, -0.07709355, -0.1449235, 0.019256035, -0.19967644, 0.10564262, -0.056742966, -0.040997576, -0.047084644, -0.010661702, -0.0022625392) * inp_6_1_2; + result6 += M4(0.13365895, 0.0034713922, -0.04030902, 0.024485944, -0.023411265, -0.024093764, 0.07691721, 0.05109017, -0.080172874, 0.0145921325, 0.06321368, 0.29013556, -0.05296626, 0.039180975, -0.09404607, 0.102516964) * inp_6_2_2; + result7 += M4(-0.0142698195, -0.35068092, 0.09134653, 0.100349456, 0.027457558, -0.25371256, -0.05916039, -0.047232125, 0.06380676, -0.068687566, -0.010155156, 
0.042301953, 0.09267003, 0.14634989, 0.0026647695, -0.0049481075) * inp_6_0_0; + result7 += M4(-0.09915805, 0.08602638, 0.1746032, 0.037031297, -0.02763648, 0.07252486, -0.09003767, -0.023388645, -0.061541844, 0.2054888, 0.2198256, -0.10380363, 0.00073509815, 0.01588891, -0.115924574, -0.07018012) * inp_6_1_0; + result7 += M4(-0.05837695, -0.17103878, -0.05001107, -0.03663052, -0.017222203, 0.1871162, 0.1700977, 0.01788191, 0.0024174396, -0.1487449, -0.03310217, -0.014056119, 0.14408614, -0.1415077, -0.45177191, 0.05164154) * inp_6_2_0; + result7 += M4(-0.084672846, 0.12466793, -0.1432201, -0.3398579, 0.010911488, -0.093502656, 0.00756657, 0.17970008, 0.1492752, 0.21295321, -0.19132859, 0.5085314, -0.19924381, 0.17707938, 0.02740011, 0.46549532) * inp_6_0_1; + result7 += M4(0.41169757, 0.5967105, 0.026373118, 0.07418247, 0.09373894, 0.21151355, 0.05413694, -0.099333405, -0.2888301, 0.05785326, 0.14055033, -0.11988609, -0.269145, -0.048865616, -0.024069898, 0.04433855) * inp_6_1_1; + result7 += M4(0.097007565, 0.18792208, 0.047719333, -0.02351276, -0.023761727, -0.12780339, -0.061044425, 0.00915271, -0.07568198, -0.119766876, 0.17411695, 0.15572698, -0.2480675, 0.0790848, -0.060102552, 0.06784786) * inp_6_2_1; + result7 += M4(0.14531173, -0.2054003, -0.7614083, -0.23984447, -0.026955362, 0.33937895, 0.101706505, -0.15278089, -0.038381867, -0.18224654, -0.52462786, 0.4673273, -0.069073536, -0.33421674, -0.09704695, 0.10429694) * inp_6_0_2; + result7 += M4(-0.2850001, 0.25573727, 0.15921137, 0.0010903815, -0.12251482, -0.260288, 0.033454634, 0.098720774, 0.92828685, 0.06440317, -0.24102682, 0.09411055, -0.3397009, 0.22110723, 0.09996403, -0.020825688) * inp_6_1_2; + result7 += M4(-0.06272972, -0.4137962, 0.37996432, 0.38542953, 0.08703189, -0.08905659, -0.18196754, 0.024184512, 0.25047547, -0.016506394, 0.028860852, 0.031100653, -0.11408193, 0.111942284, 0.14682114, 0.04318035) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 
inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.014353114, -0.11275372, 0.017101286, 0.04500403, -0.028307123, -0.027228843, 0.03751128, -0.04944511, -0.06487342, -0.111867905, 0.124301545, -0.045297578, 0.021065714, 0.0335565, 0.055671465, 0.0467294) * inp_7_0_0; + result0 += M4(0.052967153, 0.032695595, -0.0132920565, 0.053149506, -0.03851454, 0.121283025, 0.003841687, 0.053148795, 0.17063406, 0.15267807, 0.041710112, -0.15338065, -0.04026101, 0.005603595, -0.052845787, -0.025693765) * inp_7_1_0; + result0 += M4(-0.028077211, -0.027225709, -0.0051577147, -0.11659893, -0.01417866, -0.00052974204, -0.04348931, 0.08966539, 0.006414392, -0.06365352, 0.039985918, -0.24214837, 0.03032394, -0.0004049964, -0.028789049, 0.026453212) * inp_7_2_0; + result0 += M4(-0.046294864, 0.22096519, -0.021905879, -0.18977551, 0.0692849, -0.079159915, 0.019926084, 0.117099494, -0.18453087, -0.17593549, 0.004554182, 0.05615213, 0.09616826, 0.22854215, -0.02020335, 0.07491898) * inp_7_0_1; + result0 += M4(0.053866386, -0.11384861, -0.03276426, 0.013385152, -0.08028509, 0.5418343, -0.056845386, 0.40829384, -0.13290142, 0.27085716, -0.040069412, 0.28983802, -0.024209587, -0.25874156, 0.032672346, -0.14334495) * inp_7_1_1; + result0 += M4(0.10088695, -0.024727784, 0.034140524, 0.078566186, 0.001957661, 0.06481202, 0.18895929, 0.079009496, -0.134042, -0.048751436, 0.027198179, 0.18978055, -0.08585495, 0.08180948, -0.027686188, -0.008015847) * inp_7_2_1; + result0 += M4(0.03346555, 0.0151627585, -0.045812663, 0.07184466, 0.2848006, 
0.05750056, 0.018815454, 0.05078782, 0.14931768, -0.018108085, 0.08897964, -0.020083474, -0.101658605, -0.2438199, 0.038232405, -0.0028725616) * inp_7_0_2; + result0 += M4(-0.10693435, 0.008253324, 0.004617819, 0.03426456, 0.43525624, 0.25294906, 0.054209054, 0.04168832, 0.1367255, -0.076938614, -0.10859612, -0.018767882, 0.014070651, 0.15839024, -0.022569476, 0.064987905) * inp_7_1_2; + result0 += M4(-0.033445988, 0.01778602, 0.034630578, -0.029133061, 0.16804501, -0.03651849, 0.03725318, 0.02294806, 0.09204603, 0.046556253, -0.08887389, 0.028313152, 0.06748311, -0.0025560146, 0.01351426, -0.01065418) * inp_7_2_2; + result1 += M4(0.040308073, 0.04505658, -0.028936354, 0.05357192, 0.069005154, -0.022885451, -0.04451302, -0.03266394, -0.015595519, 0.041988354, 0.041710246, 0.06770739, -0.03120778, -0.055994637, 0.052312985, -0.032743722) * inp_7_0_0; + result1 += M4(0.016969742, -0.048291955, -0.071368635, 0.047664452, -0.05572528, -0.10641916, 0.11160313, -0.014072517, 0.34282428, -0.2082821, 0.14904083, -0.14416885, -0.090661965, -0.061563205, -0.07512007, 0.06139925) * inp_7_1_0; + result1 += M4(-0.19702905, 0.030960094, -0.05458272, -0.0754698, -0.2766572, -0.01714257, -0.26215035, -0.17854984, -0.12216617, 0.042103052, -0.065890305, 0.16145104, 0.3728696, 0.025717204, 0.038364805, -0.06061092) * inp_7_2_0; + result1 += M4(-0.03357625, -0.061053906, 0.0053991075, -0.06292604, 0.11292377, 0.11852541, 0.025336754, 0.023148049, 0.0272661, 0.009107645, -0.11430631, 0.0349591, 0.03963782, 0.04256717, -0.1300768, 0.060850278) * inp_7_0_1; + result1 += M4(-0.095392935, -0.027390571, 0.015524171, 0.054022916, -0.009220926, -0.15404417, -0.19279191, -0.07210376, -0.06588157, 0.14132205, -0.022582307, -0.09584702, -0.0476393, 0.057289902, 0.028087042, -0.078038074) * inp_7_1_1; + result1 += M4(0.22010638, 0.025682257, 0.13692182, 0.11521366, -0.51115274, -0.043630525, -0.37905124, -0.7190254, -0.014344466, -0.14322762, 0.042048674, -0.36055204, -0.2126895, -0.10081747, 
0.028942827, 0.04278908) * inp_7_2_1; + result1 += M4(0.034696974, 0.010013742, 0.033755627, -0.020153072, 0.0029146264, -0.16775467, 0.022721024, 0.022360275, 0.029730726, -0.15672398, 0.030952197, -0.13791305, -0.0092123365, 0.020230466, -0.025414525, 0.0035857607) * inp_7_0_2; + result1 += M4(0.02151872, 0.079521835, 0.051630046, -0.15491311, 0.03575967, -0.25270543, -0.30480486, 0.46502337, 0.067274645, 0.12940463, -0.053315967, 0.18826471, 0.08342076, -0.081227385, 0.105936, 0.07108182) * inp_7_1_2; + result1 += M4(-0.04203556, 0.03520508, -0.043292966, 0.03562582, 0.0074006454, -0.014183344, -0.08961154, -0.43540156, -0.15724301, -0.051220912, -0.12103146, 0.18422587, -0.038501363, 0.007947142, -0.02641826, -0.07334442) * inp_7_2_2; + result2 += M4(-0.03443398, 0.0077519407, -0.089413844, 0.17306937, 0.01868346, 0.007816045, 0.04195766, -0.023894185, -0.043585904, -0.07678083, -0.045774665, -0.026052441, 0.04755804, -0.0015195918, 0.012173942, -0.19940287) * inp_7_0_0; + result2 += M4(-0.01257784, 0.08401328, 0.042236045, -0.102779076, -0.29758537, -0.0030091677, -0.050751425, 0.12300386, -0.05593892, 0.07293752, -0.04916725, -0.1674086, -0.0052278875, -0.09500247, -0.09886488, 0.36195952) * inp_7_1_0; + result2 += M4(0.04362559, -0.06273948, 0.023371696, 0.101177715, 0.0863567, -0.04032845, 0.1717006, 0.047807705, 0.106685065, -0.010567523, 0.049855568, 0.1358614, -0.016453585, 0.0739066, 0.04314656, -0.17515093) * inp_7_2_0; + result2 += M4(0.13032791, 0.1103069, 0.0876338, -0.1359878, 0.10360484, 0.057464816, -0.074109405, 0.05356139, 0.026399983, -0.09806969, 0.062716335, -0.018326327, 0.09460351, 0.029219367, 0.09259965, 0.072329156) * inp_7_0_1; + result2 += M4(-0.20484379, -0.16170463, -0.011605044, 0.056872673, -0.11182432, 0.21517394, 0.010260593, 0.40527734, 0.04237112, 0.028367715, -0.050859418, 0.3298651, 0.03210299, 0.05331277, 0.06977549, -0.18202697) * inp_7_1_1; + result2 += M4(-0.0368897, 0.016391978, -0.024294581, -0.009350654, 0.1955551, 
-0.028641196, 0.499472, -0.023318058, -0.09908497, 0.20021608, 0.15166949, -0.06593413, -0.093563184, -0.01030146, -0.16426736, 0.1239057) * inp_7_2_1; + result2 += M4(-0.055037364, -0.021643072, -0.021387717, -0.029731398, 0.094444685, -0.07963394, 0.021096926, -0.0284398, 0.15600166, 0.051011793, 0.018822383, -0.20377164, -0.06093815, -0.122096315, -0.09575318, 0.07561008) * inp_7_0_2; + result2 += M4(0.102123156, -0.03031301, 0.066700675, -0.020931395, -0.16889022, -0.1305484, 0.08320382, 0.21251659, -0.03229301, -0.16032566, -0.14695112, 0.08483938, 0.00030656724, 0.1682771, -0.037963215, -0.019027025) * inp_7_1_2; + result2 += M4(0.034280032, 0.062147725, -0.044607468, -0.10986789, -0.045719683, -0.041917246, 0.2606613, 0.23340343, -0.0060716677, -0.011685313, 0.09870094, 0.10358789, 0.053007178, -0.09497951, 0.14624749, -0.018423423) * inp_7_2_2; + result3 += M4(-0.023918586, 0.08953427, 0.01771276, 0.05539354, 0.0028634146, 0.009650554, 0.18742946, -0.013471182, 0.009523058, 0.20777467, 0.31837824, 0.12164815, -0.027161406, -0.12503518, 0.053555198, -0.08024025) * inp_7_0_0; + result3 += M4(-0.010696416, -0.20303713, -0.07494842, -0.06720856, 0.036300484, 0.06688092, -0.23665178, -0.028879825, 0.07920989, 0.06684934, -0.09307057, -0.12861334, -0.016808033, 0.068868615, 0.016922612, 0.0935384) * inp_7_1_0; + result3 += M4(0.040408652, -0.026042184, -0.042566612, -0.13783605, -0.041067638, 0.04742047, -0.08538231, -0.12444389, 0.020503249, 0.013062706, -0.16142748, 0.13985167, 0.001934984, 0.14903793, 0.07425482, -0.05194177) * inp_7_2_0; + result3 += M4(-0.021580713, -0.052124616, 0.25143862, -0.08356271, -0.02948785, 0.056538586, -0.19342871, -0.03082576, 0.06952971, -0.024033487, -0.20058027, -0.070293054, -0.025813319, 0.1556333, 0.06812163, 0.007927993) * inp_7_0_1; + result3 += M4(-0.09415238, 0.0819948, -0.020783098, -0.061048, 0.031241082, -0.25082436, 0.17802086, 0.11500772, -0.032032706, -0.017166939, 0.17285053, 0.10988556, -0.0014609772, 
-0.12550686, -0.32190156, -0.12481579) * inp_7_1_1; + result3 += M4(0.026642501, 0.0027076115, -0.0127527015, -0.030659534, -0.23827177, -0.08147645, -0.06555366, -0.0722888, -0.109351926, 0.037317634, -0.0675982, 0.11558462, 0.049270067, -0.11005517, 0.03807277, 0.029940536) * inp_7_2_1; + result3 += M4(0.058748785, -0.05442449, -0.15973112, 0.064877376, -0.034439556, -0.034699302, 0.22719848, -0.111805916, -0.06498236, 0.010337431, -0.2207168, 0.15086775, -0.0013910768, 0.020652262, 0.047396146, -0.18456744) * inp_7_0_2; + result3 += M4(0.07299843, 0.063161835, 0.09055556, 0.073410906, -0.2721035, -0.089366235, -0.19288264, -0.4911799, -0.2704215, -0.098629974, 0.18357053, -0.31222442, 0.16648315, -0.0030768674, 0.115959756, 0.07765713) * inp_7_1_2; + result3 += M4(-0.07566839, 0.06178913, -0.020680057, 0.20640337, 0.6270522, -0.021944718, -0.09193208, -0.60390484, 0.30230644, -0.07720848, 0.04565392, -0.28929085, -0.12785488, -0.0036496334, -0.02822165, 0.26953188) * inp_7_2_2; + result4 += M4(0.0023062807, -0.034817286, -0.042075228, 0.06544454, 0.005506302, -0.0864455, -0.1226953, -0.013349928, 0.1547137, -0.11107969, -0.011432964, 0.058164947, 0.0428984, 0.043311194, 0.016129535, 0.04118873) * inp_7_0_0; + result4 += M4(-0.1534756, 0.16967072, 0.11172404, -0.11816128, 0.086648315, -0.1714072, 0.06653684, 0.089376345, 0.14469789, -0.21376182, 0.025603222, -0.05220291, 0.06091292, 0.052578565, -0.11138733, 0.0048681847) * inp_7_1_0; + result4 += M4(-0.041845363, 0.013118367, 0.024128294, 0.014151567, -0.08004441, 0.03486238, -0.24785793, 0.15483975, 0.05084481, -0.19106285, -0.11259754, 0.018545493, -0.008554448, -0.14740153, 0.057274133, 0.0051899627) * inp_7_2_0; + result4 += M4(0.064041376, -0.032968413, 0.013469658, -0.08303931, 0.1341178, 0.11964721, -0.009992949, 0.12108774, 0.09818911, 0.14065015, -0.07883844, -0.110692464, -0.033610746, 0.037767347, 0.034289274, -0.081328794) * inp_7_0_1; + result4 += M4(-0.08536015, -0.046906322, -0.05603467, 
0.15344562, -0.152151, 0.2835985, 0.08837327, 0.24121024, -0.090531245, 0.29047784, -0.028336503, -0.0079366965, 0.0021427502, -0.09222166, 0.082214415, 0.049104534) * inp_7_1_1; + result4 += M4(-0.03418688, -0.027119642, -0.033249117, -0.04254291, -0.11109964, 0.014894068, -0.2578382, 0.6063039, 0.0059784884, 0.12751795, -0.082763284, 0.13159256, 0.008276564, 0.05974327, -0.024297485, 0.05277847) * inp_7_2_1; + result4 += M4(-0.03444889, -0.017802611, 0.0074504083, 0.016012343, -0.15777689, 0.03241681, 0.013117755, -0.01719593, 0.036037434, -0.03379203, 0.102202065, -0.02253011, -0.06792619, 0.0014595084, -0.017348377, 0.009831464) * inp_7_0_2; + result4 += M4(0.1639479, -0.045117706, -0.03546795, -0.08156594, -0.45054284, 0.07469492, 0.011867304, 0.018695822, -0.49507293, -0.03135175, 0.013335458, 0.1188135, 0.07899112, 0.006609462, 0.099146456, -0.042408854) * inp_7_1_2; + result4 += M4(0.12333911, 0.026525073, 0.022529328, 0.07107176, -0.24384674, 0.10793493, -0.17994872, -0.13251431, 0.06154726, -0.015966468, 0.06687427, -0.07726767, -0.040318996, 0.042070385, -0.11340186, -0.038753133) * inp_7_2_2; + result5 += M4(0.012673467, -0.037103087, 0.050768357, 0.11804936, -0.019557068, 0.0804737, -0.042042516, 0.05063627, -0.012027864, -0.1778315, 0.018416423, 0.10421972, 0.03836791, -0.038451895, -0.02987596, -0.092936814) * inp_7_0_0; + result5 += M4(0.081070006, 0.21753052, -0.039890427, -0.050826468, 0.05336978, 0.025667759, 0.035597946, -0.0027159257, 0.13079563, 0.077491805, 0.0008582202, -0.027367916, -0.03181248, -0.19372894, -0.03209458, 0.13858509) * inp_7_1_0; + result5 += M4(-0.090944424, -0.2096128, 0.09019298, -0.031379037, -0.13405223, -0.0067626154, 0.1769988, 0.054293416, -0.1751145, -0.042708788, 0.09452406, -0.014315755, -0.043122165, 0.13656834, 0.03425129, 0.014349805) * inp_7_2_0; + result5 += M4(0.041083314, 0.1534725, 0.023191346, -0.10281753, -0.06915832, -0.06962649, 0.0956159, -0.058003347, 0.0382738, 0.06731591, 0.032283228, -0.11744953, 
0.014508298, -0.059293862, -0.13243897, 0.061025135) * inp_7_0_1; + result5 += M4(-0.141368, -0.050856274, -0.030658523, 0.17189708, 0.13174817, 0.0645548, -0.059649896, -0.02070111, 0.18805191, 0.028028676, -0.053158768, -0.09673214, -0.092923135, 0.24802732, 0.15580657, -0.10671394) * inp_7_1_1; + result5 += M4(0.09939962, 0.09758035, -0.024120683, 0.09566199, -0.60467446, -0.09358554, 0.3542098, 0.020203883, -0.13448891, 0.19609664, -0.05980421, -0.03988452, 0.136309, -0.2209743, -0.018121988, -0.05301252) * inp_7_2_1; + result5 += M4(-0.03687012, -0.18174249, -0.11188414, -0.02836825, 0.044762637, -0.24598104, 0.0068728975, 0.24393502, -0.09776831, -0.24554634, -0.015937854, 0.043758687, -0.005986967, -0.099301524, 0.18006183, -0.0048940037) * inp_7_0_2; + result5 += M4(0.010051847, 0.14913419, 0.04709535, -0.1599654, 0.011909533, -0.040965673, -0.005180561, 0.37368757, -0.056836154, 0.17044185, -0.0014325223, 0.16753975, 0.10263891, -0.12474947, -0.25155222, -0.048479144) * inp_7_1_2; + result5 += M4(0.036764596, -0.09817697, 0.007691489, -0.022019843, -0.2540071, -0.11688611, 0.33893287, 0.19115168, 0.060142547, -0.26031005, 0.049264375, 0.13124378, -0.13203354, 0.25323352, 0.065698855, 0.05051374) * inp_7_2_2; + result6 += M4(0.103523776, 0.02477652, 0.11931213, 0.22718367, 0.06380224, -0.06312115, -0.03342871, -0.4218613, -0.19583617, -0.110368855, -0.013944256, 0.12757345, -0.1519957, -0.09970155, -0.024198022, 0.14459626) * inp_7_0_0; + result6 += M4(-0.047426138, -0.0148957195, -0.042323805, 0.087921016, -0.1303865, 0.05344321, 0.00063070335, 0.1077284, 0.29951233, -0.08278956, 0.05315382, -0.36245754, 0.13688883, -0.0050035845, 0.007669434, -0.2535922) * inp_7_1_0; + result6 += M4(-0.13914482, 0.08349452, -0.013398495, -0.15577376, 0.30625576, 0.04390654, -0.14788996, 0.009021893, -0.18404761, 0.15880117, 0.028981408, 0.24488695, -0.0344917, 0.06377489, 0.0041787643, 0.09069907) * inp_7_2_0; + result6 += M4(-0.021672724, 0.10200765, -0.08164302, 
-0.29037845, -0.06524793, -0.022847952, 0.028325712, 0.2354771, 0.13164325, 0.038568657, -0.16452388, -0.19628757, 0.19386996, -0.03581283, -0.00604313, 0.050671853) * inp_7_0_1; + result6 += M4(0.035448324, -0.1123009, 0.09017061, -0.08369615, 0.1547177, -0.05313325, 0.13626438, 0.14329228, -0.03914897, -0.07970992, 0.031553738, 0.12308475, -0.021477817, 0.18625718, -0.056503914, 0.025862794) * inp_7_1_1; + result6 += M4(-0.01362803, 0.009873275, -0.021020252, 0.087704435, -0.14416143, 0.08732547, -0.14793603, -0.03519952, 0.08739808, -0.05324601, 0.07178301, -0.08709111, 0.20508981, -0.076404765, 0.04942568, -0.17588924) * inp_7_2_1; + result6 += M4(-0.013772979, -0.11576433, 0.01059106, 0.11937095, 0.0012364802, 0.097883895, -0.0006651487, 0.06130685, -0.103754304, 0.067012094, 0.044164915, 0.35208485, -0.21629731, 0.07848428, 0.012615492, 0.08878749) * inp_7_0_2; + result6 += M4(-0.015643293, 0.06297431, -0.04773868, -0.008664792, -0.011143935, 0.09854246, -0.055016216, -0.052518137, 0.05246791, 0.08729363, -0.17093359, 0.06510517, -0.11441792, -0.1609416, 0.06776908, -0.06430595) * inp_7_1_2; + result6 += M4(0.123950824, -0.051986836, 0.014396684, 0.012277637, 0.06813568, 0.23590678, -0.023414893, -0.58936876, -0.070839845, 0.008637937, 0.034731027, -0.33632293, -0.05807661, 0.012112994, -0.051097997, 0.16272677) * inp_7_2_2; + result7 += M4(0.03890071, -0.33123735, 0.07610937, 0.017791811, 0.0057243104, 0.026786948, -0.087388285, -0.01708201, -0.008149538, -0.25381488, 0.044889413, -0.04300029, 0.005804609, 0.2458334, -0.08152119, -0.11150984) * inp_7_0_0; + result7 += M4(0.0422852, 0.13573533, -0.06058061, -0.0424984, 0.03687254, -0.03310906, 0.09053876, -0.07896283, 0.10294674, 0.052148327, -0.058537725, 0.00015676564, -0.084710106, 0.0056222873, 0.12804465, 0.035081454) * inp_7_1_0; + result7 += M4(-0.042567257, 0.12327564, -0.035985358, 0.022775404, 0.03893252, 0.05088072, 0.25473788, -0.061396737, -0.15365401, 0.002246268, 0.022066768, -0.032394666, 
0.032087665, -0.11022627, 0.044275492, 0.042746745) * inp_7_2_0; + result7 += M4(0.020063348, 0.2125661, 0.049881417, 0.093660116, 0.120162055, -0.098703384, -0.0842956, -0.082464784, 0.08245367, -0.0054075294, 0.036755443, -0.18863225, 0.05575246, -0.24835603, -0.12517622, 0.21147853) * inp_7_0_1; + result7 += M4(-0.1254844, -0.016756577, 0.06075211, -0.07974918, 0.17144044, 0.20313495, -0.07901684, 0.1899529, 0.1122259, 0.1490667, -0.004221913, 0.12265247, -0.05538133, -0.13985953, 0.0050306907, -0.049673144) * inp_7_1_1; + result7 += M4(-0.08064654, -0.10558799, -0.0926085, -0.05734894, 0.05110601, -0.049914468, 0.20254362, 0.15950541, 0.14961079, -0.21021506, -0.043306883, -0.0031992765, 0.0018046714, 0.27162942, 0.07231483, -0.047220748) * inp_7_2_1; + result7 += M4(-0.03405335, -0.06100464, -0.14044772, 0.008790728, -0.22311267, 0.12704943, 0.315955, -0.07793368, -0.06166175, 0.27874878, 0.45222285, -0.21086659, -0.11326259, -0.001237944, 0.22471191, 0.10012642) * inp_7_0_2; + result7 += M4(0.08034098, -0.04164105, 0.109292865, 0.06862852, -0.9858028, -0.29458532, 0.005978831, -0.08900043, -0.35984895, -0.31873637, -0.04210668, 0.3260013, 0.25243136, 0.108902775, -0.15964879, -0.13984245) * inp_7_1_2; + result7 += M4(0.115727626, 0.06112435, -0.0116834, -0.007107361, -0.20668198, -0.0906514, 0.030455202, 0.09493923, 0.06987535, 0.31463626, -0.25152567, -0.05157696, -0.10789083, -0.058889717, -0.0033864905, -0.039781593) * inp_7_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 0), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 0), max(result3, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result4, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result5, V4(0.0))); + 
imageStore(out_image, output_base + ivec2(2, 1), max(result6, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 1), max(result7, V4(0.0))); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-2-ReLU) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND conv2d_1 +//!SAVE conv2d_2 +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_1_mul * texelFetch(conv2d_1_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(-0.02816354, -0.055914808, -0.005309126, 0.04302756); + V4 result1 = 
V4(-0.014681287, -0.016003639, 0.00277319, -0.0058796373); + V4 result2 = V4(0.02500318, 0.020994185, -0.031882454, 0.008797194); + V4 result3 = V4(0.02854713, 0.0019857346, -0.014389184, -0.0067033246); + V4 result4 = V4(0.0074750828, 0.03989044, -0.008352795, 0.023925535); + V4 result5 = V4(-0.0012237664, -0.00821828, -0.032822374, 0.015555121); + V4 result6 = V4(0.0007366013, 0.012672618, 0.030530484, -0.0013905298); + V4 result7 = V4(-0.00665594, 0.019364757, 0.016776288, 0.005514103); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.00973409, -0.2905453, 0.16804078, 0.03635058, 0.006616991, -0.0051788976, 0.13990617, -0.2115806, 0.03791847, -0.021446934, -0.021149958, -0.16244367, -0.00543431, -0.078437224, 0.07517865, -0.24875812) * inp_0_0_0; + result0 += M4(0.16061167, 0.7075375, 0.65901136, -0.003121915, -0.108868085, 0.032168996, -0.4784643, -0.22404712, 0.23408975, 0.1489741, 0.10012224, -0.24961211, 0.013702174, 0.056856558, 0.3949789, 0.05728903) * inp_0_1_0; + result0 += M4(-0.07653732, 0.058309093, -0.2743541, -0.21182717, -0.060219403, -0.45752004, -0.39590853, -0.16866995, -0.094204135, 0.022472931, -0.028624104, 0.036514435, 0.053413846, -0.02451724, 0.27651215, 0.15742646) * inp_0_2_0; + result0 += M4(0.002592745, -0.030824926, 0.12114033, 0.050930567, -0.04900121, 0.06812072, -0.104584135, -0.1769679, 0.055577897, -0.16978319, -0.051331874, 0.05407539, 0.087580524, -0.2494271, -0.15750952, -0.06727893) * inp_0_0_1; + 
result0 += M4(-0.22075485, -0.60167396, -0.11148448, -0.051743947, -0.035690382, -0.017755114, -0.1048373, -0.75410384, -0.0017477311, 0.79013854, 0.070787504, 1.113939, 0.42162004, 0.08894495, 0.0162932, -0.6922328) * inp_0_1_1; + result0 += M4(-0.041542415, -0.1072675, -0.1547168, -0.057783205, -0.18774375, -1.0897189, 0.22137026, 0.49475524, 0.16061123, 0.18809871, -0.09942451, 0.12167183, 0.18478668, 0.052944053, 0.008523406, -0.49077532) * inp_0_2_1; + result0 += M4(0.079150654, -0.09704456, -0.025152894, 0.0662591, -0.049504023, -0.061450716, -0.006600424, -0.17110133, -0.022903575, -0.04218302, -0.035543904, -0.16162673, -0.010834032, -0.17441283, -0.06410564, -0.010752595) * inp_0_0_2; + result0 += M4(0.00037973173, 0.041147046, -0.0467547, -0.018489948, 0.006920091, 0.10765793, -0.03490517, -0.03536748, 0.0046151318, 0.06889305, -0.23292892, -0.005253062, -0.04773103, -0.35578787, 0.29783678, -0.48508322) * inp_0_1_2; + result0 += M4(0.07547907, 0.048772506, -0.14922605, 0.017899437, -0.037430517, -0.08345768, -0.08171882, 0.11549391, 0.0005753293, 0.19681996, 0.0007395721, 0.13482398, 0.04092026, 0.25392926, 0.13197581, -0.02444149) * inp_0_2_2; + result1 += M4(0.026670206, -0.4946369, 0.3635779, -0.09936638, -0.23612276, 0.12949154, -0.19376677, -0.018545061, -0.042181347, -0.8171006, -0.11456052, -0.12682119, 0.25297365, -0.11276777, 0.29135993, -0.30411947) * inp_0_0_0; + result1 += M4(-0.18254642, -0.196034, -0.1642319, 0.09249603, -0.18092251, 0.16449213, -0.1416846, -0.031061044, -0.026164776, 0.036878493, 0.16753155, 0.2940041, 0.101618774, -0.027227087, -0.17554337, -0.10692067) * inp_0_1_0; + result1 += M4(0.03190994, -0.08537802, -0.05265426, 0.2876244, -0.226532, -0.110195614, 0.09589837, 0.20734823, 0.061036523, 0.06264236, -0.06855547, -0.2823261, -0.026292771, -0.0022096266, -0.03458269, 0.28914374) * inp_0_2_0; + result1 += M4(0.11070176, -0.26740578, -0.1026421, 0.4110956, 0.09973385, -0.08346745, -0.3098377, 0.01835725, 0.1627276, 
-0.052195985, -0.48610088, -0.011137913, -0.22427069, 0.19412372, 0.062320832, 0.072610706) * inp_0_0_1; + result1 += M4(-0.14468084, -0.11145455, 0.1275323, -0.013943981, 0.21764868, 0.08969234, -1.2398715, -0.032734215, 0.36903408, 0.31528226, -0.07379252, -0.0041661304, -0.16513638, 0.29776296, -0.2183875, 0.18277328) * inp_0_1_1; + result1 += M4(0.13366769, -0.19119081, 0.23958637, -0.054906853, -0.045737054, -0.36034152, 0.2197925, -0.13690129, 0.06692774, 0.104316145, 0.060143124, 0.36369458, 0.20639238, 0.13639095, 0.091172956, -0.2692958) * inp_0_2_1; + result1 += M4(0.018454649, -0.05970896, -0.12773207, -0.13395509, -0.13538544, -0.021243846, -0.29808754, -0.072587125, 0.04806527, -0.09977992, 0.14219216, 0.096854396, 0.28429163, 0.14802298, 0.29175624, 0.26465315) * inp_0_0_2; + result1 += M4(0.064868286, 0.12650129, -0.04001578, -0.19142, -0.15243354, 0.04739349, -0.17602153, 0.089925356, -0.009179498, 0.2031116, 0.031400472, 0.11040097, 0.09661687, 0.05683243, -0.25136912, -0.11845621) * inp_0_1_2; + result1 += M4(-0.006583343, -0.027446115, 0.052255236, -0.048547603, 0.04551308, 0.08371158, 0.06561082, -0.17494093, -0.08677734, 0.11848272, -0.09256678, 0.12511909, 0.03584318, -0.03873551, -0.033272453, -0.3697406) * inp_0_2_2; + result2 += M4(0.077423126, 0.16964856, -0.17045945, 0.13343857, -0.012152219, 0.007827578, -0.07009769, 0.017719552, -0.07333286, 0.04077868, -0.024390765, 0.12850142, -0.03029182, 0.118830204, 0.1101359, -0.040818922) * inp_0_0_0; + result2 += M4(0.04737959, -0.57087344, 0.41235384, 0.1218992, -0.11092868, 0.030822208, 0.14311466, -0.092787445, 0.0027061475, -0.23113571, -0.29040268, 0.031662967, 0.04665202, -0.2214472, 0.124013655, 0.04762459) * inp_0_1_0; + result2 += M4(0.109790795, -0.13166402, -0.10937001, 0.13497192, -0.09461978, 0.11224206, -0.13746579, -0.210441, -0.058519382, 0.07024931, 0.058509335, 0.0596217, 0.057765707, 0.1522484, -0.112002224, -0.17201875) * inp_0_2_0; + result2 += M4(-0.23446816, -0.012046481, 
-0.2965843, 0.02298828, -0.019495957, -0.014813968, -0.07092402, -0.036055468, -0.017873934, 0.111397855, 0.09068365, -0.013072809, -0.024324076, -0.12630874, -0.12351092, -0.026566792) * inp_0_0_1; + result2 += M4(-0.0441673, 0.6080127, -0.4925612, 0.17336337, -0.21843402, 0.6022208, -0.89766985, -0.31109822, -0.01132926, -0.38773924, 0.4651305, 0.38577083, 0.20481502, 0.07963986, 0.17493346, 0.22013973) * inp_0_1_1; + result2 += M4(0.17083597, 0.12362538, -0.27829507, -0.1323653, -0.46952274, 0.45709655, -1.3564483, -0.09467831, 0.109629124, 0.09952558, -0.1851101, -0.06606823, 0.093976825, -0.063372426, -0.1879661, 0.08313608) * inp_0_2_1; + result2 += M4(-0.03973812, -0.031842444, 0.093453266, -0.04741993, -0.039069645, -0.054418374, -0.045754157, -0.029643415, -0.0028617077, -0.036310848, -0.2293659, -0.012074187, -0.07525764, 0.05500191, 0.07562592, -0.115233526) * inp_0_0_2; + result2 += M4(0.036355898, -0.034812134, 0.1152061, 0.029086314, -0.18425488, -0.21790303, 0.0787836, -0.09064558, 0.0409123, 0.2763841, 0.055201523, 0.09320933, -0.18550111, -0.19603312, 0.15517412, 0.18693168) * inp_0_1_2; + result2 += M4(0.040125795, -0.113297805, 0.025580121, 0.030720403, 0.004614835, -0.13644749, -0.033115827, -0.28015882, 0.082783215, -0.04702188, -0.075818196, 0.019709801, 0.22457251, -0.36561012, 0.18594532, -0.10976233) * inp_0_2_2; + result3 += M4(0.21994363, 0.18810263, 0.03882187, 0.031097172, 0.028676543, -0.01652421, 0.0009278432, -0.097504616, 0.060369167, 0.022149583, 0.12658578, -0.047912594, 0.087797225, 0.0830042, -0.059321098, -0.09670434) * inp_0_0_0; + result3 += M4(-0.24017385, 0.20781578, 0.2484141, 0.07595827, 0.31128934, -0.077589154, -0.22300583, -0.08513767, -0.088106796, 0.07169701, 0.21182175, -0.16114962, -0.20586795, -0.09325638, -0.036742713, 0.04096944) * inp_0_1_0; + result3 += M4(-0.015692951, -0.03014106, -0.008278672, -0.0012050589, 0.31460193, -0.22267194, -0.15603703, -0.016500553, -0.08611368, 0.0129460925, 0.13168901, 
-0.17860411, 0.17449656, 0.16480394, -0.111943886, -0.119625956) * inp_0_2_0; + result3 += M4(0.3417092, 0.19531095, -0.12030788, -0.07435814, -0.00526715, 0.04863232, -0.108501635, -0.10556784, 0.10033676, 0.0058830003, 0.14145415, -0.10324726, 0.04020823, -0.11052599, 0.1680087, 0.019774001) * inp_0_0_1; + result3 += M4(0.17469816, -0.108954616, -0.022078786, -0.57005113, 0.35266578, -0.15694757, -0.15896995, -0.07326995, -0.105245724, 0.04300008, 0.056248702, -0.061844226, -0.061631538, 0.15420584, -0.24465819, -0.04917201) * inp_0_1_1; + result3 += M4(-0.029127898, 0.10533356, -0.05784396, -0.36961702, 0.27379173, -0.08493819, -0.4078918, 0.2997451, -0.13829932, 0.035396393, 0.5777129, -0.06907513, -0.21687625, 0.0904391, -0.18873766, 0.042626336) * inp_0_2_1; + result3 += M4(-0.113065094, -0.008775924, -0.0840243, -0.08211604, -0.13342449, -0.0070020193, -0.03519927, -0.04905381, 0.11932424, 0.07503596, 0.082997814, 0.26825115, 0.2309719, -0.06072887, -0.13271064, -0.16668823) * inp_0_0_2; + result3 += M4(-0.13799047, 0.20521674, -0.009416285, -0.60644346, -0.12462929, -0.17963387, -0.00022621856, -0.6172592, -0.12347812, 0.11500762, -0.015037872, 0.3211392, -0.2576381, 0.20789056, 0.09743092, 0.17717129) * inp_0_1_2; + result3 += M4(-0.12627003, -0.014355152, 0.05081674, 0.18330996, -0.17688012, -0.09465515, -0.5051855, -0.53248626, 0.044556856, -0.081473775, 0.12005949, -0.15343209, 0.008224941, -0.17976554, -0.060513843, -0.31796342) * inp_0_2_2; + result4 += M4(-0.0647204, 0.09654864, -0.15104817, -0.04117688, 0.035523016, -0.046621397, -0.16918875, -0.05828916, -0.0629011, -0.09747466, -0.043645624, -0.13677382, -0.059999257, -0.11347389, 0.008796834, -0.16867939) * inp_0_0_0; + result4 += M4(-0.356825, -0.11862738, 0.11185236, -0.18727553, 0.10917819, -0.056881405, -0.12957531, 0.05320026, 0.24368936, 0.12946552, 0.073803104, -0.14360286, -0.071822084, 0.036721706, -0.23379014, -0.43976963) * inp_0_1_0; + result4 += M4(-0.09626581, 0.2864044, 
-0.20154244, -0.1094759, 0.12988517, 0.12269461, -0.03490066, -0.12602843, -0.10067345, -0.19819431, -0.10748926, -0.13594708, -0.00062526186, 0.004989592, 0.026069064, -0.010176603) * inp_0_2_0; + result4 += M4(0.0010864082, 0.15448679, -0.20172782, -0.095403604, 0.098961875, -0.048226472, -0.11919011, -0.022309378, 0.086312205, -0.19949594, -0.3084711, -0.08324916, 0.19120875, 0.25057435, 0.10739944, 0.09866035) * inp_0_0_1; + result4 += M4(0.44983077, -0.26926205, -0.20882393, 0.4908703, 0.55888087, -0.3844248, 0.17641366, 0.47042987, -0.32669616, -0.3570138, -0.14759587, -0.20607074, 0.02512093, 0.30407578, -0.044438023, -0.057541154) * inp_0_1_1; + result4 += M4(0.1176155, 0.113683954, 0.15930681, 0.17338523, 0.15644524, -0.14696267, 0.40857235, 0.20752317, -0.13565753, -0.019979121, 0.11889125, -0.10791812, 0.22435357, 0.113052554, -0.03955994, -0.08461989) * inp_0_2_1; + result4 += M4(-0.047255587, 0.16348606, -0.046946447, 0.056087777, 0.11520522, -0.008176931, -0.088727005, -0.075671315, 0.04560841, -0.167085, 0.0037524768, 0.153626, 0.10664237, -0.16228183, -0.08856867, -0.033942416) * inp_0_0_2; + result4 += M4(0.08530228, 0.036670424, 0.034691263, -0.20549068, 0.17499734, -0.0066715935, -0.24056336, -0.6436748, 0.0014624022, 0.1331887, 0.20349261, 0.39051116, 0.19860937, -0.09635772, -0.3097962, -0.061393823) * inp_0_1_2; + result4 += M4(-0.04709873, 0.12436787, 0.09431891, 0.06727294, 0.11121267, -0.13708098, -0.4096628, -0.5281741, 0.02461811, 0.086295374, -0.040318497, 0.11986206, 0.008481668, -0.07885111, -0.14814031, 0.06536796) * inp_0_2_2; + result5 += M4(-0.1205189, -0.13522245, -0.13375437, -0.33984226, 0.059571605, 0.040225558, 0.045981076, -0.22930293, 0.015563473, 0.06315636, 0.11301604, -0.07917363, 0.14391504, -0.025930865, 0.039270613, 0.21071853) * inp_0_0_0; + result5 += M4(-0.168494, -0.15959108, -0.03137135, -0.031032706, -0.012562032, 0.05714811, 0.0873991, -0.11245921, 0.114595555, 0.068395376, -0.08256869, 0.059741195, 0.31202134, 
-0.091089986, 0.11305526, -0.043918602) * inp_0_1_0; + result5 += M4(0.01850779, -0.23716848, -0.10720259, 0.17940275, 0.02630356, -0.031081656, 0.03651098, 0.11984031, 0.04672979, -0.23975179, -0.06333951, 0.0773084, 0.063252, 0.023403741, -0.005932706, 0.09592404) * inp_0_2_0; + result5 += M4(0.13276811, 0.14552811, 0.0012012721, 0.048469163, 0.1799069, 0.09026324, 0.17791766, 0.039031304, -0.17148705, -0.018644629, 0.032975942, -0.08356387, -0.07501362, -0.08741777, 0.17653543, -0.037628986) * inp_0_0_1; + result5 += M4(0.052284062, 0.30748817, 0.017134773, 0.054767136, 0.08047865, 0.12932916, 0.43879172, 0.4796407, 0.1070753, -0.22417559, -0.075027876, -0.04380084, 0.12943043, -0.26664734, -0.28268087, -0.36309803) * inp_0_1_1; + result5 += M4(0.022102708, -0.27027315, -0.05346116, -0.22804186, 0.075889595, 0.36816397, 0.29277337, 0.18898353, 0.059737135, -0.062378123, 0.30335823, -0.025132932, -0.15769532, -0.01610137, 0.15320984, -0.06287545) * inp_0_2_1; + result5 += M4(-0.05120104, 0.040515866, -0.11039598, -0.022910422, 0.068926826, -0.021788657, 0.14885426, 0.04582351, -0.1011755, -0.008622556, 0.019709354, -0.033576366, -0.2670982, 0.13014965, -0.19012322, -0.09114442) * inp_0_0_2; + result5 += M4(0.06225843, -0.092458956, -0.008116768, 0.07783341, 0.007597398, -0.01865556, 0.10360059, -0.00978511, -0.02124729, 0.031475246, 0.017553534, 0.07894418, 0.09715431, -0.016325492, 0.19725467, -0.07008915) * inp_0_1_2; + result5 += M4(0.074878536, -0.07708234, -0.07687017, 0.06568579, -0.14378831, -0.12435922, 0.07116281, 0.057560194, -0.13975972, -0.10590216, -0.082184136, -0.06793749, -0.032578167, 0.16950749, -0.09511035, 0.09423518) * inp_0_2_2; + result6 += M4(-0.047091704, 0.1762099, 0.040428344, -0.10331589, 0.016791053, -0.002741752, -0.026449017, 0.003729791, 0.06808642, 0.2392403, 0.08078326, -0.16181335, 0.119027816, 0.027509267, -0.088286825, -0.0015622613) * inp_0_0_0; + result6 += M4(-0.15559126, 0.19469191, -1.6796982, 0.07050413, 0.14751838, 
-0.136357, 0.11992304, 0.21932352, 0.04491368, 0.25785303, -0.33661342, 0.06752385, 0.006559123, -0.39538005, -0.14140283, 0.02698698) * inp_0_1_0; + result6 += M4(0.04060059, 0.004955614, 0.17289354, -0.020432219, 0.04132994, -0.2269096, 0.009849744, -0.048955765, 0.07166714, 0.15780523, 0.030655716, 0.007910881, -0.01654475, -0.1261956, -0.033270393, 0.06643357) * inp_0_2_0; + result6 += M4(0.23296551, 0.39368978, 0.10173819, 0.016990587, 0.10725656, -0.21445906, -0.0460863, 0.12937367, 0.22015992, -0.056731716, -0.15625024, 0.11746047, -0.054077156, -0.29911926, -0.066048205, -0.13064308) * inp_0_0_1; + result6 += M4(0.14043681, 0.16510749, 0.37955365, 0.024925599, -0.10113562, -0.91881996, -1.4156492, 0.49913162, 0.056183968, -0.32814565, 0.36283296, -0.21359983, 0.018981446, 0.078645796, 0.48507872, -0.040559407) * inp_0_1_1; + result6 += M4(-0.11389132, -0.025869433, 0.17677203, -0.0012497363, -0.42856163, -0.7060819, -0.9791711, 0.06421006, 0.15110345, 0.05471478, -0.1331566, 0.06792761, -0.15620281, -0.17329371, 0.0050743627, -0.08315401) * inp_0_2_1; + result6 += M4(0.01762451, 0.34044358, -0.038219716, -0.00977577, 0.07978265, -0.07561531, 0.025359692, -0.009767879, 0.054548223, 0.056554604, -0.008550653, -0.024759918, 0.08444629, 0.4397034, -0.13774768, -0.0475808) * inp_0_0_2; + result6 += M4(0.07251138, 0.14877741, 0.14064711, -0.01770789, -0.12055167, -0.13074405, -0.03881797, 0.18801236, 0.244702, 0.10442613, -0.09986584, 0.14181675, -0.3256468, 0.24721909, -0.13838233, 0.05967567) * inp_0_1_2; + result6 += M4(0.08274853, -0.05230511, -0.015015344, -0.008427317, -0.1261798, 0.17729543, 0.20077544, -0.10061183, 0.09802276, -0.02198857, 0.20390317, -0.027713804, 0.28264147, -0.3060371, 0.012613725, -0.03912084) * inp_0_2_2; + result7 += M4(-0.06321895, 0.1795193, 0.30838016, -0.03319495, -0.022143506, -0.08803499, 0.04103361, -0.032351818, 0.02227362, -0.08811049, -0.0959823, 0.02694849, -0.0043757185, 0.013062695, 0.15145485, 0.026561698) * inp_0_0_0; 
+ result7 += M4(0.16038859, -0.28498343, -0.53026897, 0.025555888, 0.099517666, -0.0127455015, 0.09401707, 0.056986097, -0.04029349, 0.19178541, 0.023709709, -0.02593737, -0.20253864, 0.28925106, -0.16694629, -0.026898233) * inp_0_1_0; + result7 += M4(0.061291948, -0.4159536, -0.21278694, 0.0041169757, 0.18120582, -0.11143881, 0.12851085, -0.04763011, 0.24448766, -0.15402062, -0.16995446, 0.051363885, -0.189586, 0.11198077, 0.087760806, 0.007919328) * inp_0_2_0; + result7 += M4(0.03529199, -0.08172859, 0.20492913, 0.010756407, -0.021344246, -0.103721984, -0.13724221, -0.03416302, 0.098283276, -0.08297246, -0.23792939, 0.053858396, 0.028365767, 0.17811257, -0.04905931, -0.027732367) * inp_0_0_1; + result7 += M4(-0.09731158, 0.07015159, 0.025875507, -0.08366549, 0.026216093, 0.20282517, -0.047570836, 0.12024377, 0.039535135, 0.06453895, 0.096107006, -0.120748885, 0.36688223, -0.32637262, -0.23932144, -0.017603891) * inp_0_1_1; + result7 += M4(0.0009714144, 0.0901112, -0.14175467, 0.15882266, 0.0050029205, 0.06735896, -0.04336168, 0.09880196, -0.088926695, 0.050075166, 0.13868159, 0.048162885, 0.11580188, 0.14974794, 0.16592643, -0.17951703) * inp_0_2_1; + result7 += M4(0.030689232, 0.25767696, -0.006166152, -0.036973067, 0.031712633, -0.048197642, -0.14026803, -0.028327234, 0.016440952, 0.13980462, 0.08790442, 0.08222346, 0.042942114, 0.23712075, 0.23788041, 0.027321558) * inp_0_0_2; + result7 += M4(0.008700281, 0.08348494, -0.20075266, 0.02521982, 0.021076478, 0.09265842, -0.06407022, -0.00076757924, 0.101533175, -0.19637956, -0.16996434, 0.09663022, -0.05636163, -0.2059281, 0.34135315, -0.16630952) * inp_0_1_2; + result7 += M4(0.03454254, 0.26498768, 0.13600038, 0.02592277, 0.0008362706, -0.100303456, 0.05319897, -0.009874358, 0.14062883, 0.09164722, -0.15648055, 0.08009963, 0.078154504, 0.094008006, -0.21762596, -0.018340524) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + 
const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.050353423, -0.046809703, -0.074424565, -0.049597032, -0.059440833, -0.016547872, -0.030117158, -0.10792511, 0.067184374, 0.046471834, -0.0028451944, 0.08514948, 0.08273609, 0.029481065, -0.41196913, -0.12889831) * inp_1_0_0; + result0 += M4(0.06213183, 0.05712363, -0.120768435, 0.0054600067, -0.06808212, -0.2668333, -0.23615515, 0.13161564, -0.093465604, -0.15012908, -0.0579171, -0.070676625, 0.093419425, -0.9064117, -0.3119384, -0.27338335) * inp_1_1_0; + result0 += M4(0.012120313, -0.008722017, -0.06845569, 0.00030523405, 0.068179175, -0.094685584, 0.3295802, 0.08102866, -0.07075261, -0.11404178, -0.058991797, 0.10451936, -0.019411365, -0.031391826, 0.11522716, -0.07312307) * inp_1_2_0; + result0 += M4(0.06082993, -0.23506641, -0.0674635, 0.06528714, -0.012952341, 0.04296578, 0.035333797, -0.17849007, 0.14081058, -0.0053381305, -0.012471617, 0.13901459, -0.02180143, -3.354169, 0.018167697, -0.17981246) * inp_1_0_1; + result0 += M4(0.011075656, 0.09919327, -0.068206266, 0.24021362, -0.035487056, -0.3568312, 0.002771683, 0.09228731, -0.14318392, 0.31760496, 0.15125819, -0.036176164, -0.057475246, -0.06588559, 0.10080686, 0.08425073) * inp_1_1_1; + result0 += M4(-0.028857037, 0.052384343, -0.15574992, 0.035086505, 0.24430661, 0.44947267, -0.25937915, 0.5916093, -0.050427713, 0.06593315, 0.04158293, 0.067717426, 0.0035418617, 0.082726985, 0.0015692243, -0.13341355) * inp_1_2_1; + result0 += M4(-0.07018673, 0.57565486, -0.12212208, -0.021671755, 0.04045959, -0.027279906, 0.0033897066, -0.12028911, -0.051435515, 
-0.25275406, -0.05656492, 0.13834813, -0.026642008, -0.035601966, 0.007892064, -0.11206658) * inp_1_0_2; + result0 += M4(-0.13334328, -0.36171016, 0.20771265, -0.18690872, -0.0052082087, 0.15840878, -0.012833503, 0.14350723, -0.038447812, 0.2642458, 0.10113913, 0.1956421, -0.016976172, -0.018625548, -0.036039453, 0.13024461) * inp_1_1_2; + result0 += M4(-0.025897514, 0.022892162, -0.085544705, -0.1056002, 0.0076056076, 0.00021891292, 0.14977726, -0.058212887, 0.057734717, 0.029316211, 0.016036771, 0.2862503, -0.029245151, -0.04861973, 0.06345646, 0.0025747707) * inp_1_2_2; + result1 += M4(0.12230406, 0.110402204, 0.0022191075, 0.0208074, 0.1359608, -0.39918938, -0.19621581, -0.03328318, -0.14194785, -0.1326139, -0.016295277, 0.25213736, -0.11394504, 0.1707785, -0.50810874, 0.09009043) * inp_1_0_0; + result1 += M4(0.039731972, 0.019554405, -0.050087366, -0.116993316, 0.036561966, -1.6013801, 0.025701985, -0.20249905, -0.087569736, -0.110885486, 0.086238414, 0.18336657, -0.118454196, -0.14258544, 0.21710697, 0.12274369) * inp_1_1_0; + result1 += M4(-0.04302544, 0.03054647, -0.03619867, -0.012912802, -0.21779968, 0.05877272, -0.062298175, 0.05893563, -0.08509494, -0.09765255, 0.1835829, -0.301379, 0.016239118, 0.013196551, 0.046792064, 0.14568199) * inp_1_2_0; + result1 += M4(-0.47913632, 0.07477867, -0.013720931, -0.16285127, 0.09672787, 0.26150432, -0.07223319, 0.026923614, 0.15294167, -0.3069324, -0.05468833, 0.009024659, -0.2764688, 0.025165537, 0.21237579, 0.14874646) * inp_1_0_1; + result1 += M4(-0.12191206, -0.031483904, 0.25469255, 0.04896874, -0.03953795, -0.13158178, 0.23139334, -0.062157433, 0.21271344, 0.15276282, -0.10278962, 0.045026843, -0.13069059, -0.019814454, 0.12993966, 0.12076317) * inp_1_1_1; + result1 += M4(-0.021779012, -0.06921528, -0.04792355, -0.054524377, 0.21400808, 0.051987875, 0.17276382, 0.07044453, -0.08517467, 0.018291483, 0.110145435, -0.07507238, -0.014085478, 0.0014016334, 0.0069213454, 0.21427554) * inp_1_2_1; + result1 += 
M4(0.3039211, 0.21061566, -0.21254519, 0.11502978, 0.004645631, -0.035205964, -0.15530144, 0.016145334, -0.3796126, -0.26098803, -0.06447568, -0.18469138, 0.00040711233, -0.019105973, 0.14028107, -0.029840464) * inp_1_0_2; + result1 += M4(-0.10201214, -0.12005942, 0.28632927, -0.0048452117, 0.10168667, 0.1222315, -0.065509446, -0.018354936, 0.20522162, 0.45282546, -0.32358447, -0.21195723, 0.05026903, -0.0347392, 0.049776144, 0.04231012) * inp_1_1_2; + result1 += M4(0.052235685, 0.06476681, -0.007898288, -0.014652278, -0.010168681, -0.06502043, 0.11613052, 0.016242228, -0.008920748, 0.060279775, -0.083112516, 0.11410098, -0.0022111523, 0.012418391, 0.003915518, 0.11510619) * inp_1_2_2; + result2 += M4(0.009627145, -0.02091571, -0.040712036, -0.086539805, -0.077503406, -0.06554453, -0.0375449, 0.0003467931, -0.112540826, -0.042942278, -0.004069735, 0.06633014, 0.11937579, 0.112028055, -0.19244236, -0.011381193) * inp_1_0_0; + result2 += M4(-0.010039437, -0.17678991, -0.014025697, -0.13453454, -0.078378275, 0.21216086, -0.046340372, 0.004593987, -0.030087475, 0.093752, 0.0021318006, -0.07141553, 0.21013309, 0.29048875, -0.38266456, -0.06400555) * inp_1_1_0; + result2 += M4(0.050876804, 0.009760382, -0.019924283, 0.059721947, 0.041578773, -0.07134676, -0.05581895, 0.117495336, -0.111501575, 0.033511136, -0.055773247, -0.066173546, 0.13521561, 0.054245476, -0.0018692814, -0.12549134) * inp_1_2_0; + result2 += M4(0.05737616, 0.27942115, -2.298544, 0.027574228, 0.0033914193, -0.029851897, -0.029384125, -0.06649299, 0.13537526, -0.10982203, -0.015818523, 0.03578428, 0.082637616, 0.25502712, -0.95422614, -0.024462754) * inp_1_0_1; + result2 += M4(0.07468704, 0.19655287, 0.020330673, -0.15325862, -0.07257556, 0.021362118, -0.097650744, -0.07458505, -0.07285997, -0.2091995, 0.053149696, -0.035658777, 0.12165436, 0.019479273, -0.051164947, -0.05572143) * inp_1_1_1; + result2 += M4(0.05212816, 0.05875644, 0.007962393, 0.042551465, 0.06982919, -0.5235366, 0.36652777, 
0.018920891, 0.02451188, -0.01821463, -0.0820836, -0.012211782, 0.13590047, -0.09741252, -0.024899637, 0.06283093) * inp_1_2_1; + result2 += M4(0.13758332, -0.11508548, -0.06850991, 0.027755717, -0.0053178435, -0.031295706, -0.009957828, 0.01909424, -0.14549612, 0.005653666, -0.060142104, -0.0726525, 0.019328095, -0.08044059, 0.0045705475, -0.025495505) * inp_1_0_2; + result2 += M4(0.17690514, 0.47819778, -0.56697905, -0.32600853, -0.15631567, 0.050864168, -0.070710234, -0.0061398265, 0.22401346, -0.66397154, 0.67689145, 0.12443163, -0.005753283, -0.003162449, 0.038585782, -0.021491662) * inp_1_1_2; + result2 += M4(0.052644014, -0.01084531, -0.009258209, -0.04327573, 0.08937049, 0.05608117, 0.0020092733, -0.13975157, 0.18227273, 0.010968768, 0.05547196, 0.27393818, 0.014354109, 0.04734593, -0.04274871, 0.08966255) * inp_1_2_2; + result3 += M4(-0.15466352, 0.1753106, -0.057654276, -0.080346055, -0.08684239, -0.060628965, -0.018058756, -0.019003063, 0.1649216, 0.0056091007, 0.018234013, 0.115384765, 0.2728903, -0.050012514, 0.07286001, 0.21214484) * inp_1_0_0; + result3 += M4(-0.055282563, 0.042270336, -0.14920826, -0.05565247, -0.17509723, -0.007836413, 0.025385581, -0.060870547, 0.15458457, 0.026210451, 0.0056088725, 0.009496039, 0.4410752, -0.02443769, 0.018905113, 0.34486783) * inp_1_1_0; + result3 += M4(0.13845061, -0.041570053, 0.05206113, 0.032746986, 0.3097028, -0.079597846, -0.0045065354, 0.036300916, -0.24376567, 0.1437171, -0.07567566, 0.12263813, -0.10524432, -0.032756347, -0.04089654, 0.11922382) * inp_1_2_0; + result3 += M4(-0.3450517, -0.0293347, -0.008506553, 0.27482376, -0.104029484, 0.015886096, 0.047152877, -0.022681655, 0.05039552, -0.06931879, -0.24398392, -0.19114342, 0.33690536, -0.1760741, 0.062387463, -0.60001916) * inp_1_0_1; + result3 += M4(-0.33937278, 0.03221792, -0.20601016, 0.09151184, 0.088146046, 0.010388135, 0.037717123, -0.33787167, 0.031349875, 0.2467585, 0.11280596, -0.081789084, 0.100762054, 0.11897287, -0.14958718, -0.4274934) * 
inp_1_1_1; + result3 += M4(-0.16177538, -0.10681617, 0.097662374, 0.027116643, -0.15535423, 0.0071900445, 0.098842345, -0.09686859, -0.020677991, 0.1223462, -0.18145184, -0.12322052, -0.049173184, -0.04933215, 0.011176784, 0.10453388) * inp_1_2_1; + result3 += M4(0.0143258395, -0.047530204, 0.06751263, -0.009686652, 0.049010016, 0.08026732, 0.0735831, 0.06534365, -0.11096335, 0.07671127, -0.17131972, -0.18913133, 0.03580388, 0.02546478, 0.031590775, -0.46314153) * inp_1_0_2; + result3 += M4(-0.11024047, 0.059999876, -0.24776231, 0.069180936, 0.099450134, -0.0028138063, 0.14560589, -0.27537617, -0.13162738, 0.2602523, -0.082328625, 0.5751915, -0.016883427, 0.035476677, -0.058363155, -0.087529816) * inp_1_1_2; + result3 += M4(-0.06527366, -0.07321466, -0.11013269, 0.10700489, 0.12794274, 0.143373, -0.1998652, 0.085530356, 0.27018106, 0.03430492, 0.01313275, -0.19258638, 0.099327035, 0.031997293, -0.01579704, -0.028137546) * inp_1_2_2; + result4 += M4(0.034241717, 0.14560685, -0.07059983, -0.048365757, -0.06923395, 0.02788708, 0.07024026, -0.07239688, -0.05073314, 0.06361448, 0.1036229, 0.13770972, 0.16711862, -0.06759201, 0.06868784, 0.21040082) * inp_1_0_0; + result4 += M4(7.889136e-05, 0.1448967, 0.0120723415, -0.04398796, -0.0025940053, 0.19994844, 0.045044854, 0.122164845, 0.00011145298, 0.039136488, -0.058423296, 0.011019284, 0.3187712, 0.002346311, 0.3133367, 0.3366688) * inp_1_1_0; + result4 += M4(-0.020006701, -0.09640312, 0.034889605, 0.032910477, 0.0859932, -0.16727556, 0.18134122, 0.08072309, -0.005591878, 0.2618464, 0.11717167, 0.13277426, 0.005803244, -0.07343049, -0.0007594699, 0.07177366) * inp_1_2_0; + result4 += M4(0.24020621, 0.17265165, 0.27775222, 0.37951496, 0.007373834, 0.013477186, -0.05720337, -0.08359239, 0.06963244, -0.20801787, -0.16162816, -0.16387402, 0.17029399, -0.06789564, 0.057876557, 0.15928234) * inp_1_0_1; + result4 += M4(0.08696715, 0.22902814, -0.098804325, 0.17399752, -0.031757943, 0.009000329, -0.10855027, 0.11406956, 
-0.10605073, 0.038545147, 0.12092632, -0.28194898, 0.10004931, -0.29438514, 0.14205848, 0.025120387) * inp_1_1_1; + result4 += M4(0.00935219, -0.043909084, -0.057207387, -0.006858439, -0.18782052, -0.24575754, -0.18026431, -0.1580193, -0.070116736, 0.11748019, -0.13015077, -0.10171491, -0.0051615736, 0.079644755, 0.08537926, -0.025504366) * inp_1_2_1; + result4 += M4(-0.01457055, -0.23596151, -0.12770654, -0.44953966, 0.010319849, -0.04212761, 0.036205474, 0.15004651, 0.096164376, -0.12687105, -0.16168225, -0.24025269, 0.03186571, -0.10847563, 0.039552685, -0.35295856) * inp_1_0_2; + result4 += M4(0.21015891, 0.15100212, 0.16399124, -0.008079374, -0.016138272, -0.14525296, 0.14673626, -0.13265406, -0.5422777, 0.11019852, -0.004156365, -0.4378592, -0.09075403, 0.051770605, -0.01216994, 0.030551502) * inp_1_1_2; + result4 += M4(-0.02542582, 0.09128689, 0.034989987, -0.031978976, 0.024582174, 0.12885588, -0.010468548, -0.012032657, -0.11233656, -0.1878876, 0.05700864, -0.119735524, -0.052216183, -0.04510211, -0.006198828, -0.018065663) * inp_1_2_2; + result5 += M4(-0.105741695, 0.030120268, 0.010589346, -0.046851862, 0.026937151, -0.0458042, 0.047890246, 0.009865603, 0.06446395, 0.093772225, -0.027894363, -0.013303434, -0.03599333, -0.056318723, -0.02722959, 0.051560834) * inp_1_0_0; + result5 += M4(-0.11275904, -0.07030927, 0.03613805, 0.15197079, -0.016481595, -0.06677235, -0.015963154, 0.04019457, -0.0041889963, 0.07911886, -0.10162684, -0.11922954, -0.016879966, 0.46875194, 0.13243358, -0.3028) * inp_1_1_0; + result5 += M4(-0.021431329, 0.02845094, 0.01917349, 0.26935023, 0.060816262, 0.09210378, 0.115646675, 0.09598305, 0.028917888, 0.046315048, 0.015928345, -0.014620898, -0.11740344, 0.014200038, -0.074817106, -0.22283669) * inp_1_2_0; + result5 += M4(0.1585673, 0.06564245, 0.1417825, 0.5254424, -0.036929425, -0.06180608, -0.0807507, -0.14706615, -0.03911734, 0.103862874, -0.057435155, -0.1461882, 0.048298948, 0.1106879, 0.009483295, -0.14538456) * inp_1_0_1; + 
result5 += M4(-0.02021285, 0.09545987, -0.041405242, 0.101548724, 0.107480176, 0.03692547, 0.1562033, 0.07395896, -0.094443955, 0.031959772, -0.1996548, -0.024069501, 0.055082295, 0.097889505, 0.15689933, -0.56664586) * inp_1_1_1; + result5 += M4(-0.019528514, 0.107269466, -0.07345283, -0.20095979, -0.11035748, 0.19620666, 0.11484614, -0.021132847, -0.0682673, -0.2231472, 0.02069023, 0.16370034, -0.04632951, 0.009400556, -0.10660355, -0.038149126) * inp_1_2_1; + result5 += M4(-0.2066398, 0.043647215, -0.117421776, 0.4549806, -0.018461045, 0.031187935, -0.016856091, -0.040724073, 0.07212592, -0.10981493, 0.07991286, -0.08563667, 0.0069989623, -0.05383134, 0.024289882, -0.08455121) * inp_1_0_2; + result5 += M4(-0.18827014, 0.46627483, 0.13979256, 0.49860772, 0.03180757, -0.05099197, -0.089179605, -0.051073954, 0.080238454, -0.49372384, -0.40864962, -0.054953966, -0.041159134, -0.060741015, 0.042637322, 0.010033197) * inp_1_1_2; + result5 += M4(0.06931211, 0.0026396862, 0.04362702, -0.01646692, 0.03317615, 0.038116433, -0.0047815028, 0.3006265, -0.06136993, 0.008267831, -0.22555752, 0.08187919, -0.042554468, 0.022714254, -0.036368567, -0.044143267) * inp_1_2_2; + result6 += M4(0.09332225, 0.2107942, 0.046468645, -0.0058521875, 0.027462866, 0.10704902, 0.028843805, -0.020340594, -0.054080028, -0.32308847, -0.020423707, 0.05962786, 0.07113592, -0.66309863, 0.10095243, 0.016556656) * inp_1_0_0; + result6 += M4(0.05626527, -0.047850717, 0.06214642, -0.040974036, 0.13208567, 0.24890055, 0.0488758, 0.012708694, -0.120700605, 0.06647558, -0.0031055915, 0.046462968, 0.053927135, -0.4851143, -1.8134881, 0.068895124) * inp_1_1_0; + result6 += M4(0.021884387, -0.029397087, -0.02141641, -0.014501913, 0.015087727, -0.15378447, -0.11168834, 0.026766786, -0.04538178, 0.18765987, -0.067522295, 0.023636453, 0.03069237, -0.025058249, 0.10501401, -0.028931929) * inp_1_2_0; + result6 += M4(0.0017545207, 0.009366909, -0.565109, 0.26265666, 0.030296054, -0.016820515, 0.067068055, 
0.07988171, -0.052892324, -0.20996697, -0.0074573974, -0.09472669, -0.30473316, -1.5234005, -0.3962788, 0.04463244) * inp_1_0_1; + result6 += M4(-0.027665226, -0.01698808, -0.09775606, -0.13257034, 0.16224389, 0.10846303, -0.16721332, -0.22938298, -0.08694459, -0.083731174, -0.013726704, 0.12140914, -0.06224736, 0.16626489, -0.27240467, -0.093341865) * inp_1_1_1; + result6 += M4(0.05643772, 0.15685016, 0.03795502, 0.010408171, -0.12951964, 0.29687145, 0.4011162, 0.05241936, -0.089510605, -0.109212585, 0.14673002, -0.01251537, -0.004850159, -0.03634716, 0.07179159, -0.013744846) * inp_1_2_1; + result6 += M4(-0.13582695, 0.37709188, 0.016129958, 0.09733396, 0.017633319, -0.19455892, -0.033723895, -0.028679593, -0.07662824, -0.46093917, -0.01839582, -0.07459589, 0.04401736, -0.15561318, 0.013520649, 0.029707436) * inp_1_0_2; + result6 += M4(-0.13236041, 0.20047903, -1.4458611, 0.0042178226, -0.14593826, -0.1340935, 0.062991686, 0.041445494, 0.15104139, -0.124417625, 1.6492378, -0.14513507, 0.0465085, 0.0039506154, 0.035408624, -0.032591578) * inp_1_1_2; + result6 += M4(-0.05919881, 0.16983312, 0.08900627, -0.01912651, 0.28432667, 0.07467849, -0.11141047, -0.013259035, -0.07218165, -0.16358578, 0.10745998, 0.044914685, -0.0027635738, -0.059950642, -0.011715925, 0.0082511045) * inp_1_2_2; + result7 += M4(0.00079846574, 0.11804416, 0.39774996, -0.0188999, -0.020984879, 0.1424132, -0.045651954, 0.04802473, -0.07093976, -0.15494217, -0.14104928, -0.0023575677, 0.013031488, 0.1184644, 0.20706058, -0.028626304) * inp_1_0_0; + result7 += M4(0.07073396, 0.047589906, 0.21066403, 0.070525676, 0.0014766767, -0.008504743, 0.16058329, 0.047966074, 0.057557244, -0.031994525, -0.33618268, 0.026231483, -0.14226823, -0.17986543, 0.3749392, 0.025390334) * inp_1_1_0; + result7 += M4(-0.01336333, -0.039813794, 0.028163971, -0.04683214, -0.1481976, -0.15717982, -0.09003236, 0.035600007, 0.0035262385, -0.10815804, -0.15353194, 0.09247015, 0.061191954, -0.04596074, 0.19901207, -0.010301933) 
* inp_1_2_0; + result7 += M4(-0.071889736, -0.07307619, -0.28616777, -0.08834103, 0.05495883, -0.07238764, 0.009196725, -0.015408031, -0.02424489, 0.05812557, 0.0020887218, -0.04214564, -0.105822794, -0.0055916696, 0.28408337, 0.0051373746) * inp_1_0_1; + result7 += M4(0.12658006, -0.14945039, -0.51529, 0.09083091, -0.07647365, 0.23932236, -0.096072294, -0.022568945, 0.023276795, -0.061652094, -0.19689299, -0.08721155, -0.03799168, -0.26181933, 0.5297491, 0.136994) * inp_1_1_1; + result7 += M4(-0.0073459907, -0.110861465, -0.1085393, -0.035288736, 0.098410346, -0.012924912, -0.078053445, 0.066206686, -0.04341607, -0.13493924, -0.08633322, 0.033935037, 0.0491683, -0.073946364, 0.15834758, -0.02127443) * inp_1_2_1; + result7 += M4(0.07542379, -0.12709174, 0.27380553, 0.08961021, -0.026780073, -0.01095716, 0.15072188, 0.008027963, -6.0380182e-05, 0.1422573, 0.030468704, -0.006553803, -0.021494344, -0.018053466, -0.068701476, 0.01639046) * inp_1_0_2; + result7 += M4(-0.05820514, 0.10647802, 0.27567282, 0.13490169, 0.00027440005, -0.02319636, -0.12695146, 0.052700393, 0.2946579, 0.017761704, -0.18812853, -0.12112882, 0.009524831, 0.09213997, 0.22466551, 0.030493941) * inp_1_1_2; + result7 += M4(-0.048544433, 0.006095917, 0.0888653, 0.01692638, 0.004513951, 0.025711872, 0.100203514, 0.013254646, 0.06259611, 0.091392644, -0.14288813, -0.13578561, 0.0032735362, 0.034511343, -0.02331332, 0.008500248) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + 
result0 += M4(0.14798167, 0.32969707, 0.35978433, -0.025166519, -0.07360234, 0.012388937, -0.09057915, 0.16475534, 0.21649787, 0.123509444, 0.3188876, -0.17394201, 0.032422878, 0.058578346, -0.041246872, 0.103866) * inp_2_0_0; + result0 += M4(0.065757975, -0.17898147, 0.3018122, 0.24880421, -0.08287398, 0.12209362, 0.09045875, 0.19394627, 0.021012923, 0.3386004, 0.21701767, 0.10220124, -0.0063404455, 0.07541256, -0.13295992, -0.26279962) * inp_2_1_0; + result0 += M4(0.07471258, 0.01625216, 0.101945125, 0.23299837, -0.0053609177, 0.16368029, 0.16530351, 0.3085733, -0.010843449, -0.057353172, 0.05077031, 0.08996226, 0.12557954, 0.13247977, -0.2434184, -0.062008843) * inp_2_2_0; + result0 += M4(0.07892017, -0.19662769, 0.20632322, 0.11177333, 0.065786585, -0.0077009504, -0.03237114, 0.054863397, 0.05309001, 0.0723526, -0.055593383, 0.29698423, -0.006024631, 0.044887517, 0.12367398, 0.074423164) * inp_2_0_1; + result0 += M4(0.024105964, -0.19590275, -0.38412267, 1.4240489, -0.00096269476, 0.19807102, 0.10541693, -0.11132736, 0.21926005, 0.5186404, -0.33780947, -0.2656679, 0.06544344, -0.10347784, 0.21115482, -0.63277185) * inp_2_1_1; + result0 += M4(-0.007660955, 0.14912277, -0.0012517645, 0.09301334, -0.03030125, 0.22706062, 0.062119618, -0.05686286, 0.096497245, 0.011387127, -0.08199684, -0.0014882354, 0.13522181, -0.014533298, 0.19079797, 0.01602368) * inp_2_2_1; + result0 += M4(0.02832157, -0.072065726, 0.08799233, 0.055657417, 0.03586983, 0.08324128, -0.09169483, 0.15052103, 0.065381736, -0.046825428, -0.030092219, 0.048315108, 0.020341216, 0.043230332, -0.077777006, 0.20855433) * inp_2_0_2; + result0 += M4(-0.100543156, -0.23298465, -0.15601614, 0.3822486, 0.00255601, -0.014198933, 0.1152892, 0.009894752, -0.0731281, 0.19547898, 0.09876246, -0.1384148, -0.06909734, -0.2016004, 0.05133047, 0.121334925) * inp_2_1_2; + result0 += M4(0.0008580311, 0.020834906, 0.104385406, 0.20686999, 0.039967004, 0.02231306, 0.0143063925, 0.05704368, -0.02781981, 0.08419426, 
-0.02055487, 0.015645076, 0.03185749, 0.13832857, 0.3300484, 0.23756409) * inp_2_2_2; + result1 += M4(-0.014646334, 0.193703, 0.21865068, 0.1512659, -0.03620869, 0.31267473, 0.031476807, 0.099512264, -0.06288779, -0.80396616, -0.0031370872, 0.13106087, 0.025451878, -0.23182608, 0.029182073, 0.37473318) * inp_2_0_0; + result1 += M4(-0.019765534, -0.015463853, -0.15314803, 0.629602, 0.3701295, 0.13982703, -0.023968458, 0.2805536, 0.24783622, -0.08060455, -0.07505057, 0.29910687, 0.0047641774, 0.14478186, -0.013111975, -0.103981376) * inp_2_1_0; + result1 += M4(-0.14914878, -0.16744123, 0.13028428, -0.19000438, 0.029777955, 0.07690664, 0.07095186, -0.11045454, -0.019116696, -0.016993696, 0.034676082, -0.10987831, 0.044353545, -0.086995676, 0.10650643, -0.07612089) * inp_2_2_0; + result1 += M4(-0.06546048, -0.18269108, 0.11226446, 0.1259433, -0.09634822, 0.14238119, 0.5685708, -0.08376794, 0.375088, -0.3783969, -0.8373722, -0.34600207, 0.18039258, 0.16030999, 0.069623016, -0.19501628) * inp_2_0_1; + result1 += M4(0.121734336, 0.44253471, -0.20267347, -0.20281743, 0.078100055, 0.006850094, -0.56120986, 0.09676285, 0.05967764, 0.15608798, -0.30019233, -0.3082072, 0.015091912, 0.39740068, -0.08576616, -0.1746624) * inp_2_1_1; + result1 += M4(-0.21738003, 0.0644141, -0.076813586, 0.27681845, 0.0208218, -0.00016772863, -0.24254076, -0.10827645, -0.025245795, -0.06569688, 0.019631762, -0.2352679, -0.17238232, 0.18914285, 0.089545295, 0.38894153) * inp_2_2_1; + result1 += M4(0.22535558, -0.07903611, -0.3908496, 0.10928906, -0.13099486, 0.08887396, 0.32293352, 0.063354105, -0.023962392, 0.09522632, -0.054138266, 0.10658677, -0.049707532, -0.29504964, 0.15979308, -0.14996131) * inp_2_0_2; + result1 += M4(-0.05500486, 0.13170563, 0.23967214, -0.1585575, 0.030043853, -0.053449742, -0.30708346, 0.16330789, 0.08346525, -0.13098939, -0.05193513, 0.12270213, -0.10243151, -0.0179288, 0.010035965, 0.16323087) * inp_2_1_2; + result1 += M4(0.061432607, -0.059181537, 0.036301028, 
0.19237389, -0.098314375, 0.031184586, -0.12905139, 0.1262295, 0.0066269664, -0.0325591, 0.04694461, 0.088054225, 0.094405696, 0.044605356, 0.14346221, -0.3402185) * inp_2_2_2; + result2 += M4(-0.090132065, 0.0013867198, -0.17575788, -0.030437393, -0.0056479, -0.04885836, 0.05486155, -0.07175495, 0.11895235, -0.08370183, -0.18873478, 0.046603035, -0.024090894, -0.049802396, 0.17142203, 0.074900344) * inp_2_0_0; + result2 += M4(0.07589163, 0.15743928, -0.26108593, 0.0490332, -0.11990651, -0.029694492, 0.0783449, -0.053165443, 0.1756661, -0.12829363, -0.059792813, 0.24232492, 0.16930164, 0.055432186, 0.1529013, 0.06908528) * inp_2_1_0; + result2 += M4(-0.002898305, 0.13875051, -0.023811057, 0.09005341, -0.20992334, -0.05217095, 0.15754569, -0.09545166, 0.06764274, 0.017226892, -0.005018973, -0.034012653, -0.039837632, -0.049978387, 0.20307639, -0.14002554) * inp_2_2_0; + result2 += M4(0.16155547, 0.20902802, -0.16797282, -0.0011661586, -0.0026229748, 0.043825503, 0.131158, -0.02872627, 0.023362624, -0.04318203, 0.002647419, 0.12905684, 0.06976089, 0.13359642, -0.18916087, -0.060273334) * inp_2_0_1; + result2 += M4(0.14770259, -0.6030893, 0.28123626, -0.35997632, 0.16351381, -0.49432242, 0.91551846, 0.26499605, 0.18039218, -0.22716516, -0.1092489, 0.6843979, 0.28705052, -0.27803588, 0.14257433, 0.080402285) * inp_2_1_1; + result2 += M4(0.15671887, 0.16275057, -0.04220065, 0.08955454, -0.16156888, -0.105369695, 0.1412348, 0.020355534, -0.08625957, 0.12686269, 0.004688464, 0.19197595, 0.0934681, 0.21850333, 0.17202729, 0.1246091) * inp_2_2_1; + result2 += M4(-0.06469733, 0.063847564, -0.0737831, -0.11086153, -0.05387153, 0.08163555, 0.017200531, -0.04286831, -0.023168579, 0.16447546, -0.07716168, -0.056515682, 0.017320625, 0.026413534, -0.0027386176, 0.12700069) * inp_2_0_2; + result2 += M4(0.069572195, 0.10989559, -0.08345742, -0.14026967, 0.011300764, 0.018233528, 0.033457924, 0.0661669, 0.36802906, 0.05073546, -0.090222426, 0.095999464, -0.05007687, 0.07416598, 
-0.034617137, 0.15506592) * inp_2_1_2; + result2 += M4(0.0075443992, 0.09218535, 0.021907257, 0.24363445, 0.051151756, -0.045401227, 0.06260131, -0.064708665, 0.059091195, -0.0018249397, -0.016233532, 0.040986232, 0.047326323, 0.28709084, 0.09570187, 0.24448664) * inp_2_2_2; + result3 += M4(0.2685766, 0.18301097, -0.17105378, -0.06528451, -0.0007337671, 0.05386833, -0.018203814, -0.02068733, -0.4102558, 0.15415688, 0.09972097, 0.08369299, -0.029018193, -0.037276182, 0.008924699, 0.12222542) * inp_2_0_0; + result3 += M4(0.4391307, -0.029349325, -0.03210177, 0.0754953, 0.20973799, 0.1062292, -0.17323662, -0.054460317, -0.16163473, 0.22031242, 0.098089926, 0.013387313, -0.18300214, 0.15658887, 0.037854254, 0.011919025) * inp_2_1_0; + result3 += M4(0.0070181475, 0.07032167, 0.19497313, 0.06842968, -0.1265164, 0.05689864, -0.06154129, -0.12920445, -0.012065589, 0.037939847, 0.30810964, 0.011577699, 0.17309047, -0.01862103, 0.10220324, 0.29973254) * inp_2_2_0; + result3 += M4(0.31923738, 0.12975454, -0.28034595, 0.19512357, -0.12528826, 0.028097697, 0.05986118, 0.0032601315, -0.20051119, -0.027024012, 0.17180178, 0.23867859, 0.06355175, -0.051550746, 0.08755422, 0.11043871) * inp_2_0_1; + result3 += M4(0.027882274, -0.021074127, -0.25341523, -0.28833082, -0.24950516, 0.21721418, 0.027259434, 0.16804479, -0.22666211, 0.32887012, 0.35872096, -0.10538488, -0.34914768, 0.025243253, 0.3066556, 0.28278568) * inp_2_1_1; + result3 += M4(0.0059141954, -0.02006126, 0.08285728, -0.026303358, 0.066330574, -0.12707698, 0.12860902, -0.1026879, 0.07057301, -0.040765714, 0.20299037, 0.025773192, 0.51236236, 0.0844771, 0.2166118, 0.0769804) * inp_2_2_1; + result3 += M4(-0.09691124, -0.17734091, -0.16368139, 0.21991438, 0.093676895, 0.12049627, -0.037783634, 0.045934517, 0.1098542, -0.039753765, 0.07490589, 0.058368325, -0.0301953, 0.09809937, 0.051264275, 0.14757736) * inp_2_0_2; + result3 += M4(-0.076082446, 0.09214525, -0.17534271, 0.38814884, 0.029871792, 0.10519365, -0.15527949, 
0.53442013, -0.08794864, 0.21905257, -0.0120418845, 0.25324836, 0.089029, 0.06474662, 0.31822667, 0.43938985) * inp_2_1_2; + result3 += M4(0.1802647, 0.020040901, -0.01262005, -0.06721949, 0.09334214, -0.0060265893, 0.00029382613, -0.02283571, 0.011216388, 0.10540019, 0.20456208, -0.0341242, -0.18825503, 0.042143803, 0.2433884, 0.29167935) * inp_2_2_2; + result4 += M4(0.03917384, 0.19171996, 0.35897788, -0.035745744, -0.0056778784, 0.11087332, 0.040208973, -0.05626218, -0.08261591, -0.045704328, 0.121067226, -0.05183238, -0.021853054, 0.15057355, 0.11258637, 0.16716263) * inp_2_0_0; + result4 += M4(0.0787703, 0.014477287, 0.016759448, 0.02922606, -0.07746891, -0.10071476, -0.16266973, -0.027350623, -0.119010374, -0.06335973, 0.020502957, 0.015856797, -0.23794225, 0.06888505, 0.15281926, 0.136032) * inp_2_1_0; + result4 += M4(-0.024153247, -0.020140907, 0.10472193, 0.063509874, 0.121605545, 0.14821392, -0.16273807, 0.100088455, -0.0019362759, 0.057722345, -0.02037534, 0.07538998, -0.19317825, 0.15163663, 0.43742216, 0.29304233) * inp_2_2_0; + result4 += M4(0.056429822, 0.20682736, -0.06913481, 0.3664237, -0.06036475, 0.12012815, -0.0050623915, -0.17446505, -0.024140958, -0.04331742, 0.10718152, 0.06466814, -0.1253321, -0.12547116, 0.07918919, -0.010291679) * inp_2_0_1; + result4 += M4(-0.34819266, -0.64322764, -0.18650332, -0.32853603, -0.45525074, -0.14293408, -0.018485148, -0.4928596, -0.1226723, -0.06398023, 0.1588924, 0.22833918, -0.39246163, 0.06805584, 0.028107537, -0.10490754) * inp_2_1_1; + result4 += M4(-0.054888908, 0.04982286, -0.0060292208, -0.024865909, 0.014331968, -0.23263083, 0.059174422, -0.17842662, -0.011708225, 0.017989712, 0.17128073, -0.016141003, -0.31791595, -0.18085133, 0.25932223, 0.18938261) * inp_2_2_1; + result4 += M4(0.035071395, 0.12994127, 0.12453648, -0.09343104, -0.030116221, 0.13095681, 0.021388326, 0.13062276, 0.032947365, -0.055599324, -0.056569736, 0.12875494, -0.20802794, -0.07583426, 0.05496649, 0.03960439) * inp_2_0_2; + 
result4 += M4(0.14446259, 0.054287024, 0.045010276, 0.21771728, -0.0025658596, 0.28008524, 0.088319875, 0.49949625, -0.11571129, 0.007224913, 0.081445895, 0.28446135, -0.14856477, 0.16881977, 0.1619648, 0.41252476) * inp_2_1_2; + result4 += M4(-0.12660632, 0.16946502, 0.045095824, -0.12160026, 0.098165855, -0.16977406, 0.07873497, -0.031269796, -0.04300626, 0.09427546, -0.050327994, 0.07100062, -0.3121061, 0.20957707, 0.028779844, 0.020830618) * inp_2_2_2; + result5 += M4(0.05594034, -0.27323946, -0.10411966, 0.19273478, -0.06887628, -0.05155524, 0.08415508, 0.22326843, -0.04541371, -0.1974212, -0.07474692, 0.016079674, -0.23771256, 0.11231506, -0.13174021, -0.041805673) * inp_2_0_0; + result5 += M4(-0.17470378, -0.13262028, -0.3045934, -0.23256221, -0.030805834, 0.182573, 0.069530904, 0.008251476, 0.142016, -0.008546693, -0.12632295, -0.32238746, -0.35908225, -0.061007906, -0.33944154, -0.2645622) * inp_2_1_0; + result5 += M4(-0.024161972, 0.06570817, 0.0028879254, 0.06239786, -0.06497316, 0.21702552, -0.010258944, 0.19166872, -0.0033892482, 0.03582859, -0.054844134, 0.1518353, -0.25082752, 0.2837798, -0.18608347, 0.41113275) * inp_2_2_0; + result5 += M4(0.06747966, -0.0057703955, 0.063500226, 0.105181664, -0.057158154, -0.1290059, -0.042310875, -0.12260737, 0.013109046, -0.19605474, -0.07424287, -0.08444099, -0.068970144, -0.11076139, -0.18823707, 0.039594453) * inp_2_0_1; + result5 += M4(-0.07699123, -0.13033818, -0.16277117, -0.36149937, -0.2283251, -0.14638117, -0.17533408, -0.28321895, 0.24702573, -0.14470875, -0.092630565, 0.10027762, -0.12768812, 0.0357125, -0.06146514, 0.12526575) * inp_2_1_1; + result5 += M4(0.07096949, 0.13597254, -0.15845811, 0.2046907, -0.113468185, -0.022919554, 0.015036124, 0.09972615, 0.04426655, 0.009127988, -0.07133441, 0.26635978, -0.21387924, 0.22665285, -0.31868616, 0.10117811) * inp_2_2_1; + result5 += M4(-0.04168437, -0.108219735, -0.008220711, 0.040169477, -0.009767064, -0.022632834, -0.03489749, -0.020245953, 0.012904271, 
0.0058327247, -0.049515173, -0.16984537, 0.12049866, -0.11099652, -0.08166101, 0.06628959) * inp_2_0_2; + result5 += M4(-0.032379933, -0.0536348, 0.04880159, 0.014004403, 0.05574491, 0.17830066, -0.00487589, 0.07933988, 0.15870495, -0.0075573875, -0.14323002, -0.15597491, -0.10453179, -0.08835103, -0.14172937, -0.08488344) * inp_2_1_2; + result5 += M4(-0.093279175, 0.111123145, -0.009972042, -0.010945283, 0.044537004, 0.06435724, -0.09753193, -0.09625517, -0.0448321, 0.06894434, -0.05543332, 0.0088264765, -0.24253574, 0.18463078, -0.15143481, -0.015086551) * inp_2_2_2; + result6 += M4(-0.14101617, 0.45603985, 0.11462078, 0.15035559, -0.043287028, -0.52733994, -0.050076496, -0.05160513, 0.038330566, -0.06499483, -0.063733235, -0.1876216, -0.039066933, 0.050710674, 0.15228713, -0.02570981) * inp_2_0_0; + result6 += M4(-0.21618348, -0.16782708, 0.18072358, 0.015840255, 0.062031657, 0.017695678, 0.081718795, 0.06210786, 0.08719056, 0.22781125, -0.0009219294, 0.08272198, -0.061176464, 0.40369153, 0.36968786, 0.066784635) * inp_2_1_0; + result6 += M4(0.001435731, 0.015904447, -0.13786788, -0.0052644447, -0.01821759, -0.07131523, -0.060587518, -0.08045374, -0.06320833, 0.17945474, -0.062166512, -0.0019211707, -0.1726007, 0.6196538, 0.010415715, -0.030465433) * inp_2_2_0; + result6 += M4(-0.032673076, 0.21294901, -0.002008417, 0.124084175, -0.18396752, -0.083575934, 0.03617782, -0.14779688, 0.06381524, 0.36120465, -0.007982644, -0.25186777, -0.088355936, 0.10022911, 0.0012239299, -0.029040184) * inp_2_0_1; + result6 += M4(-0.024227023, -0.11458965, 1.1322322, -0.15262376, 0.21433035, 0.591815, 0.43304297, 0.030893482, 0.076957524, 0.652114, 0.14043349, 0.02515424, 0.20544682, 0.12705134, 0.7626254, 0.14499094) * inp_2_1_1; + result6 += M4(0.043009542, 0.0006286714, -0.0069515225, -0.021069944, -0.0143068135, -0.1210831, 0.113472976, 0.02957111, -0.046939064, -0.04457818, -0.09583104, 0.039483666, 0.07673319, 0.43753898, 0.077740304, 0.035796806) * inp_2_2_1; + result6 += 
M4(0.21361329, 0.044898354, 0.11632864, 0.037453037, -0.011976736, -0.14009582, 0.011824996, 0.037873846, 0.017858554, 0.3504187, -0.040843245, -0.06727661, -0.07826574, 0.43344057, -0.02636409, 0.04546663) * inp_2_0_2; + result6 += M4(-0.16143668, 0.14270769, 0.20747927, 0.055327367, 0.13745679, -0.17875391, -0.061554633, -0.062469535, 0.26956376, 0.03319949, -0.062331617, 0.013035938, 0.07776556, 0.022040557, 0.15146402, 0.16426323) * inp_2_1_2; + result6 += M4(-0.15287, -0.01402495, -0.07529775, -0.026113965, -0.0013235839, 0.0374326, 0.019171692, 0.042563066, 0.081450544, 0.1506115, -0.0259815, -0.023641048, -0.13419153, 0.2728413, -0.13001315, -0.07124397) * inp_2_2_2; + result7 += M4(-0.20676173, 0.017402256, 0.6366335, -0.032154344, -0.024140522, 0.05937407, 0.1413502, 0.022396233, -0.13420899, 0.10011038, 0.058690336, -0.027011182, -0.008634274, -0.043286756, 0.17064366, 0.011459937) * inp_2_0_0; + result7 += M4(0.036658127, 0.124612376, 0.36770982, 0.04180192, -0.05743151, -0.030430704, 0.070063576, -0.022618817, -0.13503619, 0.060629062, 0.045400027, -0.07597667, 0.007879579, -0.30695942, 0.045526125, -0.032661542) * inp_2_1_0; + result7 += M4(0.13303798, -0.15701066, -0.003759278, 0.026077427, 0.31546238, 0.008026783, 0.29732296, -0.09413903, -0.031766776, -0.02239174, -0.023291357, 0.017597865, 0.27031928, 0.022237126, 0.31170833, 0.07464661) * inp_2_2_0; + result7 += M4(-0.18840568, -0.26675048, -0.27112442, -0.07382757, 0.013058193, 0.0047183875, 0.13746461, 0.027802348, -0.086207464, 0.12491161, -0.1684139, -0.060159087, -0.02137234, -0.047705747, -0.05748505, 0.019910768) * inp_2_0_1; + result7 += M4(0.22780561, -0.4007392, 0.43293673, 0.15633248, -0.09347943, -0.2660596, -0.13969366, 0.09837358, -0.20455904, 0.19487731, -0.23239242, -0.03697396, 0.047783602, -0.08274263, -0.1626889, 0.15236942) * inp_2_1_1; + result7 += M4(-0.051888753, -0.00042802707, 0.08672579, -0.036712416, 0.06717615, 0.103258856, -0.22366904, 0.0125487875, -0.019851524, 
-0.055699356, -0.1136299, 0.030360853, 0.037519373, 0.019084461, 0.11896503, 0.031885304) * inp_2_2_1; + result7 += M4(-0.0379545, 0.2113392, -0.04047959, -0.01832525, -0.015454086, -0.019668167, 0.066109665, -0.012503281, -0.016549157, 0.028441655, 0.2580847, -0.0040072077, 0.024469642, 0.07551917, -0.08341632, 0.04620936) * inp_2_0_2; + result7 += M4(0.15153699, -0.2522845, 0.18018436, 0.09741081, -0.038173787, 0.030702803, -0.10061468, -0.021667069, 0.017508151, 0.0060765124, 0.30460465, -0.030662311, -0.05648762, 0.25791484, 0.1781746, 0.045209818) * inp_2_1_2; + result7 += M4(-0.06814371, 0.07210286, 0.030608222, 0.037311446, 0.00046949348, -0.057223305, -0.11727483, -0.1063119, 0.04792679, -0.09716068, 0.0592881, -0.031629097, -0.061547503, 0.22438234, -0.1489272, 0.22301634) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.058534563, -0.08267206, -0.21695007, 0.18747747, 0.01720489, -0.023020057, 0.15023144, -0.09669919, 0.02729793, 0.112311065, -0.25918895, 0.23445289, 0.16632354, -0.17474616, 0.07854869, -0.16751495) * inp_3_0_0; + result0 += M4(0.012020389, -0.15200801, 0.04013857, 0.26122445, 0.09409885, 0.08966963, 0.06217526, -0.010806612, -0.13151187, -0.058675487, -0.043021776, 0.15083072, 0.22495933, 0.22885889, 0.37611896, -0.30112284) * inp_3_1_0; + result0 += M4(-0.055003427, -0.001034001, 0.06553042, -0.014416176, 0.023581995, 0.124274336, -0.055304617, -0.017361103, -0.003999049, -0.09707139, -0.15993911, 
0.12694289, 0.17240335, -0.025398273, 0.04965644, -0.060369372) * inp_3_2_0; + result0 += M4(-0.07267709, 0.16061275, -0.021404492, 0.10077634, -0.3484654, 0.13236116, -0.018846026, 0.07820672, 0.06836986, 0.01328081, 0.05409976, 0.15940472, 0.086702205, -0.16181922, -0.063018546, -0.15048644) * inp_3_0_1; + result0 += M4(-0.16778232, -0.16919425, 0.32210878, 0.30770034, -0.10026125, 0.50551236, 0.15202284, 0.25049973, 0.08387161, -0.09930171, -0.04543509, -0.007290529, 0.13551292, 0.21227215, 0.16385181, -0.01219463) * inp_3_1_1; + result0 += M4(-0.037734684, -0.015427, 0.034323335, 0.025884293, -0.0360236, 0.02818554, 0.13304651, 0.29946503, -0.054653373, 0.031857137, 0.33291104, 0.14177413, 0.07515797, -0.07744632, -0.048287045, 0.09698878) * inp_3_2_1; + result0 += M4(0.0342761, 0.112171024, 0.009366116, 0.008959323, 0.08427646, -0.08984434, 0.13423735, 0.24364305, 0.041010898, 0.11919051, 0.02213782, 0.26701698, -0.006046792, -0.01970774, 0.022577964, -0.016565017) * inp_3_0_2; + result0 += M4(-0.0030109207, 0.060629986, 0.05698365, 0.07006874, -0.012725099, -0.124994144, -0.14158584, 0.24625891, 0.006550355, -0.10211694, 0.028206406, 0.04633239, -0.021093545, 0.052575707, 0.079059996, -0.051767126) * inp_3_1_2; + result0 += M4(0.021437345, 0.024834415, -0.002384857, -0.009486033, 0.064322285, -0.0024126503, 0.1333588, -0.049991407, 0.016967114, 0.08633528, 0.20782527, -0.011901945, 0.04061016, 0.0820391, -0.03549982, -0.027612321) * inp_3_2_2; + result1 += M4(-0.029237268, -0.2418947, 0.077807836, 0.0018296613, -0.026609482, -0.09135472, 0.18337487, 0.11731806, 0.26917633, -0.00089886, -0.011611949, 0.08119477, 0.057736166, -0.037667263, -0.015940651, -0.22332524) * inp_3_0_0; + result1 += M4(-0.3137956, -0.027481757, 0.15234096, -0.47996718, -0.018590739, 0.07049502, -0.14070325, -0.28256378, -0.12689131, 0.21311055, 0.016073389, -0.09805352, -0.012172061, 0.00086137524, -0.40366814, 0.20937651) * inp_3_1_0; + result1 += M4(-0.00936943, -0.04331876, 
-0.04187395, -0.12605527, 0.1339605, 0.13177249, -0.052429, 0.17844312, -0.06493971, -0.046479378, -0.018690975, 0.013983085, -0.051454343, -0.06899801, -0.041142467, 0.03337519) * inp_3_2_0; + result1 += M4(0.032279886, -0.05677682, 0.112556025, -0.06994456, -0.03957209, 0.23136573, 0.32293984, 0.0015096692, 0.1875921, 0.14868146, 0.03746478, 0.09948961, -0.20458047, -0.024151998, -0.058608137, -0.247089) * inp_3_0_1; + result1 += M4(-0.077878065, -0.16984342, 0.01351916, 0.033311576, -0.017209582, 0.06575362, -0.30508158, -0.63436157, -0.03780812, 0.082569815, -0.3485529, 0.40524092, -0.0039053683, 0.016290994, -0.2491248, -0.015534804) * inp_3_1_1; + result1 += M4(0.014489613, 0.035196666, -0.0538664, 0.010219747, -0.055602953, -0.035206888, 0.11388407, 0.4155998, 0.071787044, 0.10476, -0.1130021, 0.43028483, 0.010997933, 0.033939384, 0.02075493, -0.036647473) * inp_3_2_1; + result1 += M4(0.027308658, -0.00040981415, -0.12508406, 0.033449247, 0.40246475, 0.26886454, 0.0063552144, -0.09522072, 0.31523877, 0.08121834, 0.18689191, 0.101244755, -0.21848562, -0.053225577, -0.007637685, -0.0023690152) * inp_3_0_2; + result1 += M4(-0.030737527, -0.051708885, 0.03739987, -0.10389346, -0.044733025, 0.18452685, -0.0024768233, -0.2882316, -0.06661157, -0.26502532, 0.036552217, 0.09694698, -0.018443136, -0.03144525, -0.01704141, -0.1724951) * inp_3_1_2; + result1 += M4(-0.004441743, -0.009387335, -0.0119206505, 0.064697534, -0.020856265, -0.060958643, 0.03542067, 0.54511946, -0.15183821, 0.017029079, -0.073157966, 0.18637957, 0.011311436, -0.021767158, -0.032159485, -0.03869201) * inp_3_2_2; + result2 += M4(-0.38375163, 0.10435395, -0.114343464, -0.059575524, 0.13168043, -0.017272063, 0.030857636, 0.0011205697, 0.08873851, -0.015325343, 0.10864721, -0.01915886, 0.0049161534, -0.012174386, 0.14130558, 0.014378584) * inp_3_0_0; + result2 += M4(-0.39819527, 0.24949522, 0.058650177, -0.14375944, -0.014436218, -0.087249786, 0.015214913, 0.10094625, 0.068316616, 0.18515319, 
0.05541381, -0.077787705, 0.20808883, -0.096720874, 0.08026607, 0.24277318) * inp_3_1_0; + result2 += M4(-0.046407808, 0.002938751, 0.029356267, -0.08213436, 0.09551396, -0.030745754, 0.02229406, -0.01108846, 0.017611383, 0.023462726, 0.085913725, -0.031210227, -0.015188519, -0.088449866, -0.09824411, 0.11063738) * inp_3_2_0; + result2 += M4(-0.765912, 0.1923157, -0.11000628, -0.18087971, 0.29408768, -0.03546295, 0.37590536, 0.092811055, 0.033951934, 0.023527252, 0.09871188, 0.029839018, 0.048000067, 0.10560536, 0.1679474, 0.11155312) * inp_3_0_1; + result2 += M4(-0.65977836, 0.35553306, 0.09419664, -0.06708742, -0.013754005, -0.08726835, -0.17867324, 0.12793075, 0.269035, -0.17282525, 0.24977434, 0.11201502, 0.32118317, -0.2285605, 0.1508041, 0.26154104) * inp_3_1_1; + result2 += M4(-0.12370831, 0.050049916, 0.026183298, -0.063300624, -0.09115904, 0.10956271, 0.10879264, 0.10794349, 0.22316198, -0.045302544, -0.052448425, -0.16525525, -0.033937674, -0.031299837, 0.03792323, 0.119254544) * inp_3_2_1; + result2 += M4(-0.21032552, -0.04836635, 0.059867993, -0.022304572, 0.1426408, 0.02585757, 0.1508405, -0.21335323, -0.017627332, -0.0023905688, 0.11327619, 0.08282954, -0.0017292941, 0.01570474, -0.01105298, 0.043770354) * inp_3_0_2; + result2 += M4(-0.17816527, 0.011505419, 0.07443795, -0.025017885, 0.14794275, 0.19249506, 0.2712048, -0.23908898, 0.17727052, 0.07436263, 0.13082689, 0.061943088, 0.19826703, -0.0071340753, 0.11247669, 0.14090584) * inp_3_1_2; + result2 += M4(-0.026698045, 0.001220745, 0.048322555, 0.048156608, -0.60087246, -0.032335244, 0.2670392, -0.048305262, 0.11375207, -0.0033873676, 0.06327501, 0.11530058, 0.01065437, -0.06694463, 0.051224068, 0.120340146) * inp_3_2_2; + result3 += M4(0.07284516, -0.23217297, -0.002598979, 0.09973781, 0.13975388, -0.027732007, 0.02992973, -0.07000489, -0.018336449, -0.12717557, -0.009848464, 0.16519193, -0.27603018, -0.011629583, -0.016334843, -0.038882125) * inp_3_0_0; + result3 += M4(0.19739366, 0.029705213, 
0.022679528, 0.1480558, 0.04137465, 0.05263497, -0.00777127, -0.016311573, 0.111884736, -0.01672714, 0.2099409, 0.22467138, -0.0060768165, -0.21767901, -0.06799207, 0.051756307) * inp_3_1_0; + result3 += M4(-0.024204006, -0.03449814, 0.026007997, -0.03219569, -0.11151443, -0.0038574652, 0.08009479, -0.11074792, 0.15369965, 0.016292907, 0.07730027, 0.08438262, 0.114305794, 0.09139034, 0.025949497, -0.062349193) * inp_3_2_0; + result3 += M4(0.30558234, -0.22188488, -0.12635924, -0.6348308, -0.23768991, 0.024640478, -0.022938564, -0.11173081, 0.21153735, -0.15561613, 0.16058336, 0.17775838, -0.36279455, 0.12208751, -0.1062096, 0.26480907) * inp_3_0_1; + result3 += M4(0.0622446, 0.014908604, 0.07157153, -0.5516658, 0.022517314, 0.2458744, -0.12926257, 0.17871156, 0.25097668, 0.20877951, 0.24111104, 0.114362665, 0.13183704, -0.090798, 0.22634578, 0.18340142) * inp_3_1_1; + result3 += M4(-0.00920285, -0.0685326, -0.189622, 0.053395983, 0.018070891, 0.17210516, 0.06269431, -0.06509988, 0.21491195, 0.006693742, -0.06663099, 0.05911801, 0.100524455, 0.122591406, 0.13012399, -0.23824808) * inp_3_2_1; + result3 += M4(0.048976675, -0.27702254, -0.027180698, -0.6654293, -0.20287286, -0.07013911, 0.03208923, -0.17066808, 0.22477177, -0.14781, 0.11822354, 0.066514835, -0.13554192, 0.09925652, -0.07581494, 0.18332276) * inp_3_0_2; + result3 += M4(-0.021756848, -0.09349331, 0.013657232, -0.5790786, -0.13597181, -0.09976687, 0.06201825, 0.4401853, 0.06481538, 0.13982825, 0.20622955, 0.25086674, -0.06165809, -0.041849703, 0.10213637, 0.12482804) * inp_3_1_2; + result3 += M4(0.018142967, 0.0038623998, 0.007037394, 0.00059219054, 0.3152469, 0.16650225, -0.068798795, 0.26503477, 0.10805224, -0.03642072, 0.03871398, 0.18378225, 0.11262567, -0.0010103745, 0.09697435, -0.09409963) * inp_3_2_2; + result4 += M4(0.17474085, -0.04980379, 0.15372992, 0.14411943, -0.011710013, 0.13538133, -0.11486645, -0.14619313, -0.07880484, -0.06900089, 0.42904586, 0.17555922, -0.18244074, -0.05201728, 
-0.20749576, -0.01042585) * inp_3_0_0; + result4 += M4(0.025384119, -0.25608438, 0.23688622, 0.15146211, -0.010784338, -0.27337, 0.0827411, -0.071610026, -0.092635326, 0.12953115, 0.26450783, 0.2987299, -0.14343199, -0.23712218, -0.14002666, 0.057215285) * inp_3_1_0; + result4 += M4(0.015038858, -0.03813447, 0.056175046, 0.04263707, 0.0118990615, 0.31871966, -0.19225664, -0.11234522, -0.04105065, 0.13085602, 0.2557004, 0.14220361, 0.011485285, 0.05361946, 0.10180392, 0.03490709) * inp_3_2_0; + result4 += M4(0.06076774, -0.37149101, 0.025851754, -0.12047196, -0.035953376, 0.47370252, 0.16423027, -0.0673372, -0.12655781, -0.06616689, 0.37357056, 0.18191256, -0.07700886, 0.21954961, -0.089262374, 0.30424225) * inp_3_0_1; + result4 += M4(0.14625123, -0.15502419, 0.054219056, -0.17736357, 0.13664928, -0.13019273, -0.27580035, 0.0521699, -0.2446673, 0.34599185, 0.027042225, 0.06351339, -0.07497566, -0.49129882, -0.07385034, -0.087985136) * inp_3_1_1; + result4 += M4(0.0019628303, 0.00013280261, 0.06443812, 0.010985561, -0.12019817, 0.33791456, 0.2585265, 0.07602394, -0.045397405, 0.027223555, 0.028554142, -0.040651303, -0.018324032, -0.15908504, 0.010486933, -0.07503881) * inp_3_2_1; + result4 += M4(0.038083274, -0.18235637, -0.066698745, -0.5058892, -0.067678556, 0.35296583, 0.16949536, -0.16359212, -0.21453044, -0.032573298, 0.10404396, -0.049900003, -0.06855341, 0.120962285, -0.06626313, 0.15220198) * inp_3_0_2; + result4 += M4(0.0109871775, -0.10816531, -0.063197896, -0.33376604, -0.04669717, -0.09676746, -0.04275124, -0.056628846, -0.19187354, 0.25965554, 0.14733441, 0.11788299, -0.11146972, -0.06829089, 0.01073942, 0.11837586) * inp_3_1_2; + result4 += M4(-0.019016001, -0.020372467, -0.02291969, 0.022698285, -0.11680618, 0.15217352, 0.3282598, -0.0439835, -0.12201311, 0.069069184, 0.149647, 0.039209466, -0.037240166, -0.10747331, -0.02172351, -0.08826641) * inp_3_2_2; + result5 += M4(0.019840166, -0.06181727, 0.14222327, 0.17917559, -0.035763416, -0.12893444, 
-0.084954835, -0.043033402, -0.068251446, -0.002812812, -0.107642114, 0.24211544, -0.12643388, -0.09841472, -0.15779707, -0.6051122) * inp_3_0_0; + result5 += M4(0.05454774, 0.07682123, 0.034559008, -0.24346364, 0.020827362, -0.06584504, -0.0056850114, -0.053709242, -0.03188751, 0.11759836, -0.1178612, 0.23259772, -0.0539883, -0.08213933, -0.07912998, -0.14198215) * inp_3_1_0; + result5 += M4(0.12078032, -0.10450228, 0.03827481, -0.06621465, 0.04285826, -0.124861315, -0.0046536014, 0.11013294, -0.03810551, 0.14046112, 0.0005526692, 0.14568546, 0.07775516, 0.10267673, 0.14614473, 0.28691715) * inp_3_2_0; + result5 += M4(-0.03217419, 0.25927565, 0.071673594, -0.08457725, 0.1546867, -0.010579179, -0.001387946, 0.09392151, -0.12921023, -0.028091574, -0.26816922, 0.084991366, 0.056670528, -0.1504099, -0.040755834, -0.4869911) * inp_3_0_1; + result5 += M4(0.0013995785, 0.23561674, 0.25974888, -0.14824633, 0.12471756, -0.14643112, -0.009456599, -0.14839844, -0.11986328, 0.063610844, -0.30340317, 0.044824358, 0.026667086, 0.072877906, 0.05555367, -0.41920543) * inp_3_1_1; + result5 += M4(0.097624615, 0.014444517, -0.0136684, -0.027330529, 0.14607185, 0.46903804, 0.15576625, 0.06154415, -0.016773771, 0.09159693, -0.17241305, -0.042314645, -0.079406634, 0.124126114, 0.06438929, -0.09387847) * inp_3_2_1; + result5 += M4(-0.11906939, 0.02034849, 0.030269135, -0.17779353, -0.010973351, 0.1639962, 0.23628642, 0.18063055, -0.15246627, -0.023771457, -0.28708884, -0.18488741, 0.120001964, 0.018080931, -0.06272283, -0.04118312) * inp_3_0_2; + result5 += M4(-0.12625262, 0.008316212, -0.04138115, -0.095510066, 0.26595443, -0.2009985, 0.25843897, -0.031679258, -0.26262575, 0.030705791, -0.22027838, -0.12344691, 0.07513727, 0.010777727, -0.06073883, -0.012409973) * inp_3_1_2; + result5 += M4(-0.0034503017, 0.008154137, 0.012336985, -0.061151337, -0.18714279, 0.017955994, 0.11175068, -0.10800975, -0.083521836, 0.060158, -0.08686018, 0.042005144, 0.022592612, 0.0012510516, -0.01516854, 
-0.097913854) * inp_3_2_2; + result6 += M4(-0.0017869193, -0.22986798, -0.022328213, 0.03801556, -0.050030906, -0.045862682, -0.015420725, -0.015010319, -0.032529578, 0.111728564, 0.0760141, 0.087046, 0.02885678, 0.20267792, 0.1885614, -0.09043646) * inp_3_0_0; + result6 += M4(-0.16050087, 0.022562942, -0.18160018, 0.06610709, -0.03135219, 0.085650764, 0.09794036, -0.059744872, -0.21719149, 0.17258601, 0.0049531157, 0.075172625, 0.11409518, 0.008569935, 0.17913039, 0.037813663) * inp_3_1_0; + result6 += M4(0.037501205, -0.0263542, 0.015046902, 0.029913085, -0.08123129, 0.106906526, 0.12852493, -0.012850448, -0.21055417, 0.15080416, -0.07958182, 0.0025546588, 0.097868614, -0.0024404689, -0.15359125, -0.0035282439) * inp_3_2_0; + result6 += M4(-0.14149998, 0.11445414, 0.0044851066, 0.049062133, -0.036440693, -0.068187654, 0.2357466, 0.008546502, -0.124260455, 0.17017806, 0.087895915, -0.0610435, 0.11334801, 0.19967702, 0.039386716, -0.03207605) * inp_3_0_1; + result6 += M4(-0.10868707, -0.1830082, -0.21345106, 0.077289596, -0.07365736, 0.4673585, 0.35748494, -0.08752111, -0.15984589, 0.47734797, -0.09837698, 0.06799788, 0.064178385, -0.4400765, 0.079284, 0.02338205) * inp_3_1_1; + result6 += M4(-0.02154515, -0.013499519, 0.028091516, 0.009506083, 0.03623487, 0.10572431, -0.122433506, 0.047206417, -0.07241629, 0.35506696, 0.02883558, -0.07923319, 0.083307266, -0.1302157, -0.07361634, -0.015637545) * inp_3_2_1; + result6 += M4(-0.084878385, 0.027462108, 0.04622544, -0.0075728325, 0.073470384, -0.2892803, -0.31980026, 0.27047557, -0.11455268, -0.00838944, 0.014691762, 0.037093077, 0.035062805, -0.06846471, 0.0557262, -0.008442687) * inp_3_0_2; + result6 += M4(-0.12246098, -0.103739195, -0.0058314125, 0.016955493, 0.318048, -0.00018005638, -0.306629, -0.07962692, -0.1484962, -0.12201055, -0.08032803, 0.014402754, 0.007292962, -0.31601855, 0.10337287, -0.010671918) * inp_3_1_2; + result6 += M4(0.027842296, -0.0038718951, 0.04369523, 0.02405883, -0.053789336, -0.0279039, 
-0.14543176, 0.09750471, -0.055104915, 0.16526844, -0.0060611386, 0.016362505, 0.024724854, -0.040237606, 0.0015387846, -0.01970051) * inp_3_2_2; + result7 += M4(0.07799608, -0.03756142, -0.15946124, 0.030217864, 0.08607164, 0.17471892, 0.08624368, 0.0045786146, 0.07044087, 0.028068539, -0.06528517, 0.025315324, 0.030368216, 0.01471786, -0.648812, -0.009863933) * inp_3_0_0; + result7 += M4(0.02292787, -0.017326167, -0.07848829, 0.03720695, -0.034441825, 0.02965932, -0.21812427, -0.07649149, -0.04161487, -0.2019438, -0.23876616, 0.04698337, -0.034467332, 0.18653259, -0.36914194, 0.04170335) * inp_3_1_0; + result7 += M4(0.011701725, -0.016690679, -0.13723364, 0.043153375, 0.11420859, 0.1237593, 0.11257727, -0.017927894, 0.070698805, 0.013200926, -0.085107155, 0.08930653, 0.011315696, 0.05854115, -0.18638979, 0.033048) * inp_3_2_0; + result7 += M4(-0.008442322, 0.029425137, -0.25667918, 0.033553775, 0.19272333, 0.04340016, 0.07303243, 0.06513279, 0.052829947, 0.13275717, 0.35959122, 0.07377083, 0.030978408, -0.31547382, -0.20079869, 0.02423032) * inp_3_0_1; + result7 += M4(-0.048716236, 0.15976153, -0.14868331, 0.09602924, -0.101685226, 0.33166257, -0.5513272, 0.037471116, 0.0736064, -0.18596496, 0.53179204, 0.012391486, -0.042396203, 0.014146373, -0.72128665, -0.0101347305) * inp_3_1_1; + result7 += M4(0.008836737, 0.048219725, 0.06047796, 0.07236714, -0.15650013, 0.3703931, 0.011843346, 0.00947209, -0.08357066, -0.020797452, 0.4892843, 0.111511394, -0.0020968642, 0.036360387, -0.15283315, -0.0016491066) * inp_3_2_1; + result7 += M4(0.00902981, -0.20167586, -0.15373093, 0.02432798, -0.11945541, 0.08256757, 0.14022216, -0.110512376, -0.0626592, 0.014022612, 0.27587077, 0.09828396, 0.06361625, -0.15622514, 0.009687524, -0.039123245) * inp_3_0_2; + result7 += M4(-0.017314475, -0.05310819, -0.108744346, -0.015228726, -0.18041962, -0.6175114, -0.07958901, 0.100302145, -0.099540524, -0.15658498, 0.40941125, 0.040705808, -0.005762831, -0.037789654, -0.36949483, 
0.0025697378) * inp_3_1_2; + result7 += M4(0.0010597089, 0.040891714, 0.13572384, 0.012261106, -0.05278703, -0.18582681, -0.073954985, -0.016551588, -0.11223141, -0.08771503, 0.017168771, 0.06880364, 0.026438978, 0.08435423, 0.033355653, -0.00829886) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.04305409, 0.11176719, 0.08597714, 0.00049601786, -0.062116448, -0.017947877, -0.21897869, -0.022407915, -0.003971403, -0.17125294, 0.072130404, 0.07831358, 0.60045433, 0.4922693, 0.017562635, 1.2532773) * inp_4_0_0; + result0 += M4(-0.06263793, -0.10810063, 0.048341513, 0.033160172, -0.19500294, -0.04675883, -0.4002144, -0.14051639, 0.06720143, 0.22420949, 0.56135184, -0.08857201, -0.26179764, 0.28116164, -0.20511062, 0.009111406) * inp_4_1_0; + result0 += M4(-0.016187077, -0.08897449, 0.21898264, -0.00950795, -0.033877086, -0.13508922, -0.24069354, -0.15611845, 0.0008279733, 0.110152185, -0.028671898, 0.07176969, -0.31599745, -0.4928454, -0.013503589, -0.55562186) * inp_4_2_0; + result0 += M4(-0.05818953, 0.027291035, -0.052520476, -0.1955628, 0.017190797, -0.027439956, 0.067244, -0.019712083, 0.023169432, 0.05637902, -0.053515404, 0.25675163, 1.2109313, 1.7048917, -0.91695136, 2.1668386) * inp_4_0_1; + result0 += M4(0.20479065, 0.07864295, -0.04785691, 0.23942699, 0.49933773, 0.2936974, -0.8557609, -0.15096465, 0.39180985, -0.026214255, -0.32314906, -0.1414668, 0.0048528165, 0.44652796, -0.08378215, 1.3877233) * inp_4_1_1; + 
result0 += M4(-0.019790411, 0.004489421, -0.1839837, -0.076589614, 0.02528201, 0.17397436, -0.1297137, -0.061592605, 0.047706757, 0.32120365, -0.25539586, 0.3379385, -0.047388483, -0.95197576, -0.65991455, -0.4835222) * inp_4_2_1; + result0 += M4(0.023583742, 0.20350221, 0.03874766, -0.03570739, -0.01830487, 0.021995382, -0.022943925, 0.5269705, -0.01726829, 0.19895968, 0.0310699, 0.0841442, 0.27791443, 0.43230355, 0.9290483, 0.2149712) * inp_4_0_2; + result0 += M4(0.0698528, -0.095751725, -0.018925322, -0.17468323, 0.035944324, -0.015047672, 0.23744197, 0.39720836, 0.012356704, 0.03078174, -0.05721653, 0.057529688, -0.124955714, -0.7226543, 0.9914917, 0.11677116) * inp_4_1_2; + result0 += M4(-0.109197564, -0.059206225, 0.099042386, -0.031215744, 0.045129422, -0.047674976, 0.08938741, 0.04268483, 0.053480405, -0.09282501, 0.17190757, 0.33064157, -0.08043694, -0.5275766, 0.1736941, -0.35548675) * inp_4_2_2; + result1 += M4(0.115241274, 0.23834142, -0.22037292, -0.10773489, -0.20203483, 0.2564087, -0.12480241, -0.014368536, 0.09855736, 0.1417844, -0.09845811, 0.14975907, -0.46074733, 0.062055077, 0.24731185, -1.3025191) * inp_4_0_0; + result1 += M4(0.12858908, 0.056481436, 0.13710234, -0.032665927, -0.080657765, -0.23290908, 0.098453395, 0.12761988, 0.23997094, 0.3216201, -0.1042049, 0.28961274, -0.39917043, -0.20419855, 0.09971636, 0.6437219) * inp_4_1_0; + result1 += M4(0.086334385, 0.1389801, 0.01838412, -0.06806034, -0.046940796, -0.005889171, -0.027570356, -0.17938402, -0.01332321, 0.016332142, -0.024383062, 0.20279832, 0.22654916, 0.06664337, 0.32538632, -0.33960968) * inp_4_2_0; + result1 += M4(-0.013266585, 0.084680825, 0.11511902, -0.051530734, 0.19516058, 0.1262526, -0.15671806, 0.116464585, -0.6919797, -0.041155636, 0.40505388, 0.10380915, 1.0243481, -0.45496213, -1.023632, -0.38543403) * inp_4_0_1; + result1 += M4(-0.3199287, 0.10961233, 0.2809706, 0.13942754, -0.06333182, 0.2228361, 0.40465695, -0.004015398, -0.19529878, 0.21502659, -0.34753472, 
0.059127867, -0.15143098, -0.35828757, 0.45172203, -0.3196675) * inp_4_1_1; + result1 += M4(0.083587795, -0.06833488, 0.009357782, -0.14922418, 0.09992282, 0.15072636, 0.047865238, -0.19624999, -0.18515311, -0.3278566, -0.1259383, -0.2291827, 0.04791808, 0.0922475, -0.047212943, -0.21117374) * inp_4_2_1; + result1 += M4(0.29294783, 0.04636893, -0.030649351, 0.1589842, -0.033546854, 0.092204526, -0.3581079, -0.25244322, -0.14708053, 0.06940555, 0.14047131, 0.10408999, -0.07738764, 0.17149006, 1.2557439, 0.3894146) * inp_4_0_2; + result1 += M4(-0.089484476, -0.33820024, 0.20849167, 0.1614044, 0.13212253, 0.047157973, -0.51512915, -0.2746234, 0.23242816, 0.08945186, 0.19532014, -0.042705078, -0.19105509, -0.17811388, 0.010501524, -0.3545278) * inp_4_1_2; + result1 += M4(0.019447548, 0.007892576, 0.06607077, -0.104389586, -0.0975221, 0.064485066, -0.11721102, -0.08844911, -0.024724124, 0.12946258, -0.015253397, 0.055234097, 0.110158324, 0.05599077, 0.24299455, 0.22943555) * inp_4_2_2; + result2 += M4(0.06243231, -0.03080686, -0.010034511, 0.010906477, -0.083122596, -0.029972939, -0.1699356, -0.03393727, 0.07949472, -0.022816116, 0.24316265, -0.004902569, 0.27971682, 0.05745822, 0.086882725, 0.13561091) * inp_4_0_0; + result2 += M4(-0.03348177, 0.16825163, -0.2858046, 0.008476143, -0.050870344, 0.08688432, -0.036886882, 0.08342965, 0.15195124, -0.1400096, 0.24082322, -0.048991017, -0.16710205, 0.2213648, -0.28270057, 0.019434704) * inp_4_1_0; + result2 += M4(-0.021879468, 0.029086184, 0.06375903, -0.036705192, -0.07152258, -0.08405272, 0.009126181, 0.041362375, 0.010069433, -0.03296121, 0.051549606, 0.070626736, -0.0701935, -0.038468104, -0.20310104, 0.027696736) * inp_4_2_0; + result2 += M4(0.13280624, 0.0029688375, 0.063456334, -0.028322415, -0.2665115, -0.10824069, -0.11066845, -0.12142015, -0.13628188, -0.007641665, 0.11414588, -0.02057948, -0.15871942, -3.8885188, 1.58179, 0.10343098) * inp_4_0_1; + result2 += M4(0.040351696, -0.16582695, -0.17164497, -0.007849884, 
-0.20808913, 0.30068874, 0.0835827, -0.069587596, 0.03504311, -0.42582002, -0.16951635, -0.22155721, -0.45369977, 0.43222344, -0.4066853, 0.24775113) * inp_4_1_1; + result2 += M4(0.1143635, -0.016784213, 0.0472682, 0.027353937, -0.30716023, -0.070385255, 0.20868735, -0.15181156, 0.060414966, 0.051172152, 0.15772508, 0.6396605, -0.3225857, -0.06471235, -0.23874941, -0.044259693) * inp_4_2_1; + result2 += M4(0.10806135, 0.017882362, -0.042468145, 0.08220766, -0.12985216, -0.15932857, 0.28344554, 0.00066246133, 0.19643955, 0.04992641, 0.3398252, 0.12404135, -0.22131181, -0.20275827, 0.71895754, 0.33842087) * inp_4_0_2; + result2 += M4(-0.10851297, 0.38080224, -0.45152915, -0.085034646, 0.0716164, -0.29138008, -0.51535314, 0.08845703, 0.08584361, 0.22396721, 0.1635391, -0.32108584, 0.09885805, 0.8477584, -0.17397182, 0.3018451) * inp_4_1_2; + result2 += M4(-0.10493052, 0.08810675, -0.06452757, -0.1613554, -0.0011969488, 0.07247748, -0.33340722, 0.23338965, -0.19328506, 0.06157833, 0.14561516, 0.05837044, 0.074669376, -0.010393692, -0.16974366, 0.26621738) * inp_4_2_2; + result3 += M4(-0.22222115, 0.0074784025, 0.047398493, -0.043663613, -0.06080802, -0.078227445, 0.08049125, 0.004488113, 0.0991715, 0.036138956, -0.096216515, 0.12484699, -0.24911477, 0.6779984, 0.21604092, 0.77542776) * inp_4_0_0; + result3 += M4(0.030274367, 0.076183334, 0.031904638, -0.040991828, 0.061965287, -0.15433551, 0.094006486, 0.039096843, 0.024390098, 0.007882412, -0.0916322, -0.10465828, 1.0467867, 0.43756014, -0.45471016, 0.4175311) * inp_4_1_0; + result3 += M4(0.15954503, 0.028513957, -0.03199022, 0.028530428, -0.12293308, -0.03854867, -0.0066049723, -0.0062664445, 0.28839985, -0.02763895, 0.041259628, 0.08943823, -0.19038096, 0.25889587, 0.111525126, 0.41104788) * inp_4_2_0; + result3 += M4(0.041438863, 0.0803227, 0.16269784, 0.14344642, -0.20871715, -0.13722162, 0.19706678, -0.082898095, 0.10506128, 0.067395546, -0.123247206, -0.078830846, -0.5529698, 0.3499168, 0.19171025, -0.13291214) 
* inp_4_0_1; + result3 += M4(-0.021569727, 0.03996306, -0.09489145, 0.28711125, 0.21166669, 0.067331664, -0.061321113, 0.19850886, -0.3052251, 0.1652337, -0.059395615, -0.33339286, 0.044252418, 0.43579766, -0.10196087, -0.630944) * inp_4_1_1; + result3 += M4(-0.1560882, 0.023954758, 0.15639585, 0.314397, 0.04370558, -0.04073754, 0.098097526, -0.23425387, 0.006138961, 0.124991335, 0.3479183, -0.20222782, -0.27129135, 0.089798786, 0.031734347, 0.0014838318) * inp_4_2_1; + result3 += M4(0.1959224, -0.051791076, 0.11577392, 0.45096672, -0.30047828, -0.08729232, 0.33429983, 0.040639695, 0.043423086, -0.031868048, 0.04343922, -0.18168741, 0.9951363, 0.6779704, 0.19688551, 0.81282854) * inp_4_0_2; + result3 += M4(0.110027246, -0.10094923, -0.052526306, -0.12501228, -0.27323133, -0.4786127, -0.38895276, -0.94579303, 0.03283588, -0.18848437, 0.055940457, 0.35748008, -0.47208208, 0.49668717, 0.061124697, -0.9958602) * inp_4_1_2; + result3 += M4(-0.33333632, 0.105203375, -0.061146054, 0.31423125, 0.05308085, -0.013111337, 0.30190304, 0.64082, 0.0968669, 0.020935085, -0.002691396, 0.0055832, -0.2549382, 0.5169665, 0.05373311, 0.37135825) * inp_4_2_2; + result4 += M4(-0.018554613, -0.31538603, -0.027073208, -0.016269749, 0.08721572, -0.0978943, -0.11694246, 0.07132488, -0.1633322, -0.08412939, 0.060046867, 0.054399405, -0.24835192, -0.43097737, 0.6438047, 0.84883213) * inp_4_0_0; + result4 += M4(0.008297077, 0.3070949, 0.23559389, 0.10120678, 0.1063028, 0.14788942, -0.15700959, 0.21542779, -0.23130956, -0.15931411, 0.1638324, -0.24973845, -0.11564923, 0.5542824, 0.24268627, 0.90316206) * inp_4_1_0; + result4 += M4(-0.017849084, -0.19411187, -0.033079863, -0.062527016, 0.106704175, -0.17120638, -0.023030141, 0.033408403, -0.13115425, -0.032268446, 0.117338836, 0.057866845, -0.2980991, -0.111615874, -0.0158531, -0.5238175) * inp_4_2_0; + result4 += M4(-0.06477427, 0.17674847, 0.22984941, 0.27743047, 0.16878267, -0.21353288, 0.039101083, 0.0021998256, 0.0317513, 0.1677063, 
-0.048979975, -0.19397894, -1.6818529, 0.119567774, 0.20270815, -0.2815504) * inp_4_0_1; + result4 += M4(0.05881081, 0.026019238, 0.12755994, 0.31477025, 0.10886015, -0.18924402, 0.25566214, 0.22322816, -0.37583232, 0.21965338, -0.007663065, -0.38772458, 0.5927244, -0.51076436, 0.18607512, 0.053665124) * inp_4_1_1; + result4 += M4(-0.07345876, 0.13525315, 0.06285085, 0.14679123, 0.1347598, 0.040965777, -0.13841116, -0.116792835, -0.06403706, 0.1522847, -0.02061705, -0.032410428, -0.016132811, -0.42665946, -0.3188076, 0.27266532) * inp_4_2_1; + result4 += M4(-0.087834165, -0.07839777, 0.1506058, 0.3557263, 0.066434175, 0.13599882, 0.110494606, -0.20529054, -0.09943617, -0.2899718, -0.095053196, 0.16347927, 0.15770288, -0.30951142, 0.76602536, 0.3098032) * inp_4_0_2; + result4 += M4(0.27171537, 0.088698454, 0.024937956, 0.05871026, -0.3523191, 0.29500192, 0.11641451, -0.25327176, 0.05277166, -0.3232964, -0.09708374, 0.04349622, 0.23741995, -0.71324193, 0.1851881, -0.09442719) * inp_4_1_2; + result4 += M4(0.036605358, 0.15635848, -0.023374999, 0.30927876, -0.029212039, 0.14914301, 0.2779765, -0.010274902, -0.09040753, -0.21608385, -0.13206193, 0.030652693, -0.1215538, 0.38372636, 0.43953812, 0.30959544) * inp_4_2_2; + result5 += M4(-0.02372011, -0.014935471, 0.0046966528, 0.041532308, -0.08713677, 0.102717265, 0.084658965, -0.21433803, -0.088726446, 0.07258954, -0.1777257, -0.1785439, -0.20974338, 0.63156265, 0.09205572, -0.24030016) * inp_4_0_0; + result5 += M4(0.14261784, 0.021301309, 0.016872916, 0.30446127, -0.09667691, 0.12914002, 0.09567189, 0.022265786, -0.111078255, 0.044935968, -0.14371537, -0.016974835, 0.18495229, 0.14913443, 0.030482247, 0.120692655) * inp_4_1_0; + result5 += M4(-0.044102244, -0.091261394, -0.033437748, -0.30377164, -0.039902624, -0.0713258, 0.12725319, -0.20821251, 0.05562083, 0.18455294, -0.112763606, 0.13647695, -0.43052682, -0.08831913, 0.19765604, -0.49446633) * inp_4_2_0; + result5 += M4(-0.020785145, -0.050931253, -0.08109034, 
0.05910568, -0.0062823356, 0.3255998, 0.14434633, 0.39494473, 0.12303079, -0.08310123, -0.021128759, 0.21541841, -1.9671965, -0.7371834, -0.5168264, -0.18985191) * inp_4_0_1; + result5 += M4(0.027101878, -0.08842568, -0.012144593, 0.08992351, -0.020138465, 0.3067692, 0.09032445, -0.017230976, -0.14870377, -0.37536424, -0.2890627, 0.08392149, 0.23425648, 0.91296816, 0.17762998, 0.23526564) * inp_4_1_1; + result5 += M4(0.0672514, 0.018849773, -0.05773434, 0.017648185, 0.09298665, 0.010716047, 0.06307072, 0.006801315, 0.07954308, 0.23055385, 0.0393071, 0.35691229, 0.065422736, -0.06471603, 0.33816966, -0.471639) * inp_4_2_1; + result5 += M4(-0.08225651, 0.05632306, -0.035111938, -0.030768128, -0.24232209, -0.16741686, 0.15765136, 0.2368801, -0.01259822, 0.053519137, -0.045613293, -0.042108674, -0.61746305, 0.56319, -0.23051819, 0.197345) * inp_4_0_2; + result5 += M4(-0.20756823, 0.38793558, 0.14884292, -0.007983229, -0.027410332, -0.60050946, -0.28704426, 0.27561533, -0.16390233, 0.12511982, 0.22906592, 0.22610174, 0.50863, 0.36241955, -0.10465414, 0.44608098) * inp_4_1_2; + result5 += M4(-0.06989171, -0.028340604, 0.09668498, 0.0348285, -0.0067173922, 0.07211928, -0.04110069, 0.2631417, 0.10073734, 0.04803034, 0.044985283, -0.002657226, 0.2764329, 0.20462798, 0.08578274, 0.31915313) * inp_4_2_2; + result6 += M4(0.032785777, 0.15885757, -0.027589627, 0.016733928, 0.029733058, -0.06476136, 0.0021533875, -0.066802375, 0.008806604, -0.16958116, 0.02088448, 0.0010474634, -0.29112884, -1.6132256, -1.7260915, 0.34106126) * inp_4_0_0; + result6 += M4(0.12322075, -0.10652362, -0.08984651, 0.013572062, 0.08170077, 0.04724855, -0.010108016, -0.037087526, 0.029392263, 0.1821705, 0.105637565, -0.019256163, -0.56992877, 1.0325651, -0.03334818, 0.14209521) * inp_4_1_0; + result6 += M4(-0.052494686, -0.105625585, 0.019894024, -0.027618747, 0.03428332, -0.09801582, -0.030065225, -0.0061193993, -0.012288469, 0.16192077, 0.033170305, 0.01367951, -0.1779692, -0.38380915, 0.08621929, 
-0.062460866) * inp_4_2_0; + result6 += M4(0.0368347, 0.12542813, 0.04380804, -0.033293262, 0.023384377, -0.016387435, -0.536373, 0.04929447, -0.097531185, 0.0028912555, -0.1794702, 0.037355762, -0.60289866, 0.07661829, -2.9835203, 0.29708284) * inp_4_0_1; + result6 += M4(-0.078338705, 0.007893033, -0.26153123, -0.08710498, -0.19241379, 0.29445362, -0.9674952, 0.07221217, -0.03219465, 0.46199805, 0.66272104, -0.18116875, -0.3322162, -1.213149, -1.0827179, 0.23517527) * inp_4_1_1; + result6 += M4(0.027267402, 0.08066793, 0.011767587, -0.032864526, 0.20028964, 0.08806489, 0.24974431, 0.0219503, -0.023652226, 0.2216681, -0.13682073, 0.045651093, -0.46100193, 0.8369607, 0.23994556, 0.07360858) * inp_4_2_1; + result6 += M4(-0.054726627, 0.10524355, -0.04689709, 0.04616609, -0.22773783, 0.45156208, -0.05400684, 0.22083044, -0.17462498, -0.16437173, -0.26941505, 0.15800458, -0.13797864, -2.6323333, -1.5196991, 0.04762208) * inp_4_0_2; + result6 += M4(-0.13177747, 0.15229201, -0.7652503, 0.10133035, 0.21490802, 0.042347305, 0.26624078, -0.22924802, -0.48565182, 0.016563121, 0.0045131897, 0.008790221, -0.10966729, 1.0263358, -0.352884, 0.47062835) * inp_4_1_2; + result6 += M4(-0.023600928, 0.22463967, -0.042015925, -0.0233899, -0.041405104, -0.1937879, -0.36887828, -0.0052565024, -0.06255296, 0.037563305, -0.17711361, 0.05712629, 0.10749479, 0.7987707, 0.19939129, 0.16435558) * inp_4_2_2; + result7 += M4(-0.004418903, 0.3166235, 0.29223296, 0.015304121, 0.08466793, -0.18584673, -0.06541433, -0.02270776, 0.009344044, 0.20567061, 0.39762345, 0.042079635, -0.26761764, -0.82151717, -0.4652876, 0.506165) * inp_4_0_0; + result7 += M4(-0.04465701, 0.4396988, 0.5603336, 0.0051679043, 0.13228583, -0.016537944, -0.28920653, 0.007170126, 0.094849035, -0.0015922618, 0.67430943, 0.039542858, 0.75927895, -0.6441329, 0.26150444, 0.6896651) * inp_4_1_0; + result7 += M4(-0.12183013, 0.4683825, 0.21179545, -0.016460383, 0.092247896, -0.09603741, -0.13345097, 0.01408285, -0.00270894, 
0.20367518, 0.076567546, -0.00911101, 0.32144699, -0.16310102, 0.5939863, 0.13743041) * inp_4_2_0; + result7 += M4(-0.005855817, 0.21719484, 0.113287, 0.03918942, 0.053082608, 0.10152378, -0.15179963, -0.039251637, 0.052032035, -0.22566451, -0.063187204, 0.0036690927, 0.9743889, -1.3120145, -0.8437327, 1.260124) * inp_4_0_1; + result7 += M4(0.08126965, 0.17834574, 0.4298001, -0.036700815, 0.25315952, -0.14485209, -0.41929123, 0.35981572, -0.047610704, -0.11161931, -0.1125463, -0.0064353365, 0.15277267, -0.31722865, 0.10171603, 0.9509688) * inp_4_1_1; + result7 += M4(0.049401242, 0.045618303, 0.08995752, -0.04812938, 0.29819807, -0.36165085, -0.3333235, -0.068012096, -0.06253801, -0.1752275, -0.09843542, -0.05615687, -0.23092799, 0.15508914, 0.0968813, 0.07054126) * inp_4_2_1; + result7 += M4(-0.06192428, 0.25644004, 0.05498207, 0.037272707, 0.028004821, 0.06913183, -0.15415372, -0.06578213, -0.045622293, -0.3174076, -0.043959387, 0.0038883523, -0.04896643, 0.0067820773, -1.111823, 0.97609) * inp_4_0_2; + result7 += M4(-0.2121365, 0.5326121, 0.21101592, 0.09105239, 0.023586927, 0.22343849, -0.14279713, -0.095309116, -0.019170366, -0.09621605, -0.05418587, 0.08818929, -0.11956935, -0.3027655, 0.33258468, 0.67414373) * inp_4_1_2; + result7 += M4(-0.031838927, 0.13877393, 0.17086424, 0.06789686, 0.14482678, 0.64110893, -0.18934365, -0.11943048, -0.09563664, 0.039406456, 0.10457144, -0.035684735, -0.11465652, -0.069124416, -0.38361502, 0.34649462) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 
inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.032165144, -0.17283043, 0.40634465, 0.18554355, -0.03646573, 0.16061564, 0.1202025, 0.13494422, 0.03973842, 0.012507408, -0.03709211, 0.097898535, -0.022682887, -0.042406686, -0.158498, -0.021587644) * inp_5_0_0; + result0 += M4(-0.061221074, 0.4302052, -0.017923988, -0.049919378, -0.04308044, 0.051651303, -0.031040499, 0.107649356, -0.014500954, 0.3040428, -0.1764697, 0.2050797, 0.047170892, -0.040330313, -0.4301044, 0.383825) * inp_5_1_0; + result0 += M4(0.06048482, -0.103105925, -0.026729293, -0.09565454, -0.059778493, 0.0039278227, -0.28696537, 0.092242114, -0.10437447, -0.021426082, -0.17093132, 0.05321713, 0.015657196, -0.08444574, 0.09244955, -0.011346713) * inp_5_2_0; + result0 += M4(-0.065622956, -1.0223327, 0.18716943, 0.39013413, 3.759452e-05, -0.008561076, 0.036871698, 0.23893104, 0.04100186, 0.18658964, 0.06566288, 0.13253917, 0.026072484, 0.15335394, -0.16708277, -0.06232867) * inp_5_0_1; + result0 += M4(0.0705219, 0.2731388, 0.37419394, -0.5099221, 0.10106326, -0.04581044, 0.08015889, 0.03420968, 0.105513, -0.12692529, -0.032456324, -0.36409527, 0.09334486, -0.12180118, 0.051589683, -0.16843452) * inp_5_1_1; + result0 += M4(-0.02791653, -0.073268086, 0.08332121, -0.104257494, -0.05604274, 0.117989816, 0.1395331, 0.23207246, 0.014246145, -0.20598823, 0.33341828, 0.23594002, 0.06164089, 0.23849802, -0.24719124, 0.16600807) * inp_5_2_1; + result0 += M4(-0.017438488, -0.11099849, 0.04943488, 0.022647617, 0.058134593, 0.13425589, 0.116507016, -0.026565833, 0.03181883, 0.03217316, -0.013940923, 0.09611051, -0.0032853952, 0.052377317, -0.057842232, -0.05447562) * inp_5_0_2; + result0 += M4(0.06765013, 0.13481544, -0.048973545, -0.2124814, 0.027399477, 0.10596413, 0.15481697, 0.21284012, -0.036326382, 0.050706357, -0.05354311, -0.091235146, -0.015660161, 0.26561028, 0.10215399, 0.2868995) * inp_5_1_2; + result0 += M4(-0.04957627, -0.048332002, -0.016767919, -0.09268265, -0.0036624842, 
0.09760619, 0.0975638, -0.0022976487, 0.032292455, -0.064868934, -0.123962924, 0.05621701, -0.0035493325, -0.03155808, 0.04369656, 0.14986138) * inp_5_2_2; + result1 += M4(-0.13882595, 0.026293863, 0.19750905, -0.013672408, 0.0857836, 0.044011034, 0.043221448, -0.030713022, -0.093520366, -0.1585751, 0.12062129, -0.08471291, 0.15737423, 0.109550856, 0.014284752, 0.054470185) * inp_5_0_0; + result1 += M4(0.25198418, -0.0902725, -0.027173793, -0.68578213, -0.05146121, 0.09703619, 0.22356944, 0.088729665, -0.20296568, 0.216776, 0.09760393, -0.17919743, -0.31320816, -0.11960541, -0.015387656, -0.15049535) * inp_5_1_0; + result1 += M4(0.14004284, 0.06771928, -0.043470144, -0.043430574, 0.01414718, -0.09780925, 0.09684625, -0.14533332, -0.031170845, -0.05573361, 0.0725194, -0.028513705, -0.1524789, -0.00488204, 0.06385702, -0.12565415) * inp_5_2_0; + result1 += M4(-0.5980765, -0.10799803, 0.014967883, -0.008653867, 0.094177134, 0.09414159, -0.00071129476, 0.14932473, 0.13517241, -0.059837095, -0.011171581, -0.23530217, 0.21400566, -0.013023068, 0.09824032, -0.038958725) * inp_5_0_1; + result1 += M4(-0.028823052, 0.11022507, -0.1449101, 0.3164187, -0.07676177, 0.056961577, 0.187237, -0.027592823, -0.015379031, 0.08239875, -0.05506426, 0.001831446, -0.010472539, 0.32377413, 0.18965952, -0.023738606) * inp_5_1_1; + result1 += M4(0.09264047, -0.0029376545, 0.021067226, 0.0608879, -0.082351126, 0.05936524, 0.036029242, 0.09726498, 0.010211812, 0.088664204, -0.022089057, -0.098787196, -0.12641083, 0.050763812, -0.058340017, -0.030372087) * inp_5_2_1; + result1 += M4(0.15021048, -0.13689055, -0.01343731, -0.43789294, 0.051746387, 0.07769025, -0.028072603, 0.032349005, 0.08593159, -0.023610476, -0.16594267, -0.10593114, 0.08988229, 0.065051965, 0.047421977, -0.10344295) * inp_5_0_2; + result1 += M4(-0.027393915, -0.20911823, -0.14861438, 0.07305741, 0.010071254, -0.006128178, 0.041901074, -0.04421154, 0.09441486, -0.00011363394, -0.091649316, -0.09320238, -0.09316372, -0.189048, 
-0.12609997, 0.0780263) * inp_5_1_2; + result1 += M4(-0.0013726715, -0.009078485, -0.023953171, -0.1463101, -0.0006862536, -0.0008995612, 0.10402892, -0.092954285, -0.03070975, -0.049529374, 0.065487094, 0.07884637, -0.04302176, 0.07587188, 0.0020856916, -0.08507492) * inp_5_2_2; + result2 += M4(0.10301719, -0.022910483, -0.06746284, 0.20937121, 0.051624082, -0.07133462, -0.0021036996, -0.044607222, -0.023507895, 0.0340289, -0.07798698, -0.019175507, -0.035228696, 0.035518996, -0.0021251217, 0.042910658) * inp_5_0_0; + result2 += M4(0.054237112, -0.034621216, 0.15788543, 0.23602548, 0.18491454, 0.07353308, -0.1131845, 0.1156592, -0.07567536, -0.19284339, 0.24879329, -0.19427714, -0.111234866, 0.18764073, 0.1485776, 0.123295985) * inp_5_1_0; + result2 += M4(-0.112203136, -0.12003465, -0.041917715, -0.03238734, -0.07198111, 0.028996484, 0.1111366, -0.124065146, -0.10561945, -0.009082544, 0.006997792, -0.23555192, 0.038605206, 0.027334265, 0.0646343, -0.053433992) * inp_5_2_0; + result2 += M4(-0.13104938, -0.30081755, -0.04565684, 0.16132258, 0.15536843, -0.10211957, 0.19431044, 0.050139476, 0.063079715, -0.029818468, -0.0050877226, -0.01849609, -0.050283793, 0.045031067, 0.023956012, 0.02018957) * inp_5_0_1; + result2 += M4(-0.01382849, -0.15523173, 0.28399482, -0.7521889, 0.24544442, 0.012596007, -0.03206668, 0.008040535, -0.23877345, 0.038458355, 0.22159629, -0.3853706, -0.22539756, 0.015639903, 0.4748152, -0.16719179) * inp_5_1_1; + result2 += M4(-0.10120006, -0.13266163, 0.040841457, -0.30963138, 0.037651785, 0.07730276, 0.07580404, -0.026615815, -0.12387708, 0.014711871, 0.016514767, -0.17926922, -0.13275193, 0.13773493, 0.13179703, 0.12123983) * inp_5_2_1; + result2 += M4(0.07339468, 0.06203622, -0.12329334, 0.08337741, 0.12093235, -0.0960478, 0.085040405, 0.024159962, -0.030216862, 0.068158925, -0.04042995, -0.06740357, -0.057916418, 0.016825855, -0.08366378, 0.115069166) * inp_5_0_2; + result2 += M4(-0.47783527, 0.07719642, 0.01707533, 0.14425534, 
0.013818421, -0.023337537, 0.09349242, -0.036243826, -0.071517676, 0.026565881, 0.01973659, -0.16347322, -0.086143896, 0.28260255, -0.0801551, -0.019386794) * inp_5_1_2; + result2 += M4(-0.16804834, -0.06665571, -0.021137923, -0.07496317, -0.05221263, -0.0091073625, 0.07460384, 0.021114651, -0.0012520734, -0.024890244, 0.045420658, -0.22388467, -0.03264385, 0.09342122, -0.016314741, 0.029080233) * inp_5_2_2; + result3 += M4(-0.13623719, -0.074121214, 0.36390996, -0.0684557, -0.10150539, 0.022530444, -0.073087454, 0.041017555, -0.3129346, 0.10789508, 0.0730042, -0.03168122, -0.085479625, -0.10615614, 0.074155, 0.12174722) * inp_5_0_0; + result3 += M4(-0.44083247, 0.10533798, 0.19465177, -0.007246912, 0.054594878, 0.29730833, -0.08960047, 0.048678644, -0.26166618, 0.20802842, -0.44012845, -0.105084956, -0.056705445, -0.1789505, 0.1450788, 0.1183812) * inp_5_1_0; + result3 += M4(0.011550804, 0.038025778, -0.09636769, -0.14296567, -0.060081266, 0.05173794, -0.03250187, 0.22262566, -0.20090915, -0.0074857175, -0.5433949, -0.013365135, -0.014985263, -0.091340505, -0.031966522, 0.111169465) * inp_5_2_0; + result3 += M4(0.004021542, 0.16898811, -0.09772042, 0.1567671, 0.034985278, 0.009708978, 0.12037031, 0.18072696, -0.14124206, 0.1100557, -0.2309795, 0.12046959, -0.07495155, -0.09570597, 0.054468986, -0.04671279) * inp_5_0_1; + result3 += M4(0.03887686, 0.06836991, -0.22931919, -0.17009152, 0.19544592, 0.034817964, 0.015159909, 0.07725526, -0.037827812, 0.18052754, -1.0727265, -0.2248324, -0.23478907, -0.56630945, 0.107048504, -0.19957283) * inp_5_1_1; + result3 += M4(-0.0036268253, 0.059987787, -0.18994491, -0.026699148, 0.084675685, 0.089063816, -0.0665738, 0.2585772, -0.09294153, 0.049071066, -0.7784702, 0.09769145, 0.041793436, -0.030230202, 0.18409672, 0.18032874) * inp_5_2_1; + result3 += M4(-0.024319798, 0.15822768, -0.001500388, 0.14373888, 0.06296548, -0.07551756, 0.08211885, 0.09191918, -0.062487926, -0.03944449, 0.05229111, -0.040973827, -0.045246325, 
-0.04971226, 0.056707844, -0.07201494) * inp_5_0_2; + result3 += M4(0.31380945, 0.03942549, 0.5274574, -0.20498534, 0.045373682, -0.14587434, -0.014487029, 0.055261523, -0.038807593, -0.042912625, -0.28775012, 0.267774, 0.04890975, -0.16255964, 0.13299824, 0.4969454) * inp_5_1_2; + result3 += M4(-0.054900225, 0.0057915607, -0.047852773, 0.055206086, -0.060202286, -0.0153405685, 0.0303107, 0.13728504, -0.025481522, 0.036968987, -0.39513066, -0.08825466, -0.045987137, 0.0058396184, -0.0012962446, 0.095448785) * inp_5_2_2; + result4 += M4(-0.1294866, 0.02138291, -0.10303458, -0.22781478, -0.037161604, 0.08325151, 0.17125261, 0.005365751, 0.08294989, 0.085749105, -0.023346728, 0.055940583, 0.031337112, -0.113238096, 0.019536298, 0.14558831) * inp_5_0_0; + result4 += M4(-0.2114343, -0.14057158, -0.22970642, 0.00230447, -0.04878319, 0.33474055, 0.14460452, 0.13668068, 0.04356139, 0.056840193, -0.20109622, -0.022539018, 0.11512222, -0.19470896, 0.08962883, 0.1093798) * inp_5_1_0; + result4 += M4(0.03561315, -0.0040265564, -0.07582593, -0.14932466, -0.15610832, 0.21156691, 0.15697283, 0.053123556, 0.08185663, 0.12814, -0.09372812, -0.023147078, 0.14258163, -0.3290908, 0.14480329, 0.06404412) * inp_5_2_0; + result4 += M4(-0.1817035, 0.6072989, 0.0121303, -0.09942631, -0.064160556, 0.08650752, 0.19564025, 0.20608908, 0.07955238, 0.22513014, 0.22756377, -0.012018911, -0.043492977, 0.0025760017, 0.06848729, -0.09504291) * inp_5_0_1; + result4 += M4(0.122640625, 0.13967396, -0.123871244, -0.01828265, -0.0077766003, 0.07873682, 0.2725281, 0.022284776, -0.1532384, 0.23962492, -0.09862019, 0.040687796, -0.14854011, 0.2165895, -0.091223635, -0.23024976) * inp_5_1_1; + result4 += M4(0.14727849, 0.023067847, -0.099636264, 0.087126836, -0.10521028, 0.23338217, 0.06673692, 0.10734836, 0.093235046, 0.013245227, 0.17138568, 0.049127664, 0.07836385, 0.18599589, 0.08656943, -0.02972075) * inp_5_2_1; + result4 += M4(-0.089823686, -0.24819332, 0.18235214, 0.21639885, -0.09998666, 
0.074534655, 0.30893874, 0.046496145, 0.07078351, -0.017009815, 0.026666401, -0.06423154, -0.00861895, -0.315302, -0.0304769, -0.22908765) * inp_5_0_2; + result4 += M4(0.026014168, 0.059482165, 0.34938964, 0.026913688, -0.17125194, -0.037049152, 0.1546895, 0.00034647883, 0.13521168, -0.07905523, -0.115048535, -0.033067502, 0.020866629, -0.96416926, -0.12991461, 0.2761755) * inp_5_1_2; + result4 += M4(0.0951916, -0.05240331, 0.04774486, 0.09090494, -0.12669313, 0.05543682, 0.011621517, 0.021827646, 0.039317675, -0.12534136, -0.06112589, -0.13986771, 0.0062395176, -0.3093545, -0.012223232, -0.24065082) * inp_5_2_2; + result5 += M4(0.3580817, -0.030778589, 0.0023805082, 0.035009954, 0.0034672893, 0.0059434483, -0.0628913, 0.16034299, 0.23968749, -0.05559468, 0.05995156, 0.21254182, -0.05512007, 0.027894514, 0.041044015, 0.0061496403) * inp_5_0_0; + result5 += M4(0.15321243, -0.31154323, 0.23011236, 0.026688907, 0.084365875, 0.23364569, -0.23044062, 0.11522651, -0.14199208, -0.18805383, 0.17606153, -0.072431125, 0.016062351, 0.08771873, 0.1227515, 0.18588558) * inp_5_1_0; + result5 += M4(0.021638915, -0.1425942, 0.057660725, -0.14851098, -0.04993011, 0.11703775, -0.14750518, -0.04756683, -0.02192176, -0.022002079, 0.12551798, -0.30334336, -0.023573454, 0.096975565, 0.045306653, -0.20732892) * inp_5_2_0; + result5 += M4(0.44978943, -0.2567354, 0.0013764008, -0.17940071, -0.078582495, 0.16570877, -0.034276266, -0.0017920799, 0.08697219, -0.0046514263, 0.05688368, 0.064191505, -0.054974906, -0.099886514, -0.036527075, 0.02958098) * inp_5_0_1; + result5 += M4(0.35954377, -0.017478041, 0.37014934, 0.041308004, -0.29862127, 0.19218269, -0.066696, 0.24381845, 0.34958637, 0.09147496, -0.051891852, -0.23789744, -0.038027, 0.08605349, -0.26660883, -0.18267189) * inp_5_1_1; + result5 += M4(0.079664245, -0.09594503, 0.05957056, -0.17564584, -0.06229915, 0.06231958, -0.14381641, 0.043530345, 0.14392576, 0.09072856, 0.1968185, -0.08853048, 0.17321119, 0.11203383, 0.07038388, 
0.14226396) * inp_5_2_1; + result5 += M4(-0.00042395102, 0.014946294, 0.023875011, 0.18470277, -0.07724871, 0.019676274, -0.08447591, 0.09785722, -0.05185168, 0.063181706, -0.015388867, 0.08823325, -0.0064603076, 0.020791758, 0.0704453, 0.13020808) * inp_5_0_2; + result5 += M4(0.050801434, 0.18725401, -0.010562123, 0.08028587, -0.23434429, -0.052683614, -0.16841152, -0.0050541786, -0.119861215, 0.011041457, 0.07538003, -0.0576978, -0.26533553, 0.24711394, 0.015776431, -0.15346095) * inp_5_1_2; + result5 += M4(-0.032450754, -0.12898251, 0.0024378377, 0.047607746, -0.16179182, -0.0187819, -0.08517621, -0.0223974, -0.14000109, -0.008272115, 0.052717913, -0.018218433, 0.053910594, 0.1002998, 0.18950114, 0.15682216) * inp_5_2_2; + result6 += M4(-0.1427125, 0.23437913, -0.19240436, -0.21301696, -0.05031248, -0.009001654, 0.0017474538, -0.057970677, -0.012916516, -0.5946413, -0.054588284, 0.042539444, -0.028404504, 0.026533889, 0.025201924, -0.054962076) * inp_5_0_0; + result6 += M4(-0.0033247152, 0.09590354, 0.08760663, 0.0639957, -0.008410897, -0.22076, -0.05176233, 0.009790802, -0.14042431, -0.8530195, 0.19282465, 0.037369356, -0.06338543, 0.037549436, -0.2126743, 0.084449716) * inp_5_1_0; + result6 += M4(0.019052837, -0.13937615, -0.004341943, 0.036190584, -0.101516, 0.23998937, 0.06911134, 0.0124720065, -0.012925929, -0.06131768, -0.028915402, -0.046869628, -0.016983677, -0.02170675, 0.004891294, 0.025728356) * inp_5_2_0; + result6 += M4(-0.12403779, 0.07421022, 0.34714708, -0.0223222, 0.06382637, -0.06160024, 0.07190467, -0.012482603, -0.058164466, -0.5699183, -0.0031118088, 0.17073964, -0.090972625, -0.0014863753, 0.052913733, -0.03770148) * inp_5_0_1; + result6 += M4(0.37018707, 0.2087395, -0.1475791, 0.059893996, -0.08057628, 0.1406719, -0.04590291, 0.06397182, 0.23615834, -1.5653652, 0.51516014, 0.20767792, 0.043807745, -0.087411895, 0.4643824, -0.2431659) * inp_5_1_1; + result6 += M4(0.079334244, -0.027253637, -0.0052656233, -0.029792368, -0.015247179, 
0.2450802, 0.1775175, 0.00032651974, -0.12888901, -0.09902306, -0.004560338, 0.033486564, -0.094092734, 0.15750176, 0.09947276, 0.08891794) * inp_5_2_1; + result6 += M4(0.14165, -0.40835375, 0.09504864, -0.31362104, 0.003275484, -0.0650579, 0.08259899, 0.035699498, -0.11981345, -0.5901641, -0.06041057, 0.0023245036, -0.010753459, -0.065767966, -0.04868017, -0.06148768) * inp_5_0_2; + result6 += M4(0.027657935, -0.2260556, -0.23709708, 0.116437845, -0.07683634, 0.19843261, 0.00125323, -0.031681817, -0.14730798, -0.24181736, 0.16877827, -0.061411735, -0.3334591, 0.031892557, -0.18347023, 0.023881098) * inp_5_1_2; + result6 += M4(0.031834584, -0.15610348, -0.021291824, 0.007144067, -0.06358461, -0.03350419, -0.003166176, 0.023516508, -0.07478699, 0.089031644, 0.036733273, -0.029883197, -0.14786538, -0.057040893, 0.0007235234, 0.007946586) * inp_5_2_2; + result7 += M4(0.20947367, -0.02882115, -0.21274045, -0.041673575, 0.020862905, 0.09812621, -0.01479245, 0.02998886, 0.0107883755, 0.016010856, -0.22037174, -0.031329464, 0.055873174, -0.19674042, -0.3776389, 0.04349502) * inp_5_0_0; + result7 += M4(0.09069688, 0.21014254, -0.5963385, 0.23423222, -0.13329448, -0.010570761, 0.017618233, -0.059912294, -0.14212526, 0.18916553, -0.0846305, 0.074028835, -0.004880115, -0.7172515, -0.84330726, -0.0040603173) * inp_5_1_0; + result7 += M4(0.0012102613, 0.13532892, -0.05921219, 0.026914231, 0.15885527, 0.062068883, 0.32618, 0.01983221, 0.07677748, 0.04760899, 0.1103253, 0.006299967, 0.039212476, -1.1822422, -0.39486572, 0.05188824) * inp_5_2_0; + result7 += M4(-0.018755654, -0.102507636, -0.19209415, -0.084044166, -0.0798725, 0.10826704, 0.09652802, 0.034425687, -0.07725495, 0.11021416, -0.031259567, -0.007052309, -0.008249081, -0.4450515, -0.073312104, 0.05304058) * inp_5_0_1; + result7 += M4(0.18562579, 0.09863308, -0.21657364, 0.4491991, -0.12871006, 0.035518132, 0.06760292, -0.012468921, -0.08468648, 0.097889595, -0.080418415, 0.06603839, 0.16029134, -1.2780255, -0.5123939, 
0.041578036) * inp_5_1_1; + result7 += M4(0.056347378, 0.051266428, 0.0022314512, 0.019211384, 0.020051816, -0.023065113, 0.14817172, 0.035325315, -0.08813334, 0.21792139, -0.107613645, 0.21637446, -0.2626353, -1.9893125, -0.75468266, -0.028491504) * inp_5_2_1; + result7 += M4(0.014368917, 0.14294952, -0.38320738, 0.069414675, -0.06767831, 0.054307967, 0.063735984, 0.011272922, -0.051130503, 0.13047454, -0.10262314, -0.039571315, 0.002974242, -0.06390101, -0.021223033, 0.051700383) * inp_5_0_2; + result7 += M4(0.12085619, 0.26397443, -0.35913265, 0.13870652, -0.085972324, 0.17778155, 0.16959728, 0.04841899, -0.039187692, 0.048627313, 0.04736234, 0.008120106, 0.005444394, -0.6916086, -0.0025219654, 0.0066267964) * inp_5_1_2; + result7 += M4(0.07963682, 0.0122, 0.0042353515, 0.039935257, -0.0026367644, 0.10086984, 0.16151382, -0.00224164, -0.0431847, 0.02793446, 0.04340155, -0.04289826, -0.12281766, -0.67523026, -0.2171474, 0.0055699674) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.01231854, 0.09099252, 0.022946244, 0.08297145, -0.019116273, 0.0044271145, -0.10540851, -0.71004, 0.054459836, 0.18380989, 0.10206366, -0.3996084, 0.040124927, 0.07276976, 0.020511072, 0.1330955) * inp_6_0_0; + result0 += M4(0.00021396385, 0.07681068, -0.110088296, 0.113275394, -0.08838272, -0.031898905, -0.1391735, -0.56498015, -0.116450675, 0.16922408, 0.014033328, -0.53578943, 0.017148921, 0.012417857, -0.06743708, 0.06633183) * inp_6_1_0; + 
result0 += M4(-0.018098854, 0.13624974, -0.050053332, 0.11684962, -0.112249084, -0.010404017, -0.03036778, -0.3882712, 0.0527868, 0.055063315, 0.23352724, -0.32933038, 0.0252686, 0.013159813, 0.14096543, 0.024057312) * inp_6_2_0; + result0 += M4(-0.006187361, -0.038151503, 0.12015587, 0.090155534, -0.12143108, 0.059106637, -0.02472574, -0.36617404, 0.077264026, -0.22946018, -0.12138909, 0.01245029, 0.0045329197, 0.118264735, -0.09885005, 0.023871241) * inp_6_0_1; + result0 += M4(-0.031079983, 0.16016267, -0.12949716, 0.018936016, 0.21122845, 0.047992267, -0.1304207, -0.7452054, 0.21628508, 0.08039188, -0.042096667, 2.0649621, 0.078132614, 0.06496065, -0.07262386, -0.26538965) * inp_6_1_1; + result0 += M4(0.007734712, 0.16729037, 0.0046540704, 0.1503623, -0.019264821, 0.0066001816, -0.07285762, -0.5107723, 0.026378466, -0.058916178, -0.051529136, -0.48107275, 0.06602731, 0.031347938, -0.021869797, -0.087218374) * inp_6_2_1; + result0 += M4(0.052176222, 0.08475405, -0.0034809965, 0.08416541, -0.024401365, -0.025390834, -0.1866351, -0.6035755, 0.015564103, -0.02148876, -0.097081766, -0.24936226, -0.004921415, 0.020326754, -0.064142264, 0.06511841) * inp_6_0_2; + result0 += M4(0.077070825, 0.04553424, 0.18983321, -0.11692988, -0.071956605, 0.08778152, 0.31043553, -0.8349807, -0.14642672, -0.010712844, -0.056916144, -0.38834596, 0.03953989, -0.018705364, -0.019029478, 0.025981316) * inp_6_1_2; + result0 += M4(0.08911253, 0.07433768, 0.3026482, 0.09396495, 0.062067073, -0.13855615, 0.08529063, -0.31261137, 0.0827767, 0.017423075, 0.23351908, -0.22865114, -0.0006988492, -0.075410254, -0.10356574, -0.01920228) * inp_6_2_2; + result1 += M4(0.16692086, 0.1681319, -0.027668705, 0.0357351, 0.04478783, -1.3615508, 0.16238359, -0.20622155, 0.009226322, -0.6058478, 0.17141175, 0.07177683, 0.029655004, -0.042278104, 0.020429065, -0.11754116) * inp_6_0_0; + result1 += M4(-0.056276344, 0.011924444, 0.059304144, -0.029761907, 0.05648901, -0.78232783, 0.36322165, -0.09229923, 
0.026683338, 0.06979355, 0.010189042, 0.023326937, 0.049643185, 0.21630695, 0.11989661, -0.3066141) * inp_6_1_0; + result1 += M4(-0.09902089, -0.051658772, 0.2163726, -0.03195207, 0.18893668, -0.14336692, 0.053387668, 0.22460079, 0.12283925, -0.07993935, 0.10816793, -0.16779625, 0.039105576, 0.031379238, -0.05974648, -0.35771257) * inp_6_2_0; + result1 += M4(-0.09528121, 0.19282289, 0.017492024, 0.11162626, -0.10649452, -0.40120256, -0.47130665, 0.16766542, -0.21852969, 0.08778599, 0.047800153, -0.14059094, 0.13896649, 0.032391652, 0.1289267, -0.13490139) * inp_6_0_1; + result1 += M4(0.1292054, -0.1111432, 0.06200731, 0.29972285, -0.14519946, -0.10362366, 0.2859835, 0.24241869, 0.10103597, 0.27169287, -0.49954337, -0.25025198, -0.059664782, -0.36696061, 0.022811987, -0.34421882) * inp_6_1_1; + result1 += M4(-0.046978038, -0.04253035, 0.06526447, 0.10294911, 0.16374624, -0.038954288, -0.0042913673, -0.102291785, 0.04000935, -0.082533866, -0.030262243, 0.4581597, -0.07894119, -0.10607972, 0.005460443, -0.38020784) * inp_6_2_1; + result1 += M4(0.040628765, 0.047096476, -0.1863696, 0.13811508, -0.17536464, -0.089079626, -0.13970748, 0.10210413, 0.090243645, -0.18709767, -0.2934424, 0.058423646, 0.008852994, -0.060686994, 0.12708178, -0.15863706) * inp_6_0_2; + result1 += M4(-0.08507474, 0.034850825, 0.036077287, -0.04457459, 0.014989728, -0.027375894, -0.13266571, 0.0063332724, -0.08948693, 0.026754241, 0.13646348, -0.26877627, 0.049975876, 0.050452083, -0.042310357, -0.20615625) * inp_6_1_2; + result1 += M4(-0.062459026, 0.062402043, 0.03471043, 0.15582362, -0.009285016, 0.051886212, -0.035492063, -0.24650547, -0.12275343, -0.05556574, 0.11676633, 0.1353064, 0.037673105, 0.066162795, 0.048917163, -0.3046069) * inp_6_2_2; + result2 += M4(0.070931084, -0.06814794, 0.113183714, 0.004157034, -0.004254921, 0.03653723, 0.023653282, -0.09949031, -0.09417475, -0.0713506, -0.01598105, -0.031386707, 0.06412983, -0.003332516, -0.009654981, 0.04679722) * inp_6_0_0; + result2 += 
M4(-0.13971889, -0.0029955038, 0.030724976, -0.034747105, -0.14185427, 0.12672651, 0.18157749, 0.064015634, -0.097591154, -0.008662035, -0.29854622, -0.00653906, 0.02662604, 0.05727379, 0.06844569, 0.03300791) * inp_6_1_0; + result2 += M4(-0.033787895, 0.03541103, 0.054050397, 0.017982055, -0.08776553, -0.03193391, 0.19953401, -0.1316237, -0.07819319, 0.032412138, 0.06304561, 0.1025258, 0.1197548, 0.03981806, 0.015472792, 0.036228433) * inp_6_2_0; + result2 += M4(0.058652364, -0.0861795, 0.087295026, 0.10473103, -0.040200293, -0.035208263, -0.21640055, -0.08914, 0.0055242474, 0.10682182, -0.2256692, 0.05267613, 0.058232304, -0.014754205, 0.056355882, -0.06968194) * inp_6_0_1; + result2 += M4(-0.06704611, -0.031780377, 0.068716496, -0.118073754, 0.08682216, 0.1617414, 0.009050403, 0.07027602, -0.1738756, -0.48633447, 0.26489118, -0.057144582, 0.07888944, -0.0443077, 0.06588128, 0.057636745) * inp_6_1_1; + result2 += M4(0.034971684, 0.11079261, 0.06916056, 0.07523564, 0.028880967, -0.05108757, 0.16491084, 0.15834938, -0.040426135, 0.11316172, -0.0044639097, 0.11993115, 0.043255787, -0.00079452124, -0.009261113, -0.043736085) * inp_6_2_1; + result2 += M4(0.08138826, 0.0016276254, 0.07471297, 0.031534787, -0.105642766, -0.14206013, -0.22113106, -0.029810762, -0.050457705, 0.048949435, 0.07358891, 0.011684654, 0.0672174, -0.015926696, -0.027410462, 0.0012992502) * inp_6_0_2; + result2 += M4(0.10355078, -0.04237281, 0.093611315, 0.023524906, 0.06956513, -0.0036909562, -0.011060128, 0.11688776, -0.08327058, 0.16784748, -0.2818095, -0.23129402, 0.03794536, 0.024148932, -0.046350144, -0.11938077) * inp_6_1_2; + result2 += M4(0.046911, 0.081882015, 0.01653193, 0.021760836, 0.434652, -0.18082868, -0.0397183, -0.08962073, 0.17877527, 0.32300794, -0.04681892, 0.18382329, 0.067989945, 0.016401801, -0.09724542, -0.10025261) * inp_6_2_2; + result3 += M4(0.051057804, 0.0016520222, 0.062105983, 0.12056436, -0.0899936, 0.14890116, 0.03038474, 0.085802756, -0.11033149, 0.0116347, 
-0.012035132, 0.043016437, -0.17182148, 0.059349585, -0.012545658, -0.0043172557) * inp_6_0_0; + result3 += M4(0.096188225, -0.055897813, 0.08319754, 0.1716169, -0.12413419, -0.037092984, 0.14436567, 0.25694096, 0.21850088, 0.15040623, 0.2170757, 0.014042242, -0.2146602, -0.0037457165, 0.0019651288, 0.008467248) * inp_6_1_0; + result3 += M4(0.0997741, 0.057268076, 0.12669899, 0.14344324, 0.082451485, -0.08715962, 0.07051524, -0.03754199, -0.16043258, 0.099826835, 0.07494132, -0.05123001, -0.12620164, 0.02840918, 0.0409345, 0.083929986) * inp_6_2_0; + result3 += M4(0.06308289, 0.04494612, -0.059385598, 0.114793494, 0.07921799, -0.0849568, -0.07156668, 0.076185755, 0.0035632171, -0.032233942, -0.03886473, 0.13073006, -0.1613391, -0.020031687, -0.06823047, 0.015578669) * inp_6_0_1; + result3 += M4(0.16801131, 0.12674585, -0.10847146, 0.08851929, 0.11157141, -0.0124572385, 0.031209966, 0.028390775, -0.13068324, 0.0045572207, -0.018403428, -0.29661167, -0.33593568, -0.002522017, -0.12786467, -0.012923993) * inp_6_1_1; + result3 += M4(0.08172253, 0.047185775, -0.019886838, 0.12756981, -0.05896981, 0.040990353, 0.1998765, 0.22073689, 0.1850459, -0.1774633, -0.16563854, -0.14595324, -0.30819464, -0.03032705, -0.06872377, -0.047536645) * inp_6_2_1; + result3 += M4(0.16373189, 0.025689907, 0.092418514, 0.23576991, 0.1352804, 0.035673857, -0.14253241, 0.16173278, 0.027204184, -0.04201797, 0.087649174, -0.1178203, -0.13154314, -0.016642634, 0.0045087817, -0.041030984) * inp_6_0_2; + result3 += M4(0.10113867, -0.04428575, -0.07010475, 0.11292271, -0.04571282, 0.0067607, 0.091835685, -0.1201531, 0.09398738, -0.26875952, -0.28279656, -0.38650483, -0.40327892, -0.039298613, -0.1094611, 0.11580644) * inp_6_1_2; + result3 += M4(0.014223586, 0.037842594, 0.011228763, 0.19101292, -0.22455701, 0.09835347, -0.06911222, -0.10460006, 0.10029441, 0.062288076, -0.02185914, -0.061974194, -0.36016008, 0.055539478, -0.100118056, 0.08895932) * inp_6_2_2; + result4 += M4(-0.11505866, 
0.044597026, 0.22064252, 0.10775354, -0.1314016, 0.033694018, -0.009609121, 0.081915446, -0.022803884, 0.021888038, -0.0870109, -0.010788616, 0.057929434, 0.031752393, 0.026358262, 0.016398786) * inp_6_0_0; + result4 += M4(-0.089867964, -0.06908006, 0.3446153, 0.22101057, -0.15763664, 0.18939929, 0.13540536, 0.12814148, 0.090492286, -0.064007975, 0.07912236, 0.26258776, -0.009567706, 0.062413286, 0.08137614, -0.0001498577) * inp_6_1_0; + result4 += M4(-0.16480406, 0.14242022, 0.18511924, 0.06320044, -0.18933049, 0.0562187, -0.022504414, -0.020608587, 0.091771245, -0.11644348, -0.025648538, -0.089701496, 0.0043869917, -0.060820483, 0.062451825, 0.058923345) * inp_6_2_0; + result4 += M4(-0.13495824, 0.050304305, 0.2319598, 0.014136923, 0.038995493, -0.054977044, 0.25926968, -0.043866914, 0.18534565, -0.04039906, 0.08340674, 0.15519133, 0.017672537, 0.098669365, 0.053521566, 0.0021278427) * inp_6_0_1; + result4 += M4(-0.12071067, 0.024922159, 0.09990344, 0.123467684, 0.27024847, 0.22152676, 0.060609728, -0.20015186, -0.3647942, -0.030035714, 0.2577276, -0.48194617, -0.06986185, 0.0850343, -0.064970545, -0.083682455) * inp_6_1_1; + result4 += M4(-0.10906172, 0.062115267, 0.08882411, -0.0068026655, -0.090618365, 0.013813046, 0.11744967, -0.04803899, -0.1744502, 0.20182723, -0.022632668, -0.257664, 0.077535875, -0.0007203639, 0.0050463737, -0.014575507) * inp_6_2_1; + result4 += M4(-0.17387472, -0.017165119, 0.2196452, 0.17036793, 0.07965726, -0.12493114, -0.18868835, 0.071414165, 0.18446684, -0.2393954, -0.026303943, -0.047208134, -0.01585925, 0.054541755, 0.041949503, -0.053614605) * inp_6_0_2; + result4 += M4(-0.16839804, 0.045744903, 0.1355874, 0.07131851, -0.03876846, 0.102758825, -0.09127093, 0.084079534, 0.12902468, 0.062742546, -0.17598057, 0.42879, 0.07996395, -0.00681647, -0.04797707, 0.07783823) * inp_6_1_2; + result4 += M4(-0.07931935, 0.08416527, 0.04629002, 0.1603966, 0.08727672, -0.43798846, -0.20340535, 0.12898126, 0.019336661, 0.06438968, -0.06975458, 
-0.03562858, 0.057531197, 0.13945173, 0.052155957, -0.0045181024) * inp_6_2_2; + result5 += M4(0.030622005, 0.033648875, -0.13777481, 0.15526626, -0.035708513, 0.18079267, 0.124137096, 0.113988414, 0.06987326, 0.04900433, 0.009237052, -0.014229328, 0.06131387, 0.01557479, 0.074212946, 0.14779621) * inp_6_0_0; + result5 += M4(-0.06724888, -0.06945944, -0.03951733, 0.15693723, -0.16678195, 0.18380629, -0.15140302, -0.20907994, -0.040329836, -0.016879939, 0.005247614, 0.26749894, 0.039124787, -0.17014629, -0.031521734, 0.15898965) * inp_6_1_0; + result5 += M4(-0.06293328, -0.04847373, -0.09275776, 0.07814272, -0.39857167, 0.2055412, -0.21595891, 0.10131444, -0.033698026, 0.03664209, -0.09061471, -0.07494496, 0.07696634, 0.0012257962, -0.00016431425, 0.06366333) * inp_6_2_0; + result5 += M4(0.043890856, -0.00793157, -0.12026016, -0.047832433, 0.02862347, -0.056616865, -0.11114893, -0.10505224, -0.107157126, -0.18314476, -0.0828965, 0.21451165, 0.004773741, -0.004738795, 0.06366432, 0.22281435) * inp_6_0_1; + result5 += M4(-0.025479365, 0.06651183, -0.14315747, 0.12306561, -0.17136574, 0.066617385, -0.012325118, -0.06866185, 0.46885177, -0.88736266, -0.102902316, -0.2828635, 0.09272901, -0.063434675, 0.01574494, 0.007375193) * inp_6_1_1; + result5 += M4(-0.08663941, -0.009495437, -0.07875745, -0.08350019, -0.11980464, -0.2110022, 0.07229205, -0.13001315, 0.14270237, 0.05151154, -0.4315972, 0.045271885, 0.12048727, -0.11735883, 0.051436003, 0.15412854) * inp_6_2_1; + result5 += M4(0.087487034, 0.017998181, -0.12783113, -0.043093428, 0.022735367, -0.035608437, 0.024330879, 0.15068266, -0.20691997, -0.0054504676, 0.041575022, -0.243494, 0.05537266, -0.017127575, 0.034660775, 0.10041992) * inp_6_0_2; + result5 += M4(-0.16778582, -0.13401148, -0.015800253, 0.027800046, 0.31985217, 0.072311915, 0.34029612, 0.17704113, 0.049451526, 0.023873998, -0.069473416, 0.3196018, 0.040731203, 0.08344375, 0.054476954, 0.047070134) * inp_6_1_2; + result5 += M4(-0.015255039, 0.043247603, 
-0.00014471203, -0.11655925, 0.32191315, -0.018302968, 0.2619458, -0.07209381, -0.038179863, 0.2416478, 0.22229129, -0.1490129, 0.098998554, 0.030524861, 0.04652615, 0.19174734) * inp_6_2_2; + result6 += M4(-0.0054473733, 0.067063466, 0.06823057, 0.064516105, 0.043021705, 0.04897483, 0.029995786, -0.10215093, 0.110203154, 0.19435984, -0.0569155, 0.030893091, -0.010661117, 0.056097552, 0.030715019, 0.018484868) * inp_6_0_0; + result6 += M4(-0.062822275, 0.07521274, -0.007929009, 0.07175033, -0.031541668, 0.16003549, 0.018907294, 0.12415543, -0.13718969, -0.046264257, 0.16082197, 0.017948817, -0.07873198, 0.10366774, 0.03960055, 0.020668423) * inp_6_1_0; + result6 += M4(-0.07692578, 0.20961724, 0.01354989, 0.0041837213, -0.07013785, 0.15288238, 0.20706408, 0.07847916, 0.004052316, -0.061049223, -0.055710487, -0.02467601, -0.009446496, 0.033483155, 0.018704252, 0.008584069) * inp_6_2_0; + result6 += M4(0.044097174, -0.043551724, 0.061233778, 0.0321452, 0.09666465, 0.10479835, -0.11845245, -0.08803998, -0.0069932207, 0.00819712, 0.07323805, 0.09940119, -0.004126533, 0.13461123, 0.045838382, -0.049093816) * inp_6_0_1; + result6 += M4(0.0053979447, -0.077058345, -0.0038344897, 0.0719337, 0.07505565, 0.121630974, -0.16723238, -0.10887044, 0.12251016, -0.17831406, 0.1079947, -0.15539046, 0.02391581, 0.1618384, -0.14408867, -0.016452366) * inp_6_1_1; + result6 += M4(-0.09009834, -0.029852021, 0.14784035, -0.026464064, -0.15962908, 0.20117453, 0.11284715, 0.028830288, -0.054821603, -0.44161305, 0.04227926, 0.031299304, 0.08641188, 0.065547705, 0.0047196704, 0.03939317) * inp_6_2_1; + result6 += M4(0.044776578, -0.008652853, 0.12938873, 0.11171814, 0.16194141, -0.07667376, -0.057078365, -0.015170452, -0.14803539, -0.31466535, 0.051019568, 0.08542885, -0.006926177, 0.16131495, 0.07432172, -0.013930539) * inp_6_0_2; + result6 += M4(-0.087520055, -0.056832645, 0.010856316, 0.04177043, 0.061435044, -0.19447272, -0.2736066, -0.031030942, -0.24909818, -0.10766145, -0.067647755, 
0.051106073, -0.00767404, 0.11462535, 0.013143749, 0.019922461) * inp_6_1_2; + result6 += M4(0.11938081, 0.029797485, 0.054951224, 0.0004187531, 0.23983611, 0.117955215, 0.20727374, 0.06512334, -0.076417685, 0.03149121, -0.17576326, -0.030175462, 0.080979064, 0.17874187, 0.044735294, 0.0048423605) * inp_6_2_2; + result7 += M4(0.03400089, 0.04921694, 0.27210364, 0.05072277, -0.10441755, -0.05182022, -0.0026635404, 0.056830935, 0.08254403, -0.15286063, -0.32687026, 0.004862999, -0.042072285, 0.06696901, -0.19231883, -0.0048277443) * inp_6_0_0; + result7 += M4(0.073315375, -0.040931437, 0.032351, 0.03557823, 0.109853536, -0.23763627, 0.19032846, 0.06562803, 0.08075361, 0.22219746, 0.19440892, -0.0057362746, -0.023556305, -0.027693825, -0.6525373, 0.015639974) * inp_6_1_0; + result7 += M4(0.07475429, 0.1793883, 0.030254774, 0.05467757, -0.14202604, 0.06304213, -0.07639892, -0.029303914, 0.058994807, -0.13070546, -0.18210283, -0.039206542, -0.049562097, -0.035817076, -0.41571015, -0.030183014) * inp_6_2_0; + result7 += M4(-0.10269313, 0.28263223, 0.2219601, -0.020736469, -0.12776718, 0.11246052, 0.15715519, 0.011642224, 0.10231811, 0.0075764074, -0.12445573, -0.0386185, 0.019501502, 0.06931784, -0.23888451, 0.018780526) * inp_6_0_1; + result7 += M4(0.06725344, 0.10823444, 0.18342838, -0.0029197328, 0.20367783, -0.17928654, 0.19976248, 0.24374752, -0.16427252, 0.007913998, 0.07557366, 0.101611935, -0.10227458, -0.05205662, -0.47026187, 0.0064496645) * inp_6_1_1; + result7 += M4(0.0032077604, 0.2783979, 0.26086158, 0.070586085, -0.13269812, -0.18812749, 0.21460396, -0.104481734, -0.084048174, 0.10300007, 0.020246375, -0.08484233, -0.06794632, -0.13087802, -0.32931918, -0.0010161671) * inp_6_2_1; + result7 += M4(0.001039722, 0.11514648, 0.10063334, 0.047795504, 0.0877899, -0.0148860775, -0.10532218, 0.056101102, 0.06223619, 0.035663653, -0.078576766, 0.021514872, -0.023836583, 0.022035373, -0.11905083, 0.010254982) * inp_6_0_2; + result7 += M4(0.017065566, 0.2158297, 
0.07417096, 0.11424432, 0.12657474, 0.4434362, 0.004432999, -0.017752793, -0.21423887, -0.01039919, -0.098380454, -0.015807962, -0.05269289, 0.00017251779, -0.24819106, -0.024341995) * inp_6_1_2; + result7 += M4(-0.09856863, 0.29583266, 0.23068905, 0.06716765, 0.081535675, -0.009279454, -0.34590578, -0.16883141, -0.037199505, 0.04256068, 0.08576453, -0.0031449336, -0.038238805, -0.06439944, -0.16475017, 0.020458268) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.0025648084, 0.12526289, -0.14678705, -0.20021191, -0.046807274, -0.01686291, -0.09808052, -0.022675278, 0.03534894, -0.039643355, 0.12639496, -0.04211764, -0.021788446, -0.20868531, 0.21366677, 0.175423) * inp_7_0_0; + result0 += M4(-0.3026701, -1.5252979, -0.25879425, -0.044997208, 0.011189659, 0.037653044, 0.1640758, 0.07475355, 0.0017667233, -0.07372018, -0.038618185, -0.03615947, -0.2126783, -0.1061896, 0.39010486, 0.295421) * inp_7_1_0; + result0 += M4(-0.20572528, -0.28741428, 0.12653723, -0.084643185, 0.06082303, 0.085642144, 0.014465041, 0.030912746, 0.0017500189, 0.008217061, 0.0149926115, -0.042117372, -0.054201145, 0.14428295, 0.19283321, -0.25995392) * inp_7_2_0; + result0 += M4(-0.06252718, 0.089259274, 0.0022112362, -0.46951604, -0.008346746, 0.047610294, 0.07676301, 0.058288552, -0.016456489, -0.017622821, -0.020205861, 0.012302029, 0.074509226, -0.07129192, 0.10394136, 0.12221057) * inp_7_0_1; + result0 += M4(-0.004245082, -0.27393815, -0.27035642, 
-0.36941934, -0.032338016, 0.0364357, -0.11017005, -0.13537496, 0.0533642, 0.0005205563, 0.013267756, -0.06888909, 0.06560021, -0.12103099, 0.23193897, -0.02271881) * inp_7_1_1; + result0 += M4(-0.10273085, 0.011859719, -0.028414164, -0.24363193, 0.08455475, 0.013105101, -0.17271374, 0.119755924, 0.0153439315, -0.036716696, 0.08454803, -0.13076177, 0.055063963, -0.12813814, 0.07016775, -0.16438487) * inp_7_2_1; + result0 += M4(-0.041865863, -0.030979594, 0.060428467, -0.11376036, 0.030387161, 0.109690845, 0.047884576, -0.026200855, -0.010907044, -0.076233275, 0.030132938, -0.03462662, -0.025294013, 0.050076324, 0.009761742, -0.0813617) * inp_7_0_2; + result0 += M4(0.03703045, -0.02160848, -0.12644905, -0.04780207, 0.023734236, 0.07776927, 0.06599846, -0.009449072, -0.010327277, -0.08116192, 0.01921808, 0.045049377, 0.029745542, -0.18814455, -0.014886403, -0.0013435339) * inp_7_1_2; + result0 += M4(-0.04433287, -0.019759031, -0.031930804, -0.1356627, -0.0191406, -0.03747117, -0.047807746, -0.009009785, -0.051523708, 0.033809472, 0.08383874, -0.013744574, 0.07185183, -0.047077347, -0.013521437, -0.059219062) * inp_7_2_2; + result1 += M4(0.28843054, -0.25796375, -0.5877547, -0.011973724, 0.14814524, -0.15180282, -0.04453052, -0.24524786, -0.024242822, -0.013110795, -0.041762378, 0.23210354, -0.09606809, -0.14494194, 0.3518875, -0.024674369) * inp_7_0_0; + result1 += M4(-0.2455814, -0.4979598, 0.1657619, 0.15377375, 0.10516929, -0.07207404, 0.0020917002, -0.3801542, -0.03977665, -0.2002733, -0.05886868, 0.3682456, 0.071297295, 0.03868418, -0.065145634, 0.14696194) * inp_7_1_0; + result1 += M4(0.10822069, 0.08206827, -0.16062826, -0.09697469, 0.024189314, -0.08056657, -0.014331855, -0.44773558, 0.069561034, 0.041404806, -0.03767991, 0.30086318, 0.14757726, 0.15713966, -0.10964593, 0.14131321) * inp_7_2_0; + result1 += M4(0.09925729, -0.08878316, -0.2507936, 0.023167718, 0.11461078, -0.13421379, -0.04581909, -0.26081997, -0.055447813, 0.040214993, 0.05908097, 0.26105702, 
-0.17789166, 0.07863633, 0.30369294, 0.14754723) * inp_7_0_1; + result1 += M4(-0.18158494, -0.34316045, 0.48023736, 0.2730216, 0.16630661, 0.3341356, -0.122051485, -0.3366689, -0.03678378, 0.09521366, 0.0009976161, 0.1753873, 0.009166908, 0.022797368, 0.27146277, -0.113864675) * inp_7_1_1; + result1 += M4(0.041470826, 0.089445114, -0.047926847, -0.10239888, -0.046512537, 0.22696862, 0.12981784, -0.5809384, 0.018433359, -0.015404439, -0.00964156, 0.2261011, -0.08172258, 0.18121171, 0.01259903, 0.039109502) * inp_7_2_1; + result1 += M4(0.03518853, 0.007889052, 0.05324295, -0.028484104, -0.008522066, -0.012769131, -0.07928536, -0.15839511, -0.105335444, 0.032355875, 0.01508761, 0.22439949, 0.04630704, -0.017959382, -0.02340951, -0.11146924) * inp_7_0_2; + result1 += M4(0.033710063, 0.10001246, 0.015358725, 0.027672805, 0.017057784, 0.1878902, -0.015772091, -0.15147465, 0.011984561, 0.02918992, 0.07771228, 0.23467055, 0.069261536, -0.021490177, 0.16307217, -0.028804705) * inp_7_1_2; + result1 += M4(0.043618053, -0.015504806, -0.019166525, 0.027746234, 0.030604072, 0.017952675, 0.04415187, -0.09515134, -0.04567094, -0.006029701, -0.021109806, 0.140879, -0.0099356705, 0.09682651, -0.020528479, -0.00024386801) * inp_7_2_2; + result2 += M4(0.021549305, 0.099326536, 0.043911707, 0.054056592, -0.0023230196, 0.03999367, 0.043753807, 0.003063588, -0.01731856, -0.013823191, 0.008290244, 0.016949324, -0.08382676, 0.055040475, 0.051967587, 0.053922664) * inp_7_0_0; + result2 += M4(-0.16891643, 0.07061636, -1.4503644, -0.0056925244, -0.049581006, 0.033327784, -0.056672618, -0.019410936, -0.029678352, 0.022078699, 0.028606586, 0.048223116, 0.11085622, -0.16196068, 0.21870309, 0.13649808) * inp_7_1_0; + result2 += M4(0.11502068, 0.017529063, -0.23306581, -0.19868103, -0.034657627, -0.0044330903, 0.08659655, 0.114791095, 0.042793263, -0.04234944, -0.00694115, 0.08295241, 0.10340021, -0.13499334, 0.13025004, 0.13799603) * inp_7_2_0; + result2 += M4(0.09892189, -0.016424406, 
-0.2066706, 0.12350171, -0.03158015, 0.024397701, -0.00865445, 0.037127934, 0.0063031246, -0.04572847, 0.08756439, 0.031835385, 0.1180093, 0.009751706, 0.047152735, 0.11225161) * inp_7_0_1; + result2 += M4(-0.62929285, 0.397846, -0.6638081, 0.0013092268, 0.24246462, -0.07590893, 0.13833924, -0.10425346, -0.04332452, 0.045004047, 0.043573678, 0.08407402, 0.16554138, -0.2627138, 0.23132728, 0.058877945) * inp_7_1_1; + result2 += M4(0.110183395, -0.07977462, 0.0122079495, -0.18582295, 0.14411642, 0.02603325, -0.037123483, 0.065656975, 0.021856556, -0.08003947, 0.04024855, 0.0008351486, 0.23239839, -0.17722906, 0.063009135, 0.17553511) * inp_7_2_1; + result2 += M4(0.10135686, -0.047256086, 0.007585672, 0.007102436, 0.003607729, -0.043348387, 0.04746483, -0.018561093, 0.06902273, -0.032546375, 0.046427876, 0.021165675, 0.02319588, -0.015397912, -0.052085582, 0.053064834) * inp_7_0_2; + result2 += M4(-0.10677383, -0.13637324, 0.024599362, 0.039329786, 0.060702775, -0.057782713, -0.054117203, -0.024914186, -0.10224434, 0.08296002, -0.001128595, 0.07357599, 0.13979411, 0.031920835, 0.028207088, 0.09893815) * inp_7_1_2; + result2 += M4(-0.046456262, -0.019670827, -0.078224815, -0.078441784, 0.13658261, 0.040628888, 0.024616253, -0.009235978, 0.059899412, -0.056890212, 0.007007438, 0.012702514, 0.06479871, -0.099561945, -0.09196759, 0.021337587) * inp_7_2_2; + result3 += M4(0.2770843, 0.013149988, -0.042622216, 0.041015144, -0.22036408, 0.080840014, 0.011452011, 0.022036038, 0.13456473, -0.063971974, 0.0018988677, -0.023521842, -0.0006928711, 0.096433185, 0.13893716, 0.11341459) * inp_7_0_0; + result3 += M4(0.44847995, -0.73745227, 0.1682718, -0.3265818, -0.37244025, 0.058515035, 0.015252173, 0.032462012, 0.16546327, -0.04892529, -0.023886753, -0.05649095, 0.080640405, 0.16599071, -0.033286024, -0.22828318) * inp_7_1_0; + result3 += M4(0.0057077277, -0.13732924, -0.07188825, 0.0715182, -0.10463529, -0.039711874, 0.06204329, 0.022880994, 0.10745927, -0.027616361, 
-0.014605211, -0.031169904, -0.21925765, -0.05121392, 0.026651358, -0.032939285) * inp_7_2_0; + result3 += M4(0.123817965, 0.021003744, -0.084730506, 0.06836476, -0.3755028, 0.099626854, -0.08390442, 0.025404619, 0.22355863, -0.04411984, 0.09736561, -0.013341983, 0.08997362, 0.056509376, 0.034114253, 0.043466788) * inp_7_0_1; + result3 += M4(0.44270706, -0.0683795, 0.41327858, -1.166456, -0.5600959, 0.026772229, -0.22455886, 0.11989965, 0.0923035, -0.008618152, 0.0827072, -0.0921251, -0.14101982, 0.09475878, -0.055802915, 0.12503462) * inp_7_1_1; + result3 += M4(-0.3582938, -0.15613678, -0.078350164, -0.27746207, -0.41561893, 0.028780913, -0.078577, 0.18830773, 0.07804633, -0.036509305, -0.06176025, 0.0069189426, -0.11904288, -0.09882205, 0.23796675, 0.14364761) * inp_7_2_1; + result3 += M4(-0.029145889, -0.018105073, 0.05896387, 0.0029995858, -0.16947377, 0.022588518, -0.057111166, 0.07239648, 0.17606618, -0.009242618, 0.014176087, -0.08714544, -0.025814915, 0.090591304, 0.045414526, 0.08219933) * inp_7_0_2; + result3 += M4(0.041378107, -0.17849189, 0.08720181, -0.646194, -0.16831556, 0.05882143, -0.03847985, 0.23061049, 0.1389938, -0.05897706, -0.003541238, 0.09181541, -0.05018364, 0.21415457, 0.12638731, 0.44888103) * inp_7_1_2; + result3 += M4(0.018162427, -0.0051253447, -0.011680524, -0.107667096, -0.07367797, 0.026347395, 0.014787265, 0.057079323, 0.09755196, -0.033560645, -0.011545112, 0.0075151133, 0.0658228, -0.009581344, 0.08284546, 0.3095749) * inp_7_2_2; + result4 += M4(-0.079737715, -0.40348387, -0.26426393, -0.011289091, 0.0008866716, 0.08877403, 0.029058682, -0.002246997, -0.059729423, -0.088090286, -0.028212033, 0.009995482, -0.11797592, 0.09991555, -0.053679023, 0.013930643) * inp_7_0_0; + result4 += M4(0.57345444, -0.09387439, 0.35804713, -0.19315228, -0.017343676, 0.020514041, 0.14166196, 0.048639208, -0.08445982, -0.048066605, -0.077345535, -0.056066938, -0.24219427, 0.05647145, -0.2837218, -0.29364616) * inp_7_1_0; + result4 += M4(0.085741974, 
-0.49717352, 0.02962002, -0.033564236, 0.013486055, -0.11915149, 0.043650985, 0.07057155, -0.03231146, -0.050805684, 0.0388232, -0.0038629111, -0.11800806, 0.16445115, -0.20787911, -0.22196995) * inp_7_2_0; + result4 += M4(0.030490879, -0.4314764, -0.049261753, 0.18679148, -0.05455237, 0.015970761, 0.08853225, -0.13648161, -0.028622895, -0.1687855, -0.086259864, 0.08524485, -0.15395486, 0.100878164, 0.1540579, 0.09067588) * inp_7_0_1; + result4 += M4(0.42765537, -1.9201854, 0.010603859, -0.6963597, 0.015766239, 0.35401875, -0.010124867, 0.013946631, -0.10193607, -0.032334324, 0.09939644, 0.025689755, -0.08708885, 0.14129621, 0.18144359, -0.12881632) * inp_7_1_1; + result4 += M4(0.19141695, -0.18786584, -0.376979, 0.015583803, 0.025960565, 0.1198561, 0.09320064, 0.04630147, -0.01210611, -0.115236856, -0.046195645, -0.009790737, -0.13853866, 0.0087757865, -0.08943575, 0.070630655) * inp_7_2_1; + result4 += M4(-0.0010412656, -0.07117385, -0.006827727, -0.042927478, -0.041195534, 0.06866054, 0.07333482, 0.022468455, -0.029916646, -0.090581685, -0.0010470517, 0.039250698, -0.049642786, -0.013365773, 0.00030125616, 0.11373884) * inp_7_0_2; + result4 += M4(0.06734494, -0.15719602, -0.09600298, -0.46393052, -0.03186202, 0.11232978, 0.092726916, 0.19069138, 0.05551586, -0.11680064, -0.007558469, 0.035032336, -0.080813065, 0.18509631, 0.0031644418, 0.3684431) * inp_7_1_2; + result4 += M4(0.049931854, 0.027430901, -0.02175178, -0.0431114, -0.06867864, 0.10252557, -0.099218115, -0.033484507, 0.07566836, -0.11976758, 0.034866773, 0.09144374, 0.027752424, 0.042649746, 0.14925283, 0.31625772) * inp_7_2_2; + result5 += M4(-0.10893411, -0.008008089, -0.033243228, -0.34840506, 0.13377258, -0.07408689, 0.055212706, 0.14590612, -0.075179085, 0.019402541, -0.05829244, -0.15030795, -0.118763804, -0.00339957, -0.17599902, -0.0661123) * inp_7_0_0; + result5 += M4(0.10968293, 0.12893628, 0.41332203, 0.4638949, 0.19314818, -0.06839382, 0.044725202, 0.14144407, 0.03231626, 0.1284611, 
-0.0041659335, -0.45071155, 0.09169449, 0.11251113, -0.19100508, -0.4401045) * inp_7_1_0; + result5 += M4(-0.116008095, -0.4304109, 0.0067123496, -0.2914923, 0.096316285, -0.07121619, 0.07716929, 0.060829744, -0.02667789, 0.04735419, -0.071996935, -0.2833726, -0.120445386, -0.30460852, -0.21741919, -0.5111675) * inp_7_2_0; + result5 += M4(0.15396431, 0.059088722, 0.019183923, -0.033558667, 0.1326206, -0.0015199828, 0.11263575, 0.054716207, -0.03429147, 0.057047248, -0.048843246, -0.23856844, -0.08047074, -0.0583619, -0.15793824, -0.24397174) * inp_7_0_1; + result5 += M4(-0.10265652, 0.35704884, 0.43083915, 0.41368887, 0.12113184, -0.091761775, 0.006309817, 0.017715422, -0.11447838, 0.0012242236, -0.10764651, -0.42687738, 0.039671645, -0.21236551, -0.039478373, -0.30968052) * inp_7_1_1; + result5 += M4(0.18843968, -0.2350124, -0.019170957, -0.0691535, 0.09529857, -0.100980476, -0.06172172, 0.20962296, -0.028389372, -0.06276643, -0.0602007, -0.27551156, -0.15288739, -0.2860923, -0.051773462, -0.34352845) * inp_7_2_1; + result5 += M4(0.024042439, -0.005430514, 0.04384521, 0.045466665, 0.07861826, -0.08976203, 0.004388678, 0.06327909, 0.041972958, 0.03819288, -0.03636325, -0.21627569, 0.052073456, 0.063, -0.0017517147, 0.17293297) * inp_7_0_2; + result5 += M4(-0.039760187, -0.06190854, 0.05333062, -0.063601844, 0.09475966, -0.054131187, 0.020155566, 0.23628078, -0.020934671, -0.032518595, -0.008303033, -0.28182665, 0.014770909, -0.006195597, -0.024138452, 0.14770478) * inp_7_1_2; + result5 += M4(0.0033399519, -0.045446016, 0.022862913, 0.03829475, -0.02759851, -0.0657359, 0.049873903, 0.06989323, 0.05821027, 0.013484184, -0.048395537, -0.34920686, -0.016318822, -0.08493274, -0.027380776, 0.13732822) * inp_7_2_2; + result6 += M4(0.063858, 0.17975937, 0.27430567, 0.070124075, 0.010893028, 0.1625576, 0.08223857, 0.023882516, 0.05555982, -0.45737204, -0.012592253, 0.008212768, 0.018622011, -0.21203488, 0.03804557, -0.10322732) * inp_7_0_0; + result6 += M4(0.22367126, 
-0.27785185, -0.5485573, 0.032211665, -0.085173056, 0.22053249, -0.02428382, -0.011948985, 0.1814899, -0.16410795, -0.0024127504, 0.006097258, -0.028911812, -0.2904567, -0.10260736, -0.019928899) * inp_7_1_0; + result6 += M4(-0.26699287, 0.014501981, 0.0024913673, -0.03131132, -0.015583287, 0.07814092, 0.05178981, 0.010634761, 0.061294556, -0.17706826, 0.029143605, 0.0014303023, 0.16574372, -0.05003147, 0.56075877, -0.046562485) * inp_7_2_0; + result6 += M4(0.14946893, -0.18638834, 0.16153859, -0.28075913, 0.05694367, 0.14506286, 0.019418847, -0.010065474, 0.040359017, -0.88142097, -0.031873234, -0.006095112, 0.0043407925, -0.42950183, 0.03937959, -0.014487534) * inp_7_0_1; + result6 += M4(-0.04213115, 0.039264034, -1.476328, 0.22680476, 0.06273493, 0.11199137, 0.25075033, 0.021825919, 0.048435688, -0.6183676, 0.085707314, -0.056665014, 0.031227764, -0.32503843, -0.030608246, 0.07617304) * inp_7_1_1; + result6 += M4(0.05376526, 0.22797531, 0.40660712, -0.033960424, 0.08294127, 0.08539029, 0.015474785, 0.034975685, 0.02849205, -0.19692415, 0.07359567, 0.031673267, -0.012328677, -0.07949001, 0.38798198, 0.016132504) * inp_7_2_1; + result6 += M4(0.05585863, 0.00093287084, 0.019845022, -0.03503344, 0.11194936, 0.17812492, 0.06366071, 0.01418595, 0.018196419, -0.31741604, 0.026138872, -0.01738281, 0.03510042, -0.41914243, -0.023240814, -0.002430336) * inp_7_0_2; + result6 += M4(-0.02000724, 0.11472896, -0.022283651, -0.015328622, 0.14447932, 0.2224949, -0.006977726, -0.006962552, -0.026312059, -0.10852069, 0.055961847, 0.016283438, 0.18790397, -0.11394312, -0.09107971, 0.0045249294) * inp_7_1_2; + result6 += M4(0.010605566, 0.0784789, -0.036820155, 0.008404077, 0.11753294, 0.0987805, 0.107818775, -0.015405861, -0.006504625, -0.16418372, -0.007620516, 0.026731528, 0.092712246, 0.13523081, 0.004538151, 0.01887436) * inp_7_2_2; + result7 += M4(-0.04576845, -0.33329424, -0.14109035, 0.08503191, 0.013913061, 0.015043651, 0.106135435, 0.034806777, 0.04579647, -0.10357108, 
0.2137351, 0.012389517, 0.11726017, 0.04425815, 0.08580434, -0.02033563) * inp_7_0_0; + result7 += M4(-0.08590565, -0.22857638, 0.34313104, -0.31230778, -0.069640994, -0.069582544, 0.1658746, 0.029551849, 0.053820264, -0.08880734, 0.20652655, -0.018208902, 0.104174234, -0.08724792, 0.2592679, -0.0037244805) * inp_7_1_0; + result7 += M4(0.0016008765, 0.022337046, -0.08957179, 0.16456534, -0.06976552, 0.20566517, -0.3157708, 0.016905164, -0.0012781883, -0.011794765, 0.19740543, 0.019428613, 0.15914935, 0.060073264, 0.07994299, -0.06332651) * inp_7_2_0; + result7 += M4(0.09119301, -0.20002475, -0.07669936, 0.1643349, -0.060126692, 0.16764893, -0.11436837, 0.015953891, 0.052920435, -0.059379105, 0.2306045, 0.025482927, -0.040881097, 0.1826107, -0.049378753, 0.008433811) * inp_7_0_1; + result7 += M4(0.027494263, -0.3948501, 0.13247472, 0.39170027, -0.112362884, 0.026262274, -0.1713266, -0.016728168, -0.009385176, -0.042910732, 0.12577814, 0.00023914242, 0.023254072, 0.04880443, -0.26621515, -0.0038994795) * inp_7_1_1; + result7 += M4(0.011830901, -0.63424397, 0.21526353, 0.23073396, -0.018827513, 0.078263186, 0.002266272, -0.0144259, -0.0065053087, -0.08099685, 0.07995013, -0.028439919, 0.031789385, 0.1926061, -0.08635181, -0.071400106) * inp_7_2_1; + result7 += M4(0.039354414, -0.0734294, -0.014211014, 0.017328981, 0.04569441, 0.09054408, -0.1105997, 0.0002912659, 8.348863e-05, -0.052722927, 0.13510354, -0.0033420618, 0.04445888, -0.019111622, -0.0010565611, 0.006738578) * inp_7_0_2; + result7 += M4(0.029739989, -0.11730508, 0.15684448, -0.037513692, 0.020392368, 0.15130892, 0.011011553, -0.0030526363, -0.036450185, -0.17872739, 0.17532124, -0.003100543, 0.0442909, 0.0076653264, 0.05813181, -0.030679816) * inp_7_1_2; + result7 += M4(0.012197272, -0.052711457, 0.097683325, 0.06498083, 0.054925352, -0.04803322, 0.14027563, -0.018213192, 0.00988908, -0.111124165, 0.048256498, 0.014215208, 0.02339212, -0.007800636, -0.25679168, 0.037007354) * inp_7_2_2; + const ivec2 
output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 0), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 0), max(result3, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result4, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result5, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 1), max(result6, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 1), max(result7, V4(0.0))); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-3-ReLU) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND conv2d_2 +//!SAVE conv2d_3 +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, 
input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_2_mul * texelFetch(conv2d_2_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.054830547, 0.0012965808, 0.0064878096, 0.03045313); + V4 result1 = V4(-0.010292834, -0.017231606, 0.048370507, 0.0039505763); + V4 result2 = V4(-0.026531944, 0.012619296, -0.0048070257, -0.015144841); + V4 result3 = V4(-0.008347533, 0.010614438, -0.011837911, 0.009907202); + V4 result4 = V4(0.0066377404, -0.004486842, -0.018436108, -0.025362387); + V4 result5 = V4(-0.008088878, -0.01595404, 0.0020544769, -0.010945363); + V4 result6 = V4(0.019478869, 0.046713892, 0.043661587, 0.0020997524); + V4 result7 = V4(-0.008225499, 0.005836407, 0.00083672185, -0.028556151); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.10982058, -0.012740591, -0.006514866, 0.091516994, 0.29076537, 0.04349718, -0.009592644, 0.120071895, 0.29256305, 0.031112367, 0.047033552, 0.063008554, 0.2589514, 0.016059287, -0.0016483165, 0.10072922) * inp_0_0_0; + result0 += M4(-0.009976189, -0.034660067, -0.05988702, -0.037850473, -0.39774182, 0.008394261, -0.028436223, -0.22318241, 0.041616186, 0.01329385, 0.091405146, 0.0769655, -0.8712419, 
-0.050434224, -0.02453685, -0.031755432) * inp_0_1_0; + result0 += M4(-0.1691034, -0.033751413, -0.00948145, 0.0715841, -0.255899, 0.0100278435, -0.074026436, -0.20854044, 0.26269788, -0.015019593, -0.004113398, -0.1179569, 0.461238, -0.027665736, 0.07147676, -0.009157258) * inp_0_2_0; + result0 += M4(0.12896824, 0.09816039, 0.060741358, 0.08859413, -0.6366761, -0.046409193, 0.09188169, 0.11090699, -0.12806052, 0.028848626, -0.027123263, -0.106597364, -0.04566316, -0.016934546, -0.12885474, 0.13219365) * inp_0_0_1; + result0 += M4(-0.017897213, 0.25291327, 0.3699928, 0.3285568, -0.34114113, 0.016561827, 0.301675, -0.042429924, -0.3662829, -0.06127097, 0.04657896, -0.2437102, -0.384972, 0.08152618, -0.04296214, -0.28528953) * inp_0_1_1; + result0 += M4(0.08983714, 0.028156592, -0.075813256, -0.0015062761, -0.62384427, 0.026193274, -0.0770493, -0.29609, 0.41501474, -0.0013042127, 0.08811731, -0.0047251973, 0.07794938, -0.00055200455, 0.004936193, 0.0004992934) * inp_0_2_1; + result0 += M4(0.1599993, 0.051199175, -0.041085795, 0.14333038, 0.101438776, -0.0034577614, -0.054910917, 0.04861873, -0.1797071, -0.024281384, 0.10847992, -0.02191547, -0.33707967, -0.035223458, -0.010600252, 0.044390634) * inp_0_0_2; + result0 += M4(-0.059028365, 0.00056772155, 0.03863578, -0.13610825, -0.19611482, 0.01729689, -0.006402672, -0.019272286, -0.05055594, 0.013851041, 0.09243736, -0.02772995, 0.45680425, 0.047742736, -0.062269267, 0.14888741) * inp_0_1_2; + result0 += M4(0.07281392, 0.010458436, -0.015886214, 0.112827696, -0.1359395, 0.012323563, -0.016377, 0.03181373, -0.12467687, -0.006931877, 0.06592483, 0.018392684, -0.20582324, 0.019906094, 0.031877812, 0.07099835) * inp_0_2_2; + result1 += M4(-0.020107215, -0.05823192, 0.031058766, 0.031742103, -0.043240853, 0.024135886, 0.025899712, 0.09811553, 0.04911715, -0.07329647, -0.09429901, 0.08409397, -0.050274916, 0.05744452, -0.024009125, 0.030989407) * inp_0_0_0; + result1 += M4(-0.15032606, 0.09779696, -0.0343981, -0.12072217, 
-0.14514653, 0.04845875, -0.38898492, -0.06414933, -0.059351712, -0.1031306, -0.00257354, 0.012975814, 0.03865802, -0.10297252, -0.090366215, 0.113541104) * inp_0_1_0; + result1 += M4(0.006900664, -0.057086907, 0.053365584, 0.012915767, 0.03874495, -0.016744567, -0.08258552, 0.18280841, 0.020274008, 0.02681632, -0.06740229, -0.023802891, 0.050390042, 0.064588524, 0.0024872737, 0.11499453) * inp_0_2_0; + result1 += M4(0.08900168, -0.024585227, -4.393836e-05, -0.028076846, -0.11092466, 0.01795373, 0.08868382, 0.0009326618, -0.0005106514, 0.048026018, -0.0717146, -0.0043635056, -0.097015284, 0.09610532, 0.001636637, -0.02076414) * inp_0_0_1; + result1 += M4(-0.15526688, -0.1691233, 0.0693444, 0.12443224, 0.066984996, -0.49856913, -0.09991012, -0.28552386, 0.047772437, -0.05612997, -0.15591313, 0.037226766, 0.1865264, -0.57897836, -0.079939954, -0.51583236) * inp_0_1_1; + result1 += M4(-0.029476834, 0.11924295, 0.121609665, -0.021347066, -0.005625574, 0.13789868, 0.115449235, 0.3076058, -0.027459567, 0.059878554, -0.17003097, -0.06481992, 0.05404227, 0.041201327, 0.01696872, -0.029329) * inp_0_2_1; + result1 += M4(-0.0060892333, 0.05331656, 0.110168815, 0.10189149, 0.03358667, -0.097010806, -0.12102958, -0.097367086, -0.0052978084, 0.046278205, -0.06052234, 0.049059737, 0.0020159371, -0.080543764, -0.057223875, 0.012026612) * inp_0_0_2; + result1 += M4(-0.10299796, -0.17477255, 0.005007318, 0.2004568, -0.020753425, -0.027088644, -0.18493366, 0.03994144, -0.1488216, 0.11311822, 0.0015615877, -0.04890067, 0.07713986, 0.18248764, -0.24135862, -0.09876588) * inp_0_1_2; + result1 += M4(-0.147391, 0.056327097, -0.029427713, -0.17713077, -0.04469036, 0.060747553, -0.063875146, -0.0080002025, -0.027666062, 0.07703426, -0.090916045, -0.10940525, 0.0389736, 0.031133438, 0.05053823, 0.028630167) * inp_0_2_2; + result2 += M4(-0.057276152, 0.00078679423, 0.0408744, 0.022297073, 0.015301215, -0.04425997, 0.037435897, 0.06761282, 0.048210915, 0.01085797, -0.019703774, 0.030927764, 
0.14718978, 0.12519802, 0.16016772, 0.03417672) * inp_0_0_0; + result2 += M4(0.0084984405, -0.036148183, -0.007619507, -0.05109775, -0.047221463, -0.1615655, -0.04290973, 0.0075745117, 0.08399659, 0.11573714, -0.0517214, -0.039162513, -0.0467893, 0.1202751, 0.066238165, -0.093324155) * inp_0_1_0; + result2 += M4(-0.04199616, 0.056634095, 0.02235933, 0.022045027, 0.11466109, -0.009668763, 0.13878249, 0.025846217, 0.07263205, -0.008121716, -0.039129794, 0.047639374, 0.09433126, 0.02704143, 0.071120635, -0.05351851) * inp_0_2_0; + result2 += M4(-0.05992555, 0.10942353, 0.0031044867, -0.045486856, 0.18733808, 0.0028055531, -0.09175669, -0.030181708, 0.08488209, -0.030838845, -0.057479724, 0.00064490386, -0.07514476, -0.09360068, 0.17441988, 0.026088655) * inp_0_0_1; + result2 += M4(0.22528516, 0.14562652, -0.36024526, 0.10402698, 0.3946752, -0.11583821, -0.1981431, -0.082013644, 0.11698827, -0.075526804, -0.11166025, -0.21014425, -0.23172316, -0.40062264, 0.43937913, 0.19389632) * inp_0_1_1; + result2 += M4(0.026450804, -0.066216044, 0.033631686, 0.10120838, -0.11859728, -0.1559114, 0.016163705, 0.16819659, 0.069713905, 0.026020955, -0.15332925, 0.020154823, 0.0446039, 0.10539022, 0.055499826, 0.0130553115) * inp_0_2_1; + result2 += M4(-0.1684037, -0.116589256, 0.11253206, -0.008386985, 0.11980866, 0.050803475, 0.050068505, 0.022354554, 0.19349831, -0.11571167, -0.04694596, -0.0054878863, -0.03736956, 0.08897893, 0.12670177, 0.033199914) * inp_0_0_2; + result2 += M4(-0.43475744, 0.13772966, 0.237789, -0.22752352, 0.21577641, 0.08492413, -0.096339256, 0.033130866, 0.08949253, 0.023196192, -0.099681474, -0.08569851, -0.104312934, 0.16826648, 0.057733756, -0.008398696) * inp_0_1_2; + result2 += M4(0.061192896, 0.034518342, 0.05700942, -0.15431897, -0.020047251, -0.10320459, -0.008780876, 0.008486292, 0.07375619, 0.041690726, -0.12648103, 0.0077065364, 0.09187749, -0.09938572, -0.059948005, -0.023804665) * inp_0_2_2; + result3 += M4(-0.06725944, 0.03286578, -0.007734225, 
0.026448352, -0.085323654, -0.026685596, -0.053297203, -0.20300888, 0.025629446, 0.0025500143, 0.016327277, 0.048129305, 0.012929533, 0.0583211, 0.05188446, 0.13630399) * inp_0_0_0; + result3 += M4(-0.02862313, -0.08906275, -0.06691831, -0.02449247, 0.2138148, 0.021986913, 0.016723104, -0.5861432, -0.12450941, -0.061607152, 0.01106368, 0.010797367, 0.1372415, 0.08150557, 0.013545674, -0.15680812) * inp_0_1_0; + result3 += M4(0.043749206, 0.06667972, 0.03642912, -0.008158083, 0.2948974, -0.03496908, 0.0906917, -0.14049256, 0.013556757, -0.11214098, 0.0010274185, 0.041708805, 0.108135685, -0.0786029, 0.013609907, 0.079803474) * inp_0_2_0; + result3 += M4(-0.022389261, 0.07272213, 0.05119382, 0.079796635, -0.14026248, -0.017950958, -0.16332246, -0.037766658, -0.032462332, 0.008219144, 0.039300688, 0.013795919, 0.0014832972, -0.06991738, -0.12428483, -0.0060676765) * inp_0_0_1; + result3 += M4(-0.31921273, -0.0703039, -0.10103519, 0.3126733, -0.7845808, -0.07435058, -0.056235623, 0.053529203, -9.007399e-05, -0.03541949, -0.09128613, -0.042781524, 0.037208367, -0.28883278, 0.28332347, -0.07338347) * inp_0_1_1; + result3 += M4(0.12874386, 0.03007934, 0.027846077, 0.051513646, 0.25407577, -0.004487952, 0.10492367, -0.050154407, -0.06282506, -0.018956054, -0.10584363, -0.03215706, -0.14389335, 0.09960718, 0.07148565, -0.020797543) * inp_0_2_1; + result3 += M4(0.15774553, 0.15204975, -0.06643703, -0.07841874, -0.08816316, -0.0052060243, -0.022231286, 0.049692273, 0.081600696, -0.006822501, -0.020093966, 0.0039005424, 0.02539474, 0.0426019, 0.011218777, 0.0012189132) * inp_0_0_2; + result3 += M4(0.21383998, 0.039247356, 0.25203094, -0.28953102, -0.25474125, -0.03827542, -0.08541483, -0.0069801663, 0.03193942, 0.071598805, -0.05606597, 0.019687962, -0.063227646, 0.024089387, 0.03058773, 0.120866746) * inp_0_1_2; + result3 += M4(0.03986828, 0.14077576, -0.13876048, 0.011365385, -0.0075535867, 0.08901462, -0.08254162, 0.07051075, -0.058690306, -0.024374142, -0.13574947, 
0.05008099, 0.08815143, -0.010121152, -0.011422719, -0.03709452) * inp_0_2_2; + result4 += M4(0.051281404, -0.03782294, 0.025835853, -0.056877207, -0.07859473, 0.018050497, 0.08758217, -0.17096779, -0.022018308, 0.031662114, 0.00942085, -1.6647848e-05, -0.014446886, -0.047296382, -0.023423195, 0.016275676) * inp_0_0_0; + result4 += M4(0.0048740045, 0.020889705, 0.017901434, -0.011705453, 0.05204315, 0.057203855, 0.19615111, 0.06608282, 0.14422786, 0.08305203, 0.015646417, -0.19646332, 0.134904, 0.0556263, 0.03491973, 0.0024849037) * inp_0_1_0; + result4 += M4(-0.021601832, -0.01379818, -0.03194438, 0.06687667, -0.069935486, 0.09274412, 0.025026627, 0.047901314, -0.10800558, 0.05906842, 0.04834568, -0.003381115, -0.12542026, 0.03208325, -0.03488763, -0.060235254) * inp_0_2_0; + result4 += M4(0.020030232, -0.028058836, -0.0337571, 0.0776937, -0.15539144, 0.10156384, 0.010436925, -0.092925884, 0.06297018, 0.08137466, 0.07226492, 0.0673315, -0.12145713, 0.06252977, 0.06872234, -0.08176458) * inp_0_0_1; + result4 += M4(-0.18246815, 0.0984792, -0.16689564, -0.10678902, -0.13269553, -0.06485133, -0.10494646, -0.12062552, -0.1280414, 0.14527173, 0.03377167, -0.0032539053, 0.36644167, -0.6223342, 0.21247585, -0.47251016) * inp_0_1_1; + result4 += M4(0.04034909, 0.0533942, 0.0039818794, -0.23308986, 0.08956089, 0.073255755, 0.10276742, 0.1417679, -0.102938384, 0.08783126, 0.04735973, 0.052596416, -0.06803056, 0.14252707, -0.082245395, 0.4382288) * inp_0_2_1; + result4 += M4(-0.0977779, -0.001968041, -0.027544986, -0.17584802, 0.05022558, -0.0074931043, -0.006445876, -0.11201318, 0.017534407, 0.07563944, -0.009787373, -0.068408474, 0.08161332, -0.032400206, 0.09716443, 0.012793285) * inp_0_0_2; + result4 += M4(0.019772273, -0.16194232, 0.08118386, -0.11017329, -0.027476585, 0.11962858, -0.087394014, -0.25397804, 0.0011119988, 0.091664195, 0.076695554, -0.08385371, -0.052885603, 0.12951685, -0.04826801, 0.23776641) * inp_0_1_2; + result4 += M4(-0.066594854, 0.11551415, 
-0.07419491, 0.16868998, -0.07188582, 0.10680877, -0.042380374, 0.1910413, -0.13705616, 0.09942634, -0.023658782, 0.031736117, 0.06737333, -0.039768115, 0.038838893, -0.27369988) * inp_0_2_2; + result5 += M4(0.0154745225, 0.017104393, -0.0050691343, -0.087723784, 0.025048187, -0.06093857, 0.01625022, 0.11829746, -0.048894852, 0.053379536, 0.01184427, -0.101745844, -0.121396765, -0.0070769317, -0.014296338, -0.10671555) * inp_0_0_0; + result5 += M4(0.03211086, -0.10416982, 0.017256986, 0.053225942, 0.017530173, -0.22437902, 0.023781708, 0.016116241, -0.06763079, -0.0050163623, 0.029018518, -0.0822437, 0.059028234, -0.10730533, -0.01410919, -0.12963182) * inp_0_1_0; + result5 += M4(-0.018984515, -0.011460061, -0.011605786, -0.01051599, -0.029741142, 0.21336283, 0.016556146, -0.00938771, -0.058469325, -0.12141413, -0.008489555, -0.014319098, -0.061594155, -0.03190426, 0.0055355197, 0.16515489) * inp_0_2_0; + result5 += M4(-0.09325728, 0.20043908, -0.038125373, -0.10577004, -0.0085631255, -0.12915641, 0.02049322, 0.11545498, 0.08479529, 0.12962444, 0.030004704, -0.08601475, 0.10801825, -0.0316153, 0.0015300467, -0.1432845) * inp_0_0_1; + result5 += M4(-0.47656843, -0.08622528, 0.04650464, 0.058655147, 0.038684655, -0.1103069, 0.024933843, -0.0734585, -0.08502867, -0.056103922, -0.037508775, -0.06297659, 0.1651581, -0.13589522, -0.113060765, -0.012947148) * inp_0_1_1; + result5 += M4(-0.14323075, -0.52012247, -0.013353716, -0.11537064, -0.008263955, -0.16005804, -0.025743697, -0.035305392, 0.005480209, -0.010242344, -0.024090962, 0.062970884, -0.031443458, 0.14990155, 0.002599178, 0.017292667) * inp_0_2_1; + result5 += M4(0.06217138, -0.15589373, 0.0427672, -0.035835527, -0.022398526, -0.06286331, -0.029754438, 0.016399672, 0.0143705895, -0.10320985, -0.009439498, -0.079153724, -0.019458398, 0.093156576, -0.041739464, 0.12525265) * inp_0_0_2; + result5 += M4(-0.027242051, 0.042486157, 0.049183488, -0.12694106, 0.061916534, -0.03918012, 0.019351417, 0.03769737, 
0.028784147, 0.024148377, 0.022552356, -0.006455193, 0.15982468, 0.046071324, 0.013818503, -0.03650466) * inp_0_1_2; + result5 += M4(-0.015875053, 0.02279782, 0.023816364, -0.17201911, 0.018937368, -0.21505135, 0.011202766, 0.04400766, -0.045916524, -0.13069485, -0.008001815, 0.061571945, 0.011856554, -0.1408151, 0.040537097, -0.1264704) * inp_0_2_2; + result6 += M4(0.005923681, 0.005352953, -0.05858726, -0.0147767225, -0.050185766, 0.42076784, -0.09101376, 0.05470133, 0.013834389, -0.059668437, -0.047901224, 0.009360044, 0.060512207, 0.0033295883, 0.019845197, -0.025903147) * inp_0_0_0; + result6 += M4(0.021825632, -0.036418106, -0.02204049, 0.010476625, 0.12299869, -0.120608255, 0.2828243, 0.054611277, -0.015105706, -0.18700546, -0.14215119, -0.0024587978, -0.06819282, 0.0014524257, 0.09742223, 0.09239228) * inp_0_1_0; + result6 += M4(-0.023038361, -0.021974817, 0.030154571, -0.05224688, 0.017465075, 0.0023901768, 0.1876502, -0.015490592, 0.027054146, 0.085192464, 0.031080857, 0.017735621, 0.06502142, 0.0020099327, -0.07679857, -0.053366505) * inp_0_2_0; + result6 += M4(0.27612054, -0.068569474, 0.06668788, -0.024399295, -0.0354254, -0.1653161, -0.08574822, 0.06265596, 0.12067656, -0.037515216, 0.087070346, 0.052339975, -0.16693386, 0.35158756, -0.033580568, 0.048351478) * inp_0_0_1; + result6 += M4(-0.1451627, -0.13946442, -0.28245252, 0.18192442, -0.3191277, 0.1618985, -0.09399271, 0.14887439, 0.265996, -0.14910762, 0.26838923, 0.053043276, -0.32943666, -0.15529445, 0.3741341, -0.08322686) * inp_0_1_1; + result6 += M4(-0.111949034, 0.19337775, -0.06063224, -0.0019687032, -0.06869703, -0.23666489, 0.19445013, 0.06011342, 0.074637, -0.04439144, -0.048433952, 0.023817211, 0.12003794, 0.0027114318, 0.004754325, -0.035510935) * inp_0_2_1; + result6 += M4(-0.007629276, -0.016277451, -0.04153511, -0.026758553, -0.020788198, -0.29086918, 0.04163388, 0.010739646, 0.085602984, 0.019719234, -0.024032822, 0.027797762, 0.020408398, -0.065539986, 0.0052375905, -0.0031114172) 
* inp_0_0_2; + result6 += M4(-0.275924, 0.0053848987, 0.15395723, -0.051964633, 0.0053957747, -0.00085099175, 0.02753248, 0.09841061, 0.089889795, 0.014566465, 0.020319387, 0.062932044, 0.21208787, 0.16902515, -0.1467211, -0.010305351) * inp_0_1_2; + result6 += M4(0.17459784, -0.00029953953, -0.08352034, -0.026927141, 0.055285975, 0.106429756, -0.067698866, 0.025931839, 0.12085982, -0.061094202, -0.16430715, 0.024005966, -0.05673644, -0.057041544, 0.037052598, 0.020889034) * inp_0_2_2; + result7 += M4(-0.050024923, -0.036741998, 0.007931197, -0.0029766373, 0.0649808, -0.05594009, 0.02902618, -0.02127805, -0.024034005, 0.0036661315, -0.002485365, -0.053174797, 0.021335995, 0.07008121, -0.046694595, 0.023708422) * inp_0_0_0; + result7 += M4(0.06528063, 0.0016456957, -0.042569224, 0.08140906, 0.021788433, 0.09517711, -0.0015035786, 0.006665169, -0.070820145, -0.0005145233, 0.013988036, 0.025469568, -0.001545416, -0.17194119, -0.033752214, 0.00048347015) * inp_0_1_0; + result7 += M4(-0.05239349, 0.03667953, -0.033824805, 0.07528028, -0.20120917, 0.109877646, 0.018602708, -0.013749203, 0.0040373662, 0.08121354, -0.013561525, -0.11111449, -0.07492937, -0.07009904, -0.052078832, -0.029187785) * inp_0_2_0; + result7 += M4(0.06349731, -0.099767044, 0.027604964, 0.06477159, -0.09783192, 0.046788488, -0.0028254415, 0.00043641008, -0.04802619, -0.036774475, -0.028270615, -0.03370047, -0.008838439, -0.056983374, -0.100692995, -0.0651946) * inp_0_0_1; + result7 += M4(-0.02697025, -0.270191, 0.11418859, 0.025727864, 0.071478225, 0.006399729, -0.036792737, -0.08307892, 0.043991014, 0.121841215, 0.04848309, -0.09797963, 0.22107884, 0.008562042, -0.1554039, 0.07078047) * inp_0_1_1; + result7 += M4(-0.08243478, 0.0020487066, 0.06639316, -0.085234255, -0.1592255, -0.11378887, -0.002977941, -0.7125677, 0.012963613, 0.11818882, -0.044977147, -0.0566414, -0.16333202, -0.07057539, 0.074934684, 0.101134926) * inp_0_2_1; + result7 += M4(-0.019556068, 0.029935293, -0.007651191, 0.028322104, 
-0.012664136, 0.034410194, 0.012694688, 0.03455805, 0.004967433, -0.005150465, -0.0062974123, 0.010333286, -0.041668605, 0.055488486, -0.0058849417, -0.0859952) * inp_0_0_2; + result7 += M4(0.032658786, 0.023452517, -0.099079505, 0.08692457, 0.07745965, 0.03449986, 0.01379791, -0.014052497, -0.030491939, -0.005606245, -0.021408932, -0.05623972, 0.025385473, 0.063120745, -0.0036256856, 0.019120505) * inp_0_1_2; + result7 += M4(-0.18216048, -0.016892454, 0.06824489, -0.33376846, -0.03804535, 0.014542662, 0.06660792, 0.089577034, 0.013053466, 0.030362114, 0.0005584482, 0.12014436, -0.00020366225, 0.0449048, 0.029045431, 0.08328062) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.30269557, 0.024474755, 0.072306074, -0.012991355, 0.17527738, 0.010800459, -0.00096780446, 0.072000556, -0.30456918, -0.005365625, 0.03481661, 0.16322997, -0.61982894, -0.063553266, -0.1000607, -0.10658447) * inp_1_0_0; + result0 += M4(0.16335219, 0.018097393, -0.0010507766, -0.07043353, -0.06914506, -0.037559446, 0.043663267, -0.027523873, -0.8229066, 0.07463837, 0.17863247, 0.024560291, -0.75537246, -0.005596127, 0.046378642, -0.10640086) * inp_1_1_0; + result0 += M4(0.16047691, 0.029817173, 0.0048504593, 0.0782252, 0.05638609, 0.06369435, -0.03562657, -0.0060637677, -0.1415451, 0.0072941426, 0.04346028, 0.098513216, 0.17277186, 0.026861845, 0.044620182, 0.035208605) * inp_1_2_0; + result0 += M4(0.3584926, 0.056591805, 0.08261641, -0.06662095, 
0.09711191, 0.047636468, -0.025771942, -0.051268168, 0.7935556, 0.12037038, -0.23237751, 0.035849806, 0.6076683, 0.06551957, -0.02528956, 0.02825518) * inp_1_0_1; + result0 += M4(0.37324554, 0.11062583, 0.07739545, -0.2523104, -0.026436845, -0.06383766, -0.15515967, -0.12802836, 0.32211027, 0.07670768, 0.010752895, 0.06034309, 0.018552115, -0.019111773, 0.15711148, 0.033862527) * inp_1_1_1; + result0 += M4(-0.33724996, -0.0035219744, 0.0005007514, -0.19320634, -0.039336964, 0.027562212, -0.14899504, -1.6607336, -0.2617643, 0.100311756, 0.061402686, 0.026553908, 0.04316806, -0.010881177, -0.018212492, -0.0010177726) * inp_1_2_1; + result0 += M4(-0.43921602, -0.012323956, 0.14045729, 0.0633853, 0.077174604, -0.017157676, 0.12514064, 0.11404692, -0.071571626, 0.055610113, -0.0015186972, 0.0011426981, 0.03418083, 0.04378983, -0.075370684, 0.017247284) * inp_1_0_2; + result0 += M4(0.39954907, 0.046008635, 0.08850861, 0.05915571, -0.42833132, 0.016262649, 0.14638217, 0.035248242, -0.24839708, -0.02133576, 0.07961118, 0.10459972, -0.101847984, -0.010747174, 0.019404406, 0.10121528) * inp_1_1_2; + result0 += M4(-0.08269866, 0.00688575, 0.10716432, 0.05514754, -0.384778, 0.03511083, -0.7797304, 0.46902186, 0.1304648, -0.011732216, 0.056029465, -0.20490888, -0.36163238, -0.013551068, -0.09974534, -0.1968689) * inp_1_2_2; + result1 += M4(0.03181346, -0.005073577, -0.0132824015, 0.010721783, 0.03866599, -0.017298562, -0.044141285, 0.01892538, 0.027609875, 0.0690624, 0.13973358, 0.022184154, -0.022919571, -0.0404139, -0.0062865894, -0.18302135) * inp_1_0_0; + result1 += M4(0.036394123, -0.06723908, 0.05656019, -0.0487031, -0.004957291, 0.024583632, -0.06758531, 0.015293052, -0.07354126, -0.022916403, -0.1085896, 0.11678869, 0.042573653, 0.04405999, 0.06869961, -0.0046094386) * inp_1_1_0; + result1 += M4(-0.019397294, -0.09568965, 0.13015778, 0.08441093, -0.03433671, 0.002452876, 0.13544545, -0.025439415, 0.1073646, 0.11668207, -0.16208902, -0.032764878, -0.022722026, 
-0.16466609, 0.043614812, 0.07122477) * inp_1_2_0; + result1 += M4(-0.030047065, 0.0113305375, 0.08112173, 0.027220847, 0.032589316, 0.005793805, -0.09789739, 0.10665455, -0.05670955, 0.1605578, 0.20278448, 0.3262937, -0.03152907, -0.02711759, 0.1960279, 0.037902206) * inp_1_0_1; + result1 += M4(-0.06732175, 0.09075589, 0.059716046, 0.09257597, -0.03157995, -0.0699462, -0.009831851, -0.16099973, 0.20591694, 0.10295932, -0.6288529, 0.0024988367, -0.039713223, -0.25592822, 0.03758623, 0.06858805) * inp_1_1_1; + result1 += M4(0.06519385, 0.17362168, -0.09969061, -0.16651925, 0.11196604, 0.12122083, 0.035175093, -0.032635886, 0.043285746, 0.06778545, 0.16352718, -0.15932071, -0.04434414, 0.0003528175, 0.13820007, 0.1674394) * inp_1_2_1; + result1 += M4(0.11447479, -0.016538067, 0.021553246, 0.08342736, 0.010986007, -0.11829318, 0.11487773, -0.17347062, -0.027311489, -0.08904312, 0.036699004, 0.14675663, -0.1231484, 0.15359169, 0.08499425, 0.17710738) * inp_1_0_2; + result1 += M4(-0.075537615, 0.13846144, -0.04160933, 0.062621385, -0.0051212977, -0.024924116, 0.038809385, -0.20541279, 0.08553491, 0.061504062, -0.3024476, -0.1819159, 0.106576174, 0.027823731, 0.065816246, 0.1088652) * inp_1_1_2; + result1 += M4(-0.033302438, 0.08049959, -0.0025926507, -0.17453663, -0.49338788, 0.07417215, -0.20396125, 0.1693647, 0.06905949, 0.07936141, -0.14016181, -0.010198017, -0.057946414, -0.08739994, 0.22005717, 0.26872683) * inp_1_2_2; + result2 += M4(0.022753663, 0.035411138, -0.1354691, 0.0076684523, 0.019066427, -0.023406312, 0.052692134, -0.011588697, -0.022667633, -0.010193716, -0.0985684, 0.022027202, -0.058258355, -0.0876388, 0.026646296, -0.13696992) * inp_1_0_0; + result2 += M4(0.11024083, 0.0042924155, -0.17406626, 0.07390863, -0.060180243, -0.045007274, -0.06408562, -0.0891837, 0.10861634, 0.054801397, -0.2165749, 0.06857541, -0.047029186, -0.0654428, -0.04817841, 0.0420361) * inp_1_1_0; + result2 += M4(0.06859174, 0.18640882, 0.017156472, 0.03057497, 0.07479399, 
0.024887502, 0.06418304, 0.02584432, -0.031406976, -0.005787644, -0.009339056, -0.008957542, 0.0103491, 0.057798054, -0.02751038, -0.03289279) * inp_1_2_0; + result2 += M4(0.07493084, 0.051820397, -0.16289212, 0.03160181, -0.08288271, 0.0661164, -0.16012284, 0.084629446, 0.19783445, -0.26249158, 0.07055087, 0.12808587, -0.022840956, 0.0036855547, 0.049803365, -0.059684306) * inp_1_0_1; + result2 += M4(0.22209504, -0.03546477, -0.19937533, 0.09869711, 0.10014813, -0.38678938, 0.4144948, 0.21822804, 0.11514099, 0.3643559, -0.41228855, -0.24910495, 0.086637005, 0.0053489283, -0.1275489, -0.070925) * inp_1_1_1; + result2 += M4(-0.060611747, 0.061933815, -0.08615913, -0.01295277, -0.14138399, 0.16389652, 0.08678853, 0.38904756, 0.01739179, -0.09852084, -0.20937067, 0.19373156, -0.054982513, 0.01186394, 0.02588956, 0.07218609) * inp_1_2_1; + result2 += M4(0.028843088, 0.12052598, -0.14811821, 0.019479118, 0.027513694, 0.16287196, 0.11698507, -0.103557646, 0.28963044, 0.0003964868, -0.05982367, 0.029035741, 0.0008978427, -0.23884556, -0.12006983, 0.020042367) * inp_1_0_2; + result2 += M4(0.14947018, -0.017167613, -0.19448759, 0.059883833, -0.06284381, 0.29311362, 0.36026067, 0.04379264, 0.1915929, -0.2665795, -0.12984599, 0.08890368, -0.00023197167, 0.10725576, -0.027011951, 0.009788535) * inp_1_1_2; + result2 += M4(0.050289962, -0.03545846, -0.042906597, 0.03214387, -0.6424356, 1.0542774, 0.42425898, -0.06613076, -0.024413206, -0.20536068, -0.043584146, -0.0047029504, -0.08573395, -0.12284028, 0.064642794, 0.05384897) * inp_1_2_2; + result3 += M4(-0.020012267, 0.012859643, 0.015370767, 0.07618518, -0.038946133, -0.0071750456, -0.03493357, -0.025624147, 0.09811349, 0.045265503, 0.025548207, 0.018746309, 0.12870269, 0.088603266, 0.028311914, -0.12095206) * inp_1_0_0; + result3 += M4(-0.13689539, 0.01248729, -0.04580356, 0.01621743, 0.12967376, 0.032390703, 0.12357428, -0.0989263, 0.11705827, -0.22203815, -0.09600206, 0.17552039, 0.11204767, 0.16064024, -0.085557, 
-0.01693152) * inp_1_1_0; + result3 += M4(-0.12909119, 0.022679834, -0.06860134, 0.02731248, -0.07287666, -0.04076358, -0.036916994, 0.07345657, 0.25613928, -0.23727654, 0.008401201, -0.21287763, -0.087643944, -0.0030912769, 0.01616772, 0.08233766) * inp_1_2_0; + result3 += M4(-0.0849945, 0.040283732, -0.0002361443, 0.05403328, 0.017037027, 0.0015854764, -0.023552608, 0.10702082, -0.2776833, -0.17257352, -0.20315248, 0.09896589, -0.07247323, 0.039611705, -0.08314167, -0.034638207) * inp_1_0_1; + result3 += M4(0.08833979, -0.025370013, 0.042159013, -0.04433219, 0.13150145, 0.12805696, 0.40037584, 0.25763384, 0.06593088, 0.1972655, 0.20752302, -0.26399875, -0.02485801, 0.07402455, -0.052619148, 0.066685215) * inp_1_1_1; + result3 += M4(0.08259008, 0.025988085, -0.14765613, -0.14172907, 0.056767177, 0.032773487, -0.24328338, 0.009497725, 0.21833076, -0.034707095, -0.046802852, -0.050703935, 0.11939457, 0.10291383, -0.030698648, 0.12951323) * inp_1_2_1; + result3 += M4(0.06176872, 0.05075453, 0.02771466, 0.022697663, -0.06550375, 0.11939141, 0.053551078, -0.017284516, -0.06873912, -0.15980148, -0.09160511, -0.07310046, -0.18072455, -0.15445977, -0.22140184, 0.09153849) * inp_1_0_2; + result3 += M4(-0.024409248, 0.0024001535, -0.07802349, 0.053587735, -0.12622099, -0.09523909, 0.20193392, 0.1647152, 0.117360495, 0.25452694, -0.10429262, 0.16203742, -0.09467241, 0.38643107, -0.1329574, 0.15046106) * inp_1_1_2; + result3 += M4(0.08801183, 0.079525605, -0.17040928, 0.039099287, -2.0701196, 1.0211174, -0.112164974, -0.11844553, 0.029075297, -0.11323424, 0.014148607, 0.1310756, 0.15000159, -0.30582106, 0.03360387, -0.14169903) * inp_1_2_2; + result4 += M4(-0.016603397, 0.013941391, -0.015546802, 0.1714543, -0.026720505, 0.014055414, 0.02051034, -0.029670438, -0.13825439, -0.044931296, -0.07340305, 0.22062492, -0.042984795, -0.10420866, -0.004644297, -0.009833013) * inp_1_0_0; + result4 += M4(-0.023275193, 0.04257238, -0.026264105, -0.0508946, 0.023640722, 0.040554818, 
0.061302382, 0.018225372, -0.06066702, 0.02117856, 0.19365843, -0.17996845, -0.004065635, 0.006170249, -0.005316913, 0.1931039) * inp_1_1_0; + result4 += M4(-0.11080621, 0.12125387, -0.09969529, 0.07826912, -0.00467889, -0.08452116, -0.11980451, 0.024678951, -0.01928157, 0.044728525, 0.16327979, -0.26458976, 0.03224589, 0.02401515, -0.039033264, 0.053628873) * inp_1_2_0; + result4 += M4(-0.14608693, -0.007973844, -0.082519025, -0.05725343, -0.09058293, -0.07408936, 0.06420212, 0.1469696, -0.08183665, 0.19863471, -0.2528339, 0.16488287, -0.029332854, 0.020286981, -0.15635143, 0.30133048) * inp_1_0_1; + result4 += M4(-0.23231204, 0.10305437, -0.14025065, -0.2212385, 0.2867491, -0.064046875, 0.3145619, 0.055842843, 0.06859873, 0.22729145, 0.27076298, 0.15291668, 0.14494711, -0.049178306, -0.117558606, -0.1358841) * inp_1_1_1; + result4 += M4(-0.19027685, 0.0658207, 0.10741228, -0.013328404, 0.01085595, 0.021311216, -0.2613098, 0.036061294, -0.010575938, -0.13170883, 0.11104949, -0.66600585, 0.03113766, -0.02486045, -0.0242793, -0.11614288) * inp_1_2_1; + result4 += M4(-0.032819185, 0.014689205, -0.0027553523, -0.050498907, 0.025851093, 0.04340202, -0.013173224, -0.06984222, -0.18823458, -0.0840787, -0.12827387, -0.039105415, -0.055798266, 0.05020136, -0.07649838, 0.29797465) * inp_1_0_2; + result4 += M4(-0.2808994, 0.09720502, -0.000854193, -0.102636635, -0.12361861, -0.09703597, 0.089782685, -0.10886694, -0.07962227, 0.13679606, 0.123063125, 0.13545127, 0.023218371, 0.18287455, -0.15057807, -0.4666422) * inp_1_1_2; + result4 += M4(-0.15712953, 0.075165324, -0.040125176, 0.19242266, -0.25188085, 0.13886544, 0.61723804, 0.116459906, 0.03286226, -0.017309083, 0.011404921, -0.37526968, 0.045802023, -0.11269483, 0.10749571, 0.07697939) * inp_1_2_2; + result5 += M4(-0.03911439, 0.026189936, 0.007847939, -0.040387575, -0.038696777, 0.09524303, -0.018494349, -0.12762623, 0.020617101, -0.11656945, -0.008982797, -0.0022253338, 0.029266238, -0.23067324, -0.050875355, 
-0.084742144) * inp_1_0_0; + result5 += M4(-0.06777168, -0.21798666, -0.022399884, 0.067011766, 0.05105622, -0.089263536, 0.02690526, 0.11249946, -0.19087774, -0.07889786, -0.060218334, 0.27934235, 0.008272654, 0.18985388, -0.054262936, -0.06694628) * inp_1_1_0; + result5 += M4(-0.10240771, -0.04430134, -0.0037491682, 0.014672962, 0.033399668, 0.13299502, 0.023993675, 0.034441773, 0.15730496, -0.09426704, -0.0149276825, 0.10052365, -0.030169783, -0.17205209, 0.02082356, -0.012137901) * inp_1_2_0; + result5 += M4(0.00850388, -0.17375591, 0.021272168, -0.0028996866, -0.021047948, -0.102435, -0.059557483, -0.013514055, -0.04658541, -0.15552434, 0.08742993, -0.050793927, -0.022599846, -0.18440396, 0.019807735, -0.15563595) * inp_1_0_1; + result5 += M4(-0.023653727, -0.11540974, 0.099953406, 0.14761837, -0.0059183715, 0.19195135, 0.33243492, 0.105192214, 0.06144109, -0.48182294, -0.07469599, 0.06416651, -0.076081716, -0.12234789, 0.012383203, -0.22974844) * inp_1_1_1; + result5 += M4(-0.025606385, -0.161005, -0.0249916, 0.03627222, -0.1308855, 0.05132972, -0.015126548, -0.10892074, 0.14474423, -0.24236955, -0.08069982, 0.117432386, -0.0076897796, 0.0032170191, -0.031750042, -0.08547233) * inp_1_2_1; + result5 += M4(0.023146098, 0.08316227, 0.059037372, -0.055162914, -0.07097596, -0.049974356, -0.0436943, 0.04592139, -0.02501389, -0.04799623, 0.10315793, -0.06637637, 0.09045691, -0.6113871, 0.0697879, -0.0823258) * inp_1_0_2; + result5 += M4(0.03099753, 0.06475188, 0.060946546, -0.015843933, -0.16026522, -0.13000119, 0.19894855, -0.011193683, 0.14915963, -0.09406111, 0.033710547, 0.09237775, -0.011312366, -0.17021745, -0.036476675, -0.28746206) * inp_1_1_2; + result5 += M4(0.016429052, -0.05797785, 0.066454455, 0.07269945, 0.2145377, 0.133942, -0.044717114, -0.34782046, -0.08404225, -0.10399573, 0.014317495, -0.0896574, -0.097591184, -0.30324572, -0.010489775, -0.07374811) * inp_1_2_2; + result6 += M4(0.016494539, -0.121091604, 0.06054299, 0.03004157, -0.06542263, 
0.058107913, -0.086591534, 0.026495336, 0.010657284, -0.061960723, 0.12176603, -0.071122155, 0.23403807, 0.10989286, 0.1848039, -0.056117553) * inp_1_0_0; + result6 += M4(-0.054966435, 0.07282338, -0.02435177, 0.021567814, 0.096014254, -0.023505222, 0.17366008, -0.014335525, -0.0011055338, -0.1318606, 0.086757325, -0.055904664, 0.17704555, -0.15156521, 0.17922059, 0.03214013) * inp_1_1_0; + result6 += M4(-0.0786131, -0.020328617, -0.04547878, 0.0013788455, -0.11473682, -0.012737104, -0.10713952, -0.011520205, -0.09900169, -0.16086456, 0.14561777, -0.035957765, 0.008269635, 0.017093785, -0.1037307, 0.0036418466) * inp_1_2_0; + result6 += M4(0.031397294, -0.07540801, -0.037602127, 0.06567893, 0.050398745, 0.08258671, 0.16388349, 0.009146902, -0.30595106, 0.39656153, -0.50477564, -0.0014968803, 0.061396755, 0.088925414, -0.08439351, 0.013863179) * inp_1_0_1; + result6 += M4(-0.10432704, -0.06577285, 0.093821384, 0.04107468, -0.07777119, -0.2249931, -0.24430999, -0.02417863, 0.17419653, -0.3386946, 0.16103752, 0.10330558, 0.07329377, 0.15135153, -0.32571897, -0.008295151) * inp_1_1_1; + result6 += M4(0.016331948, -0.06236673, 0.14914186, 0.14669977, -0.027860314, 0.11981889, 0.25596422, 0.03605577, -0.19203454, -0.3623619, 0.02186408, 0.19966854, -0.08421466, 0.07800755, 0.16180833, -0.050675165) * inp_1_2_1; + result6 += M4(0.12513113, -0.19236597, -0.055917047, 0.059285834, 0.04631141, -0.06637595, 0.069366336, 0.11438423, -0.026736215, 0.036037363, 0.021823253, -0.053096615, 0.14108121, 0.19560942, -0.30060548, -0.012995197) * inp_1_0_2; + result6 += M4(0.16300343, 0.12243012, -0.14078994, 0.036281344, -0.11110958, 0.1166609, 0.046082694, -0.047192413, 0.073975876, 0.31089678, -0.12439041, 0.037810072, 0.017263288, -0.108918145, 0.039634183, 0.022181584) * inp_1_1_2; + result6 += M4(0.18956064, -0.022126596, -0.14967448, 0.0975421, 0.8716915, 1.1406955, 0.18743217, -0.262032, 0.008468656, -0.16995469, 0.38257113, 0.07979466, -0.20802194, 0.17705217, 0.15278205, 
-0.052346867) * inp_1_2_2; + result7 += M4(-0.014168415, 0.0028227556, -0.011094773, 0.03414833, -0.016941529, 0.018039742, 0.023924772, 0.044051953, -0.06597208, 0.14796792, -0.00030572028, 0.0016482981, -0.039208032, 0.12105214, 0.012112879, -0.058318406) * inp_1_0_0; + result7 += M4(-0.02254172, 0.07434322, 0.030422486, 0.025256548, 0.060421214, 0.00039682197, 0.03704722, -0.003694749, -0.17357789, 0.08272758, 0.06215911, -0.077005, -0.0050363303, -0.019033076, -0.02483429, 0.043140613) * inp_1_1_0; + result7 += M4(-0.04218801, -0.13153923, 0.03815967, -0.07583708, -0.014611307, -0.14244065, -0.022095192, -0.08031202, -0.017516967, 0.3088922, -0.017189479, 0.06363921, 0.027827049, -0.053178754, -0.025168562, 0.025001332) * inp_1_2_0; + result7 += M4(-0.025126325, -0.00031959143, 0.0066268165, -0.016415348, -0.081795506, -0.08576364, 0.01052557, -0.016369233, -0.008558037, 0.05234396, 0.05808942, 0.06265084, 0.039303627, -0.10785717, -0.032388244, 0.176247) * inp_1_0_1; + result7 += M4(-0.18299799, -0.024562242, -0.029792702, -0.07807039, 0.16036591, 0.17115456, 0.14453392, 0.098073915, -0.09789746, -0.4444426, 0.2066417, 0.0061070966, -0.124437496, -0.23774308, 0.06040171, 0.09863888) * inp_1_1_1; + result7 += M4(-0.040129814, 0.123747505, 0.12618391, -0.58781093, 0.006509252, -0.052109238, -0.059657697, 0.05094686, 0.21263094, 0.1718124, 0.13251536, -0.29256305, -0.013811634, 0.036461562, -0.039024904, -0.08942828) * inp_1_2_1; + result7 += M4(-0.07205996, -0.023193875, 0.02413695, -0.005410371, -0.0329929, -0.05130934, 0.008741132, -0.037632667, 0.014091258, -0.019722303, -0.02750181, 0.020811226, -0.12573652, 0.03452404, -0.011810205, -0.08503362) * inp_1_0_2; + result7 += M4(-0.06660542, -0.004078647, 0.008184792, -0.15180305, 0.16185701, -0.10736026, -0.11906615, -0.20625357, -0.18091203, 0.03147689, 0.13583875, -0.16741589, -0.034853216, -0.05600319, 0.05886042, 0.1576273) * inp_1_1_2; + result7 += M4(-0.09327809, -0.05312218, 0.04556382, -0.39802355, 
0.3064705, -1.3490797, 0.3018286, 0.23860133, 0.061773017, 0.13580303, 0.05393095, -0.18875845, -0.04584805, 0.009606055, -0.007949275, -0.08936126) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.021997444, 0.044049546, -0.030772122, 0.41508996, -0.19588752, 0.0075623174, -0.115546905, -0.059804954, -0.6696464, -0.04947869, 0.110914424, -0.018229363, 0.060386267, 0.044989806, 0.04060435, 0.15933013) * inp_2_0_0; + result0 += M4(-0.16872247, 0.12348137, 0.08762962, 0.0060786083, -0.05960576, -0.02287395, -0.07336312, -0.28710604, -0.283261, 0.05996977, 0.14308323, 0.24931699, 0.1593908, 0.01737162, 0.03557824, 0.057269245) * inp_2_1_0; + result0 += M4(0.04366554, -0.010207282, 0.009146312, -0.0108441245, -0.1516246, -0.022801729, 0.011468555, 0.06972773, -0.40637326, 0.011701978, -0.034046967, -0.007526116, -0.29465833, -0.017827703, 0.015436831, 0.10179091) * inp_2_2_0; + result0 += M4(-0.012710725, 0.018422538, 0.077280074, -0.037839267, -0.33691335, -0.031597123, 0.06198087, 0.03641066, -0.21688773, 0.02239475, 0.011060993, 0.15002233, 0.25705907, 0.11278149, -0.06355379, 0.009697891) * inp_2_0_1; + result0 += M4(-0.1155845, -0.01163228, 0.1422029, -0.07330355, -0.008602184, 0.11368691, 0.03082402, 0.18690431, 0.16100468, -0.08916578, 0.5522677, 0.17935137, -0.14923705, 0.042491175, -0.04387118, -0.036680695) * inp_2_1_1; + result0 += M4(0.48946202, 0.021047471, -0.054350443, -0.18858969, -0.00542162, 3.6431604e-05, 
-0.05637342, 0.008359004, -0.3686211, -0.03162433, 0.059451472, -0.0092607085, -0.12588061, 0.004459396, 0.038965862, 0.13677111) * inp_2_2_1; + result0 += M4(0.18901907, -0.04228128, 0.013302958, 0.029529579, 0.0341256, -0.010738776, -0.008861197, -0.051687468, -0.027258344, -0.012591743, 0.03346695, -0.023558926, -0.114794, 0.008244787, -0.0088010775, 0.033434853) * inp_2_0_2; + result0 += M4(-0.16742985, 0.026331449, 0.05012329, 0.048419163, 0.41793993, 0.025040464, 0.01610751, -0.09716056, 0.09943026, -0.0015133824, 0.0033379279, -0.18956405, 0.10443189, 0.021406546, -0.035613455, -0.061603043) * inp_2_1_2; + result0 += M4(0.021601658, -0.015586206, 0.018320113, 0.053182647, -0.124976344, -0.0051255194, -0.070529625, 0.035067342, 0.16870965, 0.0024438957, -0.06977562, -0.11300458, 0.1596587, 0.007964323, 0.034449283, -0.018044638) * inp_2_2_2; + result1 += M4(-0.008813268, 0.018908674, -0.07150236, 0.052042812, 0.02642266, 0.08658468, 0.07085128, -0.023014054, -0.061222788, 0.066560015, -0.35415155, -0.18382077, -0.007835073, 0.012178085, 0.0703424, 0.1085751) * inp_2_0_0; + result1 += M4(-0.006009746, 0.012783441, -0.13207084, -0.19561172, -0.062245026, -0.043850552, 0.023896812, -0.20729296, -0.15156464, 0.025482161, -0.2708885, -0.42137152, 0.021738213, 0.18821439, -0.019050872, 0.09660338) * inp_2_1_0; + result1 += M4(-0.033591483, 0.008725917, 0.028338626, -0.05716644, 0.009005115, -0.1712277, -0.0821282, 0.1127398, -0.0010452829, 0.13593921, 0.017277464, -0.055401348, -0.011198611, 0.054470792, -0.05236175, -0.059327457) * inp_2_2_0; + result1 += M4(0.1736332, -0.22738853, -0.14361833, -0.21622773, -0.010308091, -0.0042392923, -0.1603784, -0.0063405503, -0.09024079, -0.13907702, -0.39666745, -0.4329024, 0.030122086, 0.16427542, -0.012811582, 0.15375149) * inp_2_0_1; + result1 += M4(0.09846725, -0.08639054, -0.0447524, -0.13340083, -0.19458963, 0.33186463, 0.09810691, 0.07893366, 0.4220245, -0.75361836, 0.19528766, -0.31414455, 0.1293179, -0.0013319645, 
0.13985872, 0.29513425) * inp_2_1_1; + result1 += M4(0.13184151, -0.087994754, 0.1844651, -0.17508732, 0.049291972, 0.053399846, -0.031077217, 0.041508056, 0.025074461, 0.0017657205, -0.24002784, 0.0049937614, 0.11017485, -0.09641372, -0.16722536, -0.16167179) * inp_2_2_1; + result1 += M4(0.09991439, 0.023448879, -0.075822555, 0.02100272, -0.036018115, -0.069850296, 0.057555184, 0.094630055, -0.022452323, 0.09070093, -0.15554021, 0.05747267, -0.07371389, 0.038306884, -0.020492801, 0.0019010724) * inp_2_0_2; + result1 += M4(-0.009647361, 0.023211418, -0.06521856, -0.0144808795, -0.034097657, -0.18075426, -0.03551263, 0.11647566, 0.0071723526, -0.20010452, -0.21579625, 0.17365079, -0.01047968, 0.027456664, -0.07157368, 0.005232428) * inp_2_1_2; + result1 += M4(0.10803588, 0.04938575, -0.0038869027, -0.013368346, -0.100351274, 0.028455064, -0.040416975, -0.08912241, -0.041403398, 0.036996566, -0.042103283, 0.31879035, 0.027408354, 0.013636946, -0.09977277, 0.07362493) * inp_2_2_2; + result2 += M4(-0.11624354, -0.074867785, 0.10025746, 0.013830487, -0.029371267, -0.09734533, 0.027255073, 0.046926424, 0.08359563, 0.011743867, -0.16400759, 0.03056084, 0.041996956, -0.107946776, 0.025973141, 0.048463963) * inp_2_0_0; + result2 += M4(0.05525578, -0.308283, 0.041809913, -0.032293487, 0.07349483, -0.13939571, -0.04460139, 0.02715225, 0.2179399, -0.13865696, -0.27787468, 0.11205488, -0.06393625, -0.074597225, -0.002686919, 0.028047793) * inp_2_1_0; + result2 += M4(-0.094650224, -0.10884903, 0.008471161, 0.010110828, 0.0044701477, 0.016495997, -0.060995277, 0.16716228, 0.057599105, -0.011413096, -0.1769324, 0.07813809, -0.018895393, 0.06649551, 0.03401761, -0.061807733) * inp_2_2_0; + result2 += M4(-0.016222082, -0.1361606, 0.010170801, 0.0078088753, -0.006569495, -0.038807865, 0.0071600596, 0.006556699, 0.33211276, -0.11541637, -0.27552143, 0.032811254, 0.14589228, -0.31307983, -0.041263882, 0.045589656) * inp_2_0_1; + result2 += M4(-0.19408686, 0.07328485, -0.2723991, 
0.03292708, -0.03276843, -0.0021388177, 0.025440231, 0.020864552, 0.4946809, -0.5028873, 1.2360919, 0.18543124, -0.14062038, -0.45266026, -0.051517818, -0.07946748) * inp_2_1_1; + result2 += M4(0.101486355, -0.110838085, -0.100334816, -0.06806774, 0.038783833, -0.14677909, -0.02135858, 0.042495932, 0.23560962, -0.11233732, -0.31377485, 0.20676668, 0.115377106, 0.21643944, 0.07656673, -0.029281162) * inp_2_2_1; + result2 += M4(-0.022647236, -0.056124248, -0.029345546, -0.08842019, -0.026206177, -0.2001142, 0.024282888, -0.018178977, 0.17126927, 0.114405416, -0.14800842, 0.057950426, 0.0019471733, 0.04153646, -0.033398405, -0.018740349) * inp_2_0_2; + result2 += M4(-0.028510725, -0.13194804, -0.058474723, 0.15739538, -0.22837207, 0.2936676, 0.17756914, -0.17392308, 0.29371956, -0.06232126, -0.17738655, 0.12433346, 0.00036821538, -0.04049821, 0.12775612, -0.03410144) * inp_2_1_2; + result2 += M4(-0.049271945, 0.07341013, -0.029218232, 0.044777937, 0.047895044, 0.016777143, 0.0770696, -0.080288544, 0.12856913, 0.077402525, -0.09243285, 0.14783, 0.018761791, -0.07868494, 0.0038686912, 0.023355907) * inp_2_2_2; + result3 += M4(-0.0029995563, -0.13207191, 0.01146984, -0.19970092, -0.06331003, 0.037494518, 0.06209565, 0.11000684, 0.15045387, -0.09143123, -0.14541022, -0.115673035, -0.04994145, 0.04097571, -0.113562085, 0.053608663) * inp_2_0_0; + result3 += M4(-0.18109503, 0.06472273, 0.12718305, 0.120410495, -0.09936854, -0.035682097, -0.008422925, 0.088556394, 0.31332913, -0.027132012, -0.075477965, -0.005758827, 0.11464046, 0.028312951, -0.027150951, -0.16116877) * inp_2_1_0; + result3 += M4(0.0877825, 0.17123228, 0.2082314, -0.12994865, -0.0070057088, -0.016857732, 0.04226811, 0.056832854, -0.08325704, -0.11599846, 0.11562998, -0.04030524, -0.020303925, -0.009562874, 0.00033680667, -0.09528862) * inp_2_2_0; + result3 += M4(-0.085425824, 0.07744438, 0.019893674, -0.0326164, -0.19022621, -0.056022335, 0.077502415, 0.06535808, -0.16737926, -0.052317273, -0.06842497, 
-0.023366082, -0.1893424, -0.15218306, -0.024155376, 0.0037170032) * inp_2_0_1; + result3 += M4(0.16134766, 0.022937534, 0.012012558, 0.014299104, -0.1540332, 0.050365888, -0.07502351, 0.4454789, -1.3961762, -0.409505, -0.20002379, 0.11962769, 0.115599185, -0.25595054, 0.033835527, 0.082020186) * inp_2_1_1; + result3 += M4(-0.038860165, 0.012057152, 0.014026204, -0.15625226, 0.18684216, -0.3406752, -0.04533004, 0.03181735, 0.07668722, -0.40258294, 0.22383828, 0.096628584, -0.14252743, 0.12657546, -0.0005994765, 0.027612105) * inp_2_2_1; + result3 += M4(-0.08842523, -0.07339288, -0.0291693, 0.010607715, 0.01738062, 0.028641904, -0.008154934, -0.06921586, -0.1265699, -0.033918753, 0.025832465, -0.05287533, 0.059064966, -0.019668518, 0.012982388, -0.08999742) * inp_2_0_2; + result3 += M4(0.02235242, -0.14085144, 0.06261052, 0.038736455, 0.04892613, 0.18863972, 0.13817543, -0.2107788, -0.4000103, -0.25693175, -0.006828332, 0.014900624, 0.07850594, -0.11873039, 0.022611257, -0.08396981) * inp_2_1_2; + result3 += M4(-0.000430553, 0.10634275, -0.038480487, 0.06344152, 0.089059435, -0.087476514, -0.086669914, -0.07314378, 0.103207834, -0.1929012, 0.14462645, 0.006974721, 0.054145847, 0.07826243, -0.016338583, 0.03196374) * inp_2_2_2; + result4 += M4(0.06768001, -0.00499547, -0.003675126, 0.0021674372, -0.005389211, 0.01193385, 0.0058679217, 0.22818673, 0.10959775, 0.090091, 0.17508048, -0.26410308, 0.032208588, -0.023449732, 0.030592103, 0.04377794) * inp_2_0_0; + result4 += M4(-0.005548309, 0.038780797, 0.07501425, -0.09693298, 0.08645423, 0.010519084, 0.042117484, -0.18862607, -0.2615312, 0.16094548, 0.19046587, -0.057982862, 0.13564762, 0.015395081, 0.10041826, 0.1280523) * inp_2_1_0; + result4 += M4(0.051592816, -0.1338818, 0.007333832, -0.123867884, -0.12680902, 0.06317454, 0.06440648, 0.12702128, -0.13188729, -0.036226053, 0.06359583, -0.11264101, 0.0660465, -0.006911252, -0.014305653, -0.028108718) * inp_2_2_0; + result4 += M4(0.049971808, -0.05761393, 0.11083267, 
-0.18402518, 0.06735368, 0.0041248915, 0.026761187, 0.010691537, -0.06932569, 0.2151191, 0.19134477, 0.15462732, 0.1109586, -0.15138485, -0.15404533, -0.21345302) * inp_2_0_1; + result4 += M4(0.018412264, -0.033277724, 0.0898307, 0.2566932, -0.051799186, 0.02853305, -0.12949951, 0.029116428, -1.2733469, -0.5277587, -0.36332208, -0.35201743, 0.19711241, -0.14139847, 0.20627017, -0.36296353) * inp_2_1_1; + result4 += M4(0.07577946, -0.0005393289, -0.026576016, 0.22958, 0.013882234, -0.012866181, 0.16016053, 0.082879774, -0.4841638, 0.0410127, 0.026998263, -0.011007121, 0.064556554, 0.059679985, -0.110813856, -0.11247338) * inp_2_2_1; + result4 += M4(0.0187036, -0.026425784, 0.04100837, -0.040003598, -0.026095727, 0.018318983, -0.00015628185, -0.18648197, -0.048101194, 0.035294995, 0.1561849, 0.0048523545, 0.03734202, 0.051587924, 0.0284748, 0.110711984) * inp_2_0_2; + result4 += M4(-0.09949442, 0.003933561, 0.016302442, 0.19469865, 0.08564367, -0.06126775, -0.0131361075, -0.07832848, -0.2131697, 0.14222373, -0.04763422, -0.03758709, 0.015545757, -0.01926171, 0.120433465, -0.17747171) * inp_2_1_2; + result4 += M4(-0.031215243, 0.0013107703, -0.06944148, -0.29730096, -0.034608968, 0.057521135, 0.076586805, 0.339433, 0.04639953, 0.11480179, 0.034000043, 0.19678573, -0.0015786143, 0.029393451, -0.031088682, 0.07424715) * inp_2_2_2; + result5 += M4(0.084909126, 0.26261202, 0.006332271, -0.06169323, -0.0049925353, -0.12078485, 0.03131402, 0.021565568, -0.04591256, -0.11447064, -0.08151524, 0.19689722, -0.025483731, 0.10425385, 0.043867875, 0.101235926) * inp_2_0_0; + result5 += M4(0.1826475, 0.09245448, 0.017294127, 0.15367286, 0.041482806, -0.11556683, 0.008357756, 0.06606663, 0.03601229, 0.24304186, 0.010745679, 0.020015173, 0.10999528, -0.07473047, 0.014502385, 0.08732145) * inp_2_1_0; + result5 += M4(-0.0055459463, -0.15590164, -0.012428197, -0.26767948, -0.037749413, 0.2883306, 0.0138880145, 0.0993656, 0.024365727, -0.04036223, 0.008223542, -0.15287904, 0.0076344674, 
0.1015054, 0.001841306, 0.020273104) * inp_2_2_0; + result5 += M4(0.0696052, -0.16385162, 0.0054490613, 0.19719483, -0.022028316, 0.03143943, -0.044547305, -0.019765042, -0.03168259, 0.013942067, -0.06350953, 0.08778414, 0.0052135354, -0.14678457, 0.16753992, -0.11525738) * inp_2_0_1; + result5 += M4(-0.028089492, 0.08591536, 0.039103355, -0.0011989027, -0.033978198, 0.067759655, 0.0030280973, 0.06262906, 0.1330275, -0.11050622, -0.018213795, -0.06664296, 0.09275364, -0.14832732, 0.060728148, -0.045669857) * inp_2_1_1; + result5 += M4(0.0054600644, 0.2107651, 0.02991181, 0.007781589, -0.039414156, -0.08060699, -0.04085221, -0.0261821, 0.08123445, 0.16569555, 0.03717093, -0.03405933, 0.011837371, -0.15332748, 0.0045701964, 0.020739155) * inp_2_2_1; + result5 += M4(-0.048538465, 0.12959155, -0.02496248, -0.124020666, -0.0075986707, -0.01746584, 0.036758613, 0.1080295, 0.02932849, -0.07417961, -0.044769544, 0.07281821, 0.06306576, -0.032910217, 0.01845823, 0.00016905635) * inp_2_0_2; + result5 += M4(-0.0060093035, -0.04267317, 0.03150853, 0.18961181, -0.041447956, 0.19851932, -0.0159659, -0.08628438, -0.23440832, -0.07044305, 0.02353935, 0.14871973, -0.005455909, -0.049727786, 0.0042388714, -0.12666693) * inp_2_1_2; + result5 += M4(0.047896713, 0.03794731, 0.014777414, -0.112578444, 0.04885318, -0.041999713, -0.004987667, 0.047805145, -0.082744926, 0.044025544, 0.041299365, 0.32537654, -0.020033896, 0.016646098, 0.03738507, -0.008161087) * inp_2_2_2; + result6 += M4(-0.21378931, 0.025034526, -0.054272383, -0.019605987, -0.21245867, 0.1425532, -0.06789373, 0.06773302, 0.30062482, -0.4553844, 0.28158724, 0.11054188, -0.16239841, 0.055942602, -0.19231087, 0.03758331) * inp_2_0_0; + result6 += M4(-0.101065405, -0.23890175, -0.107009605, -0.02441922, -0.027624216, -0.10614663, 0.0009074589, 0.037790842, 0.08398399, -0.22567214, 0.19783333, 0.19830455, -0.06674321, 0.12420932, 0.013650824, -0.01383124) * inp_2_1_0; + result6 += M4(-0.06046827, 0.073138736, 0.053774636, 
-0.04245042, -0.019614398, -0.12021351, 0.0640192, -0.012950124, -0.014771404, -0.0427789, 0.13314049, 0.087598614, -0.040899213, -0.178054, 0.007863442, 0.02005637) * inp_2_2_0; + result6 += M4(-0.08274766, -0.29248264, 0.06568095, 0.056109387, 0.06571921, -0.06501575, 0.009707104, 0.03690564, 0.06955326, -0.49741158, 0.3535879, 0.22558925, -0.17582366, 0.2541142, -0.040331922, -0.0079253325) * inp_2_0_1; + result6 += M4(0.02198145, 0.069614016, -0.19633263, -0.059362266, 0.141866, 0.19931817, -0.33870012, -0.06054324, -0.5628778, -0.29990846, -0.7620501, 0.18394424, -0.32113722, 0.25916022, 0.43595913, 0.0062956167) * inp_2_1_1; + result6 += M4(-0.061240643, 0.16374242, 0.16411644, 0.03160084, -0.20708153, 0.2418872, 0.09821428, -0.051060483, -0.31409428, -0.38504866, 0.28581563, 0.039346352, 0.13049528, -0.19173239, -0.08671701, -0.015251079) * inp_2_2_1; + result6 += M4(-0.0058384403, -0.018982723, 0.011247627, 0.023360295, -0.11788587, -0.05886444, 0.060266808, -0.016258547, 0.032792643, 0.13078995, 0.16720574, 0.1021891, -0.012916022, 0.12341831, -0.017956322, 0.0076645515) * inp_2_0_2; + result6 += M4(-0.08174487, -0.07655943, -0.069761775, -0.03984005, -0.18635997, -0.0769797, 0.058497705, -0.012397948, -0.26593667, -0.35763168, 0.3053035, 0.16697241, 0.025686216, -0.04025118, -0.05504943, -0.011258202) * inp_2_1_2; + result6 += M4(0.13846257, -0.020727726, 0.07195738, 0.07012813, 0.037056886, 0.084274344, 0.032341506, -0.03719822, -0.17256403, -0.07522735, 0.29564136, 0.10684864, 0.023120116, -0.10850621, 0.05907603, 0.0064585027) * inp_2_2_2; + result7 += M4(0.045512248, -0.14047314, -0.035316534, -0.021711236, -0.036649406, 0.024272496, -0.016466994, -0.02366704, -0.18736261, 0.16358788, 0.07416578, 0.029167552, 0.025188375, 0.05859252, 0.015015997, -0.028118413) * inp_2_0_0; + result7 += M4(0.20272353, 0.017243473, 0.085268095, 0.08761214, 0.09177632, 0.09122613, 0.003279683, 0.09298329, -0.05158523, 0.32321978, -0.019729676, 0.15123686, -0.030318592, 
-0.066809036, -0.028933106, 0.027836226) * inp_2_1_0; + result7 += M4(0.038886297, -0.075095125, 0.042839754, 0.111518875, -0.068027765, 0.05661839, -0.024160957, -0.048064195, 0.016453968, 0.30065125, 0.07987168, 0.120915346, 0.061439663, 0.025587967, 0.0131863, 0.20637646) * inp_2_2_0; + result7 += M4(0.006688766, 0.060313687, 0.0837338, 0.15295516, 0.13921517, -0.079802856, -0.01659336, 0.06276737, -0.07732095, 0.048029214, 0.0381174, 0.036477562, -0.20164026, -0.05498727, -0.10001294, -0.23249875) * inp_2_0_1; + result7 += M4(0.051556252, -0.05396095, 0.040760484, 0.09800702, 0.02520163, -0.11875378, -0.01601254, -0.06958395, 0.30008873, 0.35510468, -0.105978206, 0.07572828, 0.31786868, -0.019430265, -0.013444821, -0.41228822) * inp_2_1_1; + result7 += M4(-0.08480888, -0.013091551, 0.057829924, -0.1287473, 0.13693194, 0.0879522, 0.006954083, 0.12910074, -0.04565487, 0.3312227, 0.010747744, 0.30918542, 0.010689856, -0.0077504627, 0.062206283, 0.082858674) * inp_2_2_1; + result7 += M4(0.11036713, -0.12419677, -0.016698154, -0.044147998, 0.005315988, -0.0006600803, -0.01754046, 0.16190018, -0.0629583, 0.034030754, 0.05002628, 0.048739817, 0.07426313, 0.05956884, 0.011966195, -0.017436745) * inp_2_0_2; + result7 += M4(-0.042909056, 0.054021057, 0.029829059, -0.019860597, 0.0011133277, -0.0040212767, 0.015729701, 0.11518584, 0.0102282455, -0.055085283, -0.0012885286, 0.059330195, 0.043187365, 0.0011614253, 0.0035695732, -0.117765844) * inp_2_1_2; + result7 += M4(-0.053579032, -0.14519134, -0.0009934311, 0.30362862, -0.054370902, 0.022161335, 0.048316855, -0.26521692, -0.09139777, 0.024469515, 0.019602634, 0.16453758, 0.0048577576, 0.032204863, 0.007978113, 0.06834206) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = 
inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.024283165, 0.0497675, 0.04209054, 0.092265576, 0.088880785, -0.046750903, -0.045728102, -0.17453833, 0.29950008, 0.0146090435, -0.0011412527, -0.14314497, -0.23439139, 0.015760273, -0.16294831, 0.30919287) * inp_3_0_0; + result0 += M4(0.061753, -0.033532623, 0.03762749, 0.19825752, 0.18266286, -0.01920836, -0.035078272, -0.32341257, 0.10836479, -0.039737623, 0.0729989, 0.19063786, 0.32724187, -0.0011040698, 0.058104776, -0.08130756) * inp_3_1_0; + result0 += M4(-0.21395864, -0.026054421, -0.038373783, 0.13997832, -0.36665928, -0.029073277, -0.033403404, 0.04015593, -0.21957956, -0.028362159, -0.1450803, -0.13167295, -0.3943738, -0.002117162, 6.80439e-05, 0.18164949) * inp_3_2_0; + result0 += M4(-0.1434857, -0.08827172, -0.027521979, 0.23548244, -0.3949513, -0.015710838, 0.058741063, 0.064829126, 0.465586, 0.026308114, 0.040384986, -0.2314333, 0.107608266, -0.02262083, -0.015638571, 0.06151825) * inp_3_0_1; + result0 += M4(-0.26365027, -0.053397793, -0.04360752, 0.19367543, 0.13468939, -0.08598628, 0.12173429, 0.27593765, 0.11159633, -0.04606838, 0.18434636, -0.15351029, -0.31877097, -0.08277191, 0.13640311, 0.43145153) * inp_3_1_1; + result0 += M4(-0.29464522, -0.016439011, -0.0007571344, -0.0901558, -0.16341409, -0.017229151, 0.06966537, 0.03856679, 0.025108457, -0.012485797, -0.039611492, -0.08781126, 0.0012011288, -0.023230432, -0.084057346, -0.08234134) * inp_3_2_1; + result0 += M4(-0.028691113, -0.024441332, 0.022529928, -0.036946177, 0.21718341, -0.018645508, -0.003931241, 0.07723482, -0.1957138, 0.0037524952, 0.057339102, -0.01670828, 0.42378765, 0.036199115, -0.12905419, -0.08846306) * inp_3_0_2; + result0 += M4(-0.22478113, -0.02726013, -0.0001153188, 
-0.15506884, 0.2507988, 0.008661592, -0.002995308, -0.06615709, 0.012039729, -6.456574e-05, -0.05536171, 0.11630848, -0.3596208, -0.018060783, 0.045303576, -0.122143075) * inp_3_1_2; + result0 += M4(0.2922931, -0.0013313533, 0.021835366, -0.02792814, 0.067805834, -0.016357137, -0.008075278, 0.07338922, -0.28518853, -0.02674647, -0.045892086, -0.11064384, 0.1366556, 0.001744449, -0.062589146, -0.029331636) * inp_3_2_2; + result1 += M4(0.03306756, 0.08148378, 0.070178896, 0.052487683, 0.07591529, -0.090010285, 0.007501459, 0.056432553, -0.06423492, 0.1266206, -0.021761503, -0.13821425, 0.02684785, -0.17751159, 0.12499386, -0.057041626) * inp_3_0_0; + result1 += M4(-0.06305808, -0.003029339, -0.19723316, -0.024612572, 0.11675237, 0.13206732, -0.03728425, -0.27787682, -0.13386591, -0.074129164, -0.09049858, 0.070392884, 0.14579253, 0.046249837, 0.072523214, -0.046256673) * inp_3_1_0; + result1 += M4(-0.0063220146, 0.1374682, 0.015501421, -0.080531456, 0.044265956, 0.0005256883, -0.10039987, 0.010353571, 0.035639998, 0.034562804, -0.08557062, -0.067820825, -0.02594958, -0.06751282, -0.06054404, 0.023464454) * inp_3_2_0; + result1 += M4(-0.085628495, 0.026122717, -0.06251034, -0.07813039, 0.064764075, -0.061093684, -0.07498958, -0.012146885, -0.17425966, -0.13078488, 0.06621085, -0.23579246, 0.04649797, 0.15963934, -0.11426605, -0.05393359) * inp_3_0_1; + result1 += M4(0.03467501, 0.16204786, 0.24464224, -0.12930612, -0.02998436, -0.12982363, 0.25033334, -0.073294155, -0.076955386, -0.14043267, 0.042640664, -0.098987386, 0.36499172, -0.07694139, -0.3014398, -0.2403275) * inp_3_1_1; + result1 += M4(0.081303716, 0.0056330943, -0.18961811, -0.12822051, -0.018000025, -0.011524642, -0.0653646, 0.092894234, -0.16605528, 0.10648042, 0.04756378, 0.08239565, 0.10655016, 0.17190112, -0.07503134, 0.154786) * inp_3_2_1; + result1 += M4(0.07877548, -0.08406755, -0.12263102, -0.09839205, -0.075989164, 0.016300429, 0.075301066, -0.06671542, -0.013989192, 0.07865056, -0.02705995, 
-0.024814703, -0.23029742, 0.13086364, 0.09879467, -0.024085043) * inp_3_0_2; + result1 += M4(-0.04949895, -0.09944479, -0.035490494, -0.1424056, -0.0015483812, -0.26415774, 0.11374783, 0.036845163, -0.049487595, 0.17304853, 0.04286757, -0.041421346, -0.096647084, -0.039364494, -0.07092455, 0.0992368) * inp_3_1_2; + result1 += M4(-0.0024822522, 0.12610573, -0.17481326, -0.2254312, -0.04052593, 0.033977542, 0.0023851853, -0.01991922, -0.09567233, -0.23604324, -0.06909622, 0.021230001, -0.17774828, -0.04969453, -0.049829256, -0.019926505) * inp_3_2_2; + result2 += M4(0.0062232227, 0.094732285, 0.015565098, 0.04789409, 0.026134744, -0.008908634, -0.041622743, 0.022860143, -0.08880754, -0.19595368, 0.05804228, 0.011920187, -0.024099331, -0.18070142, 0.25316343, -0.060002785) * inp_3_0_0; + result2 += M4(0.005514768, -0.062968925, 0.073958896, -0.04179116, 0.039438695, -0.21735449, 0.12938812, -0.0050266474, 0.011303574, 0.23483977, 0.039844885, -0.05560983, 0.063854314, -0.060952738, -0.1393973, -0.37114406) * inp_3_1_0; + result2 += M4(-0.08650923, -0.022224752, 0.046040937, -0.03707218, -0.057128944, -0.04894333, 0.028075451, 0.029029025, -0.008812495, 0.052698623, -0.023792142, 0.053784177, -0.034399096, -0.07688924, 0.089087985, -0.028468607) * inp_3_2_0; + result2 += M4(-0.09355074, 0.046843387, 0.087332726, -0.0765222, 0.0110076, 0.17207216, -0.039755315, 0.02719246, 0.04381996, 0.20847405, 0.10894148, -0.022410456, -0.1150142, -0.036474664, 0.17182417, -0.07701843) * inp_3_0_1; + result2 += M4(-0.06772556, 0.08335604, 0.123895146, -0.07623608, 0.13438194, -0.23226596, 0.110187896, 0.16492964, 0.095936894, -0.14422974, 0.15958638, 0.03922633, 0.05117355, -0.36853608, 0.263776, 0.010799132) * inp_3_1_1; + result2 += M4(0.050241955, -0.048252743, -0.12763028, 0.06064551, -0.014493719, 0.0017694595, -0.015567814, 0.011761102, -0.063168906, -0.23498815, -0.024338067, 0.123438045, -0.118218645, -0.078737825, 0.020180874, 0.057110343) * inp_3_2_1; + result2 += 
M4(0.04900988, 0.08846855, 0.0063234842, -0.02012749, -0.054708242, 0.06490428, 0.09369349, 0.005039888, -0.177668, 0.01925192, 0.031191912, -0.060283747, -0.0040654177, 0.054145835, 0.051896956, -0.08723232) * inp_3_0_2; + result2 += M4(-0.096907, -0.021857888, 0.031266436, 0.1563737, 0.023062097, 0.13897826, 0.0296652, 0.014089084, 0.08765817, -0.05589916, 0.08080417, -0.08152843, -0.012584313, 0.11186676, 0.048213404, 0.015569989) * inp_3_1_2; + result2 += M4(-0.004038501, 0.16766591, -0.06617166, 0.10924829, -0.0071942075, -0.047832843, -0.008327084, 0.13958019, -0.08314241, 0.012938414, -0.07989016, 0.027157735, -0.14717053, 0.013168049, 0.056328453, -0.018062972) * inp_3_2_2; + result3 += M4(-0.11588345, -0.048860267, 0.04026564, 0.17827415, 0.0998871, -0.012426343, -0.009579661, 0.1319731, -0.091814525, -0.103054315, 0.20802924, 0.11932583, -0.120917186, 0.122815885, -0.05694828, -0.13992405) * inp_3_0_0; + result3 += M4(0.014388141, -0.07566682, -0.08008407, -0.13993433, 0.23215155, 0.0134389885, -0.026175631, -0.008143313, 0.034986496, -0.10352601, -0.0503453, -0.01887341, -0.08861837, -0.003583383, -0.06424219, -0.22196539) * inp_3_1_0; + result3 += M4(0.09338533, 0.028920205, 0.09371106, -0.07352844, 0.15835868, -0.02322297, 0.0988949, -0.030822724, 0.0024296145, -0.087591305, 0.22056332, 0.14175497, 0.14240375, -0.12589665, -0.0123874, 0.026726576) * inp_3_2_0; + result3 += M4(0.101009525, 0.049909282, -0.04649289, -0.09258099, 0.06756247, 0.12446199, 0.10324761, 0.035537526, -0.17805111, -0.11862091, 0.16292283, 0.032120794, -0.43927768, -0.16580313, -0.13630247, 0.116159216) * inp_3_0_1; + result3 += M4(-0.11253715, 0.035468232, -0.006094205, -0.00010499996, -0.03449603, 0.18416508, -0.22004342, 0.46060896, -0.3149324, -0.161782, -0.012070646, 0.0034640853, -0.07505667, -0.22911847, 0.029920409, 0.27075434) * inp_3_1_1; + result3 += M4(-0.045219302, -0.10022268, 0.28776914, -0.050829034, -0.1324678, 0.033043787, 0.04906001, 0.058482345, 0.17684563, 
-0.41000494, 0.39598793, 0.010794503, 0.061513547, -0.09219405, 0.11772378, 0.043420322) * inp_3_2_1; + result3 += M4(-0.05644918, 0.046518896, 0.05667718, -0.061204486, 0.20956382, 0.06949218, 0.045475535, -0.0062713427, -0.112300575, 0.06525255, 0.044088792, -0.05253521, -0.14794695, 0.00177525, 0.025166538, 0.01934682) * inp_3_0_2; + result3 += M4(-0.09059353, -0.32730135, 0.15618397, 0.08136938, 0.12091326, 0.050191343, -0.0126025975, -0.1528945, -0.1624242, -0.15662487, 0.005773003, 0.18454179, -0.07416858, -0.101768754, 0.060565114, -0.13774152) * inp_3_1_2; + result3 += M4(-0.14014047, 0.21495755, 0.1400506, -0.0013616432, 0.01401761, 0.10157003, 0.14277904, 0.06724122, 0.14065036, -0.16474451, 0.056039203, -0.09650645, 0.0794867, 0.090995364, 0.017693464, 0.045717765) * inp_3_2_2; + result4 += M4(-0.08290411, 0.07583921, -0.04734093, -0.12625407, -0.0842713, 0.027178466, 0.004364405, 0.006723222, 0.048661474, 0.09233898, 0.12611432, 0.31598994, 0.12500937, -0.07337151, -0.05784687, -0.06958127) * inp_3_0_0; + result4 += M4(0.057006232, -0.06276555, 0.13384582, -0.054232262, 0.031532332, -0.041165788, 0.08581619, 0.02009011, 0.029177727, 0.037220247, 0.027474059, 0.21850125, 0.12020816, -0.05292536, 0.0070272335, -0.066589676) * inp_3_1_0; + result4 += M4(-0.09705502, -0.007289397, 0.09680575, 0.11166659, 0.0034842931, -0.0844569, 0.114105746, 0.28044242, -0.20696156, -0.03241134, -0.010843034, 0.23451081, 0.09897717, -0.055849615, -0.030103019, -0.003095836) * inp_3_2_0; + result4 += M4(0.029930903, 0.008243335, 0.12038666, -0.14418308, -0.0015808095, -0.05616462, 0.01209605, 0.053444922, -0.10969763, 0.0577243, 0.20015837, 0.41953164, 0.12984945, 0.08349547, 0.050895657, 0.26564953) * inp_3_0_1; + result4 += M4(-0.06064571, 0.060401887, -0.036347233, 0.06238602, -0.14779256, 0.049735166, -0.102892995, 0.07332941, -0.013753356, -0.114176646, -0.10219833, 0.10913866, -0.09358662, -0.3322366, -0.07978764, -0.30454326) * inp_3_1_1; + result4 += 
M4(-0.036417656, -0.074414335, -0.05450449, 0.090627216, 0.007347477, 0.016971903, 0.00850598, 0.15366736, -0.101376526, -0.033855323, 0.1703145, 0.017130794, -0.01863804, -0.014399785, 0.015363004, -0.35543576) * inp_3_2_1; + result4 += M4(0.08879393, -0.046444066, 0.15485217, -0.02280739, -0.0014371987, 0.005564266, 0.07250395, 0.12936455, -0.111821726, -0.011816954, 0.035920687, 0.08683232, 0.004791557, 0.008852828, 0.0027795548, -0.31812134) * inp_3_0_2; + result4 += M4(-0.05225231, -0.16132718, 0.029878085, 0.13999972, 0.11916739, -0.0927804, 0.028337408, 0.051797315, 0.004983357, -0.017986676, -0.0845371, 0.061577987, 0.03583781, -0.077512816, -0.048737008, -0.2468147) * inp_3_1_2; + result4 += M4(-0.15567273, 0.016630119, -0.1259014, 0.17257217, 0.042694878, -0.06027838, -0.019028008, 0.011012398, -0.024295779, -0.06981502, 0.064501025, 0.29617837, 0.024673456, 0.007618219, 0.027032338, 0.43974623) * inp_3_2_2; + result5 += M4(-0.044054244, -0.22991493, 0.028760482, 0.11415289, -0.03990307, -0.014809855, 0.01915687, -0.08390316, 0.022934312, 0.07109665, -0.019307228, 0.079597086, 0.022698887, -0.06078006, -0.030629935, -0.03551745) * inp_3_0_0; + result5 += M4(0.057413004, -0.12888329, -0.01309833, 0.10970439, 0.08519955, -0.10797157, -0.09017191, -0.09058301, -0.021061527, 0.12536007, 0.0009481246, 0.013948104, 0.23868974, -0.25675, 0.0360314, 0.09580469) * inp_3_1_0; + result5 += M4(0.13406447, -0.23385373, -0.013457494, 0.06326356, 0.09611541, 0.23785551, -0.018960256, 0.038806852, -0.031713154, 0.16223979, 0.027510801, 0.10484777, 0.038933262, 0.1478121, 0.012894038, 0.1713614) * inp_3_2_0; + result5 += M4(0.05781802, -0.25729373, -0.024763575, 0.103165254, 0.013313597, 0.19201177, -0.04671426, -0.037270553, -0.11421036, 0.14077225, -0.03230022, 0.16660379, -0.0109087275, 0.10391722, 0.012093664, -0.067868076) * inp_3_0_1; + result5 += M4(0.07763934, -0.14978814, -0.03393292, 0.41640243, -0.08365926, -0.11057797, 0.0645677, 0.022094479, 0.0071299206, 
0.2865454, 0.06872672, 0.17326848, 0.15701757, -0.19093269, 0.04973328, -0.008444333) * inp_3_1_1; + result5 += M4(-0.007034914, -0.03130845, 0.015889382, 0.20091657, 0.038499758, -0.01991946, -0.025980828, 0.036220644, -0.046328038, 0.20740509, 0.022268564, 0.10047856, 0.025131112, -0.07421299, -0.0066541648, 0.027847596) * inp_3_2_1; + result5 += M4(-0.05832757, -0.22972517, -0.08122026, 0.09228985, 0.038165085, 0.023070628, -0.023780597, 0.0122694, -0.03132796, 0.10273563, 0.022454556, 0.15121804, -0.037277255, -0.15060231, -0.025135025, 0.034539178) * inp_3_0_2; + result5 += M4(-0.10743921, -0.038944654, -0.016727895, 0.33521724, -0.040666234, 0.10731634, -0.08402313, -0.033649124, 0.010878088, 0.16072121, -0.0029569878, 0.009882774, -0.09027276, 0.080400966, 0.011087642, -0.07735867) * inp_3_1_2; + result5 += M4(0.09296584, -0.4422661, -0.008140259, 0.22512265, 0.07227426, 0.19396716, -0.010994545, 0.01596842, -0.017072415, -0.057259444, -0.025023792, -0.054752175, 0.01964511, 0.04410241, -0.017442709, 0.026149442) * inp_3_2_2; + result6 += M4(-0.14465208, 0.052414786, -0.10324293, 0.043296814, -0.0065701497, 0.284348, 0.088501304, 0.02364426, -0.018061107, -0.27728018, 0.06673837, -0.043344155, -0.055777367, 0.095413126, -0.084193215, -0.019277465) * inp_3_0_0; + result6 += M4(-0.03289761, 0.060269997, -0.037370358, 0.03455, 0.23031938, -0.0960787, 0.16084133, -0.015020456, -0.036135703, 0.0015686582, -0.024946745, 0.0014197099, 0.017655753, 0.0874854, -0.027340759, 0.09841798) * inp_3_1_0; + result6 += M4(-0.1289917, -0.098799415, -0.14170569, 0.0020071268, -0.0690942, 0.050342314, 0.040754493, -0.011776017, -0.105071805, 0.040584493, -0.06626002, -0.035702202, -0.16230677, -0.07215765, 0.022972744, -0.06026864) * inp_3_2_0; + result6 += M4(0.037230387, -0.043833714, 0.09105837, -0.014592812, 0.12744612, 0.32406375, 0.13302492, 0.01414794, 0.011576483, -0.5599568, 0.022151038, 0.024990482, 0.014135616, 0.20804837, -0.033429373, 0.04993635) * inp_3_0_1; + 
result6 += M4(-0.2591266, -0.1823409, -0.071213484, -0.010348561, -0.012311407, 0.10029026, -0.3059883, 0.16752581, -0.13978365, -0.2672502, -0.22415243, 0.049176916, -0.12087738, 0.14781684, -0.12381877, -0.0030827867) * inp_3_1_1; + result6 += M4(-0.022580065, -0.058024984, 0.091736086, -0.02749568, 0.016032806, -0.032259338, -0.014710801, -0.031026777, -0.23686303, 0.13892634, 0.2228778, -0.017671678, -0.024856837, 0.18229605, 0.16825965, -0.06214024) * inp_3_2_1; + result6 += M4(-0.08364155, -0.02936373, 0.09070326, 0.03580639, -0.0351979, 0.18541162, 0.0020878087, -0.008411181, -0.036377754, 0.08249375, -0.07135602, -0.0076352847, -0.15029375, 0.24912156, 0.10706906, -0.0847039) * inp_3_0_2; + result6 += M4(-0.18271367, -0.13727036, 0.10006786, -0.039201215, -0.2927287, -0.21505424, 0.19938983, 0.011092712, 0.12819457, 0.12716632, -0.09388147, -0.020313218, -0.09050144, -0.11972295, 0.15428178, -0.0041933535) * inp_3_1_2; + result6 += M4(0.12788516, -0.03425613, -0.050770186, -0.015303022, 0.034824573, -0.0037806693, -0.029709935, -0.073458716, -0.034717567, -0.035268117, 0.03545894, 0.0040188264, 0.016481591, -0.008730628, 0.034666605, -0.05890681) * inp_3_2_2; + result7 += M4(-0.055325568, -0.07653447, 0.0064974306, -0.036004025, -0.050747108, -0.049278356, -0.0015913406, -0.0295292, 0.05677361, 0.11795071, 0.007659743, 0.14516187, 0.063124515, -0.02677223, 0.059773576, 0.07873373) * inp_3_0_0; + result7 += M4(-0.018679123, -0.06523358, 0.014471994, -0.034016907, -0.11572341, 0.19372271, 0.02323371, -0.025854953, 0.07890665, -0.003981726, -0.0016486332, 0.0019313947, 0.046618175, -0.45814046, -0.025193462, -0.15063004) * inp_3_1_0; + result7 += M4(-0.031975295, 0.042037755, 0.018787742, -0.035285443, 0.011452343, 0.07545121, -0.016744, 0.045516856, -0.03898138, 0.006110149, 0.00040688645, 0.2023965, -0.029057851, 0.113781966, -0.0040228264, -0.05689903) * inp_3_2_0; + result7 += M4(-0.10792631, -0.0074666715, 0.009675205, -0.045531865, -0.15179047, 
-0.009790886, -0.025036544, -0.047867645, 0.26350698, -0.14740969, -0.0101214005, 0.3249405, 0.082714014, 0.016668236, 0.013723304, -0.018905688) * inp_3_0_1; + result7 += M4(0.055604637, 0.14202286, -0.093780614, -0.047645394, 0.012365282, 0.15699707, 0.0076153325, 0.016230915, 0.024937283, 0.02176795, -0.08995523, 0.2716097, 0.26775718, 0.18402198, -0.046548117, -0.015260937) * inp_3_1_1; + result7 += M4(0.068360254, -0.0986738, -0.045730673, 0.18361628, -0.04210607, -0.04912704, -0.06883431, -0.287089, 0.13788974, 0.11286571, -0.06858426, 0.34948456, 0.0033379109, -0.037565716, -0.052660394, -0.06377529) * inp_3_2_1; + result7 += M4(0.077899106, -0.04598531, 0.015534113, -0.00073033787, -0.026151834, 0.00032459627, -0.0029609238, -0.013592551, 0.05483648, 0.05432821, -0.017464997, 0.09295904, -0.008487986, 0.09710061, 0.015405445, 0.049106844) * inp_3_0_2; + result7 += M4(-0.0056601516, 0.025121285, -0.061511125, 0.042798955, -0.02476289, -0.064376734, 0.00019398564, -0.14655946, 0.09633312, -0.0421261, 0.034395702, 0.18609671, 0.16801009, 0.019355727, -0.03428645, 0.0912915) * inp_3_1_2; + result7 += M4(-0.05483083, -0.115898006, -0.02791033, 0.29514515, -0.06980501, -0.011925553, -0.042923976, 0.0023969517, 0.03060759, 0.03044715, -0.014774592, 0.12648693, -0.0123675605, 0.03650439, 0.016308002, 0.06412725) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.18671563, 0.011007786, -0.019565666, -0.16721845, 0.3396576, 
-0.0040437514, 0.029993847, 0.10844761, -0.10774442, 0.01726972, 0.01727367, -0.24374896, 0.053115454, -0.059017625, 0.071100354, 0.01158527) * inp_4_0_0; + result0 += M4(0.16077441, 0.008739098, -0.0958093, -0.31102344, 0.360259, 0.022435881, 0.00294363, 0.29604894, -0.03139089, 0.06157452, 0.0039129914, -0.4264208, -0.10862725, -0.023980858, 0.036441203, 0.11493091) * inp_4_1_0; + result0 += M4(-0.1828809, -0.012715486, 0.008071946, 0.0034295933, 0.7968775, 0.034102093, -0.02228984, -0.08469485, -0.049122155, 0.012258304, -0.014740524, -0.038235273, -0.17386423, -0.006689065, 0.014004448, -0.0023374695) * inp_4_2_0; + result0 += M4(0.049398612, -0.019011958, 0.096648306, -0.06975673, -0.2859634, 0.002320488, 0.027722683, 0.08107191, 0.51173383, 0.03163909, -0.074041896, -0.092033714, 0.17895018, 0.006966968, -0.0079196915, -0.01761527) * inp_4_0_1; + result0 += M4(-0.14754301, 0.14123687, -0.023562888, -0.123279326, 0.1995399, 0.021962682, -0.017955476, 0.08554631, -0.22334902, 0.05179767, -0.054125935, 0.042983744, -0.09859608, 0.029277636, 0.025738848, -0.29354262) * inp_4_1_1; + result0 += M4(0.2905504, -0.0055426797, 0.040520735, 0.006563564, -0.06513221, -0.0014715588, 0.037878856, -0.05056981, 0.4913108, 0.040443465, -0.043129094, 0.097800545, 0.08404051, 0.04351597, 0.08522453, -0.02732656) * inp_4_2_1; + result0 += M4(0.080269516, -0.0311205, 0.079562254, 0.08109762, 0.57053447, -0.030450398, 0.04647022, -0.0718735, -0.16160007, 0.007957556, 0.07915407, -0.0581235, -0.39995733, -0.010502564, 0.034433004, 0.054193277) * inp_4_0_2; + result0 += M4(-0.15542449, -0.023501785, -0.010192405, 0.08507459, 0.1975596, 0.0037485538, -0.12301532, -0.028392443, -0.070247084, 0.032272387, -0.042492792, 0.16417025, -0.25550207, 0.01390695, -0.07521389, 0.04799159) * inp_4_1_2; + result0 += M4(0.08423475, -0.02638225, 0.04063541, 0.012670396, 0.0068036937, -0.025370894, 0.0004282429, 0.015731903, -0.011617622, -0.02155093, 0.024528667, 0.026475519, -0.23353197, 
0.0022783815, 0.07034933, -0.04010941) * inp_4_2_2; + result1 += M4(-0.07825759, -0.038268555, -0.14281398, 0.12364303, 0.031731438, -0.19155267, 0.1114541, 0.046652257, 0.12904848, 0.11521979, -0.09940924, -0.036593784, 0.010878354, 0.05868903, -0.18103519, 0.12952593) * inp_4_0_0; + result1 += M4(0.0868141, 0.23006985, 0.019333737, -0.15485746, 0.03593383, -0.047892574, 0.0980809, 0.16176724, 0.14827013, -0.0354172, 0.03207481, 0.036897894, -0.036856364, -0.12252235, -0.104194045, 0.0070654177) * inp_4_1_0; + result1 += M4(-0.031276423, 0.08201624, 0.15860677, -0.049821, -0.0132355755, -0.017923497, -0.0698732, -0.024869822, 0.08522283, -0.07772247, -0.082442336, 0.056966454, 0.037081074, -0.01685068, -0.12089761, 0.015036329) * inp_4_2_0; + result1 += M4(0.06920925, -0.14711545, -0.043020148, -0.27729544, 0.032940667, -0.12623659, -0.049926672, -0.08014844, -0.10112552, 0.05759975, 0.00666061, -0.06391868, 0.009890536, -0.006222198, -0.013850685, 0.058191296) * inp_4_0_1; + result1 += M4(-0.05096672, 0.09124099, 0.44005808, 0.29929984, 0.015805753, -0.062670395, 0.1964175, 0.16380383, -0.0716157, 0.20988245, 0.1529413, 0.06861653, 0.121379115, -0.33514094, -0.02916709, 0.04951275) * inp_4_1_1; + result1 += M4(0.016275372, -0.22383131, 0.003793926, -0.07776438, 0.015962467, -0.033935986, -0.03924903, -0.10662822, 0.02068318, -0.051470168, -0.049629997, 0.08728509, -0.017298343, -0.20376, -0.015252269, -0.050460514) * inp_4_2_1; + result1 += M4(0.024207205, 0.060881548, 0.028375672, -0.17706855, 0.06188294, 0.08860895, 0.010041935, 0.034763977, 0.015148256, -0.07430798, -0.08011852, 0.057848807, 0.008911355, -0.019565018, -0.16178733, -0.04136675) * inp_4_0_2; + result1 += M4(0.06454287, 0.10210875, -0.033464856, -0.07513092, 0.023692554, 0.08148411, 0.10072244, 0.056796115, -0.010498132, 0.016708005, 0.07634566, 0.016010612, 0.0049315076, 0.1741713, -0.06222367, -0.08142443) * inp_4_1_2; + result1 += M4(0.087150246, -0.05966943, 0.045536947, 0.117682226, 
-0.04751186, -0.10200599, 0.059109718, -0.019480744, 0.059142776, 0.015344558, -0.054946624, -0.073430985, -0.021776598, 0.061559692, -0.107282475, 0.03965959) * inp_4_2_2; + result2 += M4(0.0020025254, 0.022251166, 0.00020157064, -0.040389594, 0.03649809, 0.12783991, -0.1926349, 0.033586685, 0.04192445, 0.17252682, -0.033448916, 0.008182044, 0.0678849, -0.037545826, -0.12726957, 0.069658935) * inp_4_0_0; + result2 += M4(-0.08797048, -0.33720347, -0.06843994, -0.009388004, 0.007355689, 0.16356027, -0.14867967, 0.074103355, 0.034870073, 0.023578513, -0.031897698, 0.032564428, -0.107870474, -0.035462074, -0.26793018, 0.026975883) * inp_4_1_0; + result2 += M4(-0.043934062, 0.13283846, -0.017962202, -0.06690337, 0.041170668, -0.03378914, -0.0321454, -0.011846852, 0.009516877, -0.026580429, 0.0038966432, 0.052053582, 0.092849925, 0.045884762, -0.016070126, 0.042846553) * inp_4_2_0; + result2 += M4(0.11459171, 0.16836528, 0.0067692325, -0.079261854, -0.0998232, 0.14362013, 0.079440504, -0.01310343, -0.06368294, 0.037007377, -0.040556017, 0.04391934, 0.25572732, 0.022206828, -0.14677086, 0.0815601) * inp_4_0_1; + result2 += M4(-0.27271116, 0.049193546, 0.03336971, -0.008202585, -0.1564803, 0.05234511, 0.0049210233, 0.061044786, -0.19119234, 0.078088306, 0.14981882, -0.10732807, 0.422677, 0.052270968, -0.26214805, 0.087457865) * inp_4_1_1; + result2 += M4(-0.04687676, 0.015422423, -0.00086431607, -0.01271057, -0.011118379, 0.04597728, -0.053011242, -0.056572095, -0.055644285, 0.03096736, 0.02310477, -0.055334385, 0.18751022, -0.10813116, -0.08271084, 0.09245653) * inp_4_2_1; + result2 += M4(-0.086186506, 0.1830434, -0.11030644, -0.023001134, -0.0015605387, 0.05605546, 0.015870629, 0.07216331, -0.047273155, -0.008794701, -0.07601067, 0.056934644, 0.1943258, 0.10497332, -0.027516173, -0.0063392227) * inp_4_0_2; + result2 += M4(-0.10981476, -0.10139037, -0.10839621, 0.14178525, -0.049079288, 0.139396, -0.028117048, 0.013654328, -0.13395016, -0.08480129, 0.035256725, 
-0.017280353, 0.15663345, -0.15014705, -0.11252795, 0.03081507) * inp_4_1_2; + result2 += M4(-0.08621381, 0.033718638, -0.13189682, 0.15058693, -0.0071148723, -0.024167918, 0.04010849, -0.013371304, -0.06671668, 0.044749618, -0.010760944, -0.11224522, 0.09868325, -0.024926199, -0.08014657, -0.09766281) * inp_4_2_2; + result3 += M4(0.17560296, -0.065775886, -0.006459535, -0.08693382, 0.0053581237, 0.0005426898, -0.02508934, 0.10989717, 0.11865435, 0.05586065, 0.09484076, 0.11796001, 0.07598771, -0.088916354, -0.016355693, -0.03920977) * inp_4_0_0; + result3 += M4(0.26716024, 0.09332428, -0.035672527, -0.033889934, 0.10380577, -0.10792809, 0.032491803, 0.11598221, -0.16717017, 0.049164187, -0.00051478465, 0.1332475, 0.23637128, -0.15503877, 0.083327465, 0.025073275) * inp_4_1_0; + result3 += M4(-0.028856063, 0.02228463, -0.0022270556, -0.15169096, -0.41227904, -0.0053139855, -0.37183005, 0.049269505, -0.12184315, -0.04017246, -0.05167311, -0.031152649, 0.07082666, 0.037031624, 0.10764349, -0.026905924) * inp_4_2_0; + result3 += M4(-0.01049915, 0.11739014, 0.08397187, -0.07710815, 0.23864214, 0.043800138, 0.12961175, 0.027600035, 0.18636715, 0.04545033, 0.0034640585, 0.039043125, 0.06100653, -0.08165919, -0.014627799, 0.0049396595) * inp_4_0_1; + result3 += M4(-0.05829264, -0.10692941, -0.021784848, -0.06650629, -0.00804042, 0.049246345, -0.09714333, 0.16783571, 0.06641079, 0.2334157, 0.093779504, -0.11016423, -0.006515934, -0.05372289, 0.019857274, -0.18465406) * inp_4_1_1; + result3 += M4(-0.13213427, -0.027656022, 0.050408516, -0.037032105, -0.032862313, 0.08121426, -0.07104203, -0.092463195, -0.069118746, -0.025219934, -0.12793308, 0.023097545, 0.07132469, 0.17039154, 0.07423295, -0.0036142585) * inp_4_2_1; + result3 += M4(-0.04168379, 0.0033692447, 0.012247811, 0.09033096, 0.17067008, 0.09933842, 0.016770627, -0.007999331, 0.14856173, -0.06804571, 0.105862424, 0.07969015, 0.08403425, 0.02671861, 0.06085429, -0.023640487) * inp_4_0_2; + result3 += M4(-0.094923325, 
-0.19971143, -0.05059042, 0.053266875, 0.04858924, -0.15709706, 0.02546693, -0.13396575, -0.013702026, 0.17228442, 0.0046156617, 0.028252859, -0.09793701, -0.065703064, -0.115298204, 0.18663837) * inp_4_1_2; + result3 += M4(-0.09268958, 0.06416263, 0.07325169, 0.021971846, 0.06529956, 0.05037626, -0.0048930887, -0.13996537, 0.021141198, -0.1462973, -0.084567554, -0.01506454, 0.046998132, 0.0940624, -0.009522079, 0.05108342) * inp_4_2_2; + result4 += M4(0.069145024, -0.002882422, 0.14015664, -0.3613045, -0.03500846, 0.010326944, -0.17969237, 0.03879933, -0.10790703, 0.05544771, -0.16222806, 0.25108773, -0.102622315, -0.05397919, 0.11332763, 0.0912472) * inp_4_0_0; + result4 += M4(-0.11699772, -0.07309899, 0.11169658, 0.20529273, -0.12752043, -0.010938826, -0.087930165, -0.31073257, 0.12356881, -0.004743108, -0.10544772, 0.026410654, -0.034311354, -0.032509685, 0.12069683, -0.16127245) * inp_4_1_0; + result4 += M4(2.5769134e-05, -0.12754111, -0.013598903, 0.18318334, 0.037678923, 0.029320713, -0.1304927, -0.078414895, 0.042846095, 0.0010713389, -0.031247243, -0.22965492, -0.016956974, 0.006286483, 0.02243632, 0.07687705) * inp_4_2_0; + result4 += M4(-0.025986128, -0.08457622, 0.0944553, 0.21025968, 0.006382023, -0.10306406, 0.10097979, 0.23452103, -0.061959043, -0.0061988565, -0.17389442, -0.03595001, -0.18099315, 0.057607207, 0.08662925, -0.013712116) * inp_4_0_1; + result4 += M4(-0.052100703, -0.30572578, 0.14966764, 0.045666996, -0.24847466, 0.20545833, -0.023848133, -0.08467902, 0.1645116, 0.017262885, -0.0007100575, -0.07007358, 0.02723553, 0.15521146, 0.057702918, -0.17873062) * inp_4_1_1; + result4 += M4(-0.15634713, -0.12681459, -0.011408221, -0.032487165, -0.08068434, -0.0351298, 0.012920307, -0.0006185524, 0.09506192, -0.042032827, -0.007050135, -0.0031894052, 0.041373055, 0.04421661, 0.06818887, -0.0038908457) * inp_4_2_1; + result4 += M4(0.037681356, -0.029321436, -0.013248218, 0.089514375, -0.008286719, -0.009140873, 0.110401236, 0.004529786, 
-0.055987794, 0.009363701, -0.03484658, -0.01143862, -0.045685917, 0.071437545, 0.07896014, 0.23226053) * inp_4_0_2; + result4 += M4(-0.0583445, -0.08874884, 0.032947738, -0.06377378, 0.08441811, -0.12823875, 0.06867126, -0.18895656, 0.036097523, 0.0049911137, 0.017927792, -0.18964991, -0.15198527, 0.15733323, -0.038631085, 0.027422786) * inp_4_1_2; + result4 += M4(-0.045293506, -0.074421905, -0.07400106, -0.056590274, -0.023945067, -0.014327954, 0.041554324, 0.19357534, 0.010129685, -0.017104065, 0.04833267, 0.099298745, -0.0653345, 0.09198819, -0.025699483, -0.09877697) * inp_4_2_2; + result5 += M4(0.05126989, -0.11165201, -0.03949107, 0.012827274, -0.006800151, 0.09410788, 0.019508006, -0.107812144, -0.06189274, 0.052835558, 0.019383252, -0.014363576, -0.0042283707, -0.040233325, -0.030328318, 0.038988646) * inp_4_0_0; + result5 += M4(0.22562496, -0.0056842566, -0.03390179, -0.23338172, -0.21150047, 0.34632647, 0.006602348, -0.07612761, -0.18690059, -0.102153264, -0.032041606, 0.07698139, -0.10188392, -0.13299339, -0.032924596, -0.04988135) * inp_4_1_0; + result5 += M4(0.06044232, 0.064126134, -0.0237404, -0.029693652, -0.036573835, -0.25192642, 0.016799156, 0.020292873, -0.0040292405, 0.017333206, 0.025323324, 0.052257467, 0.04532647, -0.016759923, -0.005387829, -0.004145057) * inp_4_2_0; + result5 += M4(-0.03471845, 0.027523719, 0.019660402, 0.013593585, -0.01743864, 0.14991951, 0.025586575, -0.011178313, 0.028091853, -0.19830616, 0.022843217, 0.0051481067, -0.02228959, -0.24773867, -0.018356087, 0.12924021) * inp_4_0_1; + result5 += M4(0.09892557, -0.04075304, 0.0035159294, -0.10459814, -0.15160754, -0.0030324275, 0.016313735, 0.054924972, -0.051287953, -0.13989593, -0.02803562, -0.083574645, -0.07067514, -0.054376304, -0.04322344, -0.049143065) * inp_4_1_1; + result5 += M4(0.053454738, 0.12871616, 0.059428584, -0.00423104, 0.0081377905, -0.093068875, -0.03779241, 0.01766545, -0.019672636, 0.03187528, 0.012627105, -0.0010256567, -0.02833987, 0.020976631, 
-0.03236893, -0.10342855) * inp_4_2_1; + result5 += M4(-0.026647745, -0.037815906, -0.020683073, -0.05764755, 0.07456962, -0.22506273, -0.018697001, -0.059746843, -0.025869744, 0.0815025, 0.048052017, 0.0666039, 0.036375795, 0.019151406, 0.009605656, -0.006283438) * inp_4_0_2; + result5 += M4(0.032922212, -0.16051689, -0.028198011, -0.07303507, -0.074081145, 0.25798026, 0.027467784, 0.026003916, 0.060250074, -0.03564738, -0.07060636, -0.049254812, 0.012059596, -0.1604841, 0.024879508, 0.084039226) * inp_4_1_2; + result5 += M4(-0.03193242, 0.02572299, 0.048717547, 0.089661784, 0.022612734, 0.102245755, 0.00841563, 0.014134972, -0.0017746104, 0.05108323, 0.00070015993, 0.047171485, 0.010799258, -0.06220687, 0.017520819, 0.0025798979) * inp_4_2_2; + result6 += M4(0.105994225, -0.19868919, 0.011871991, 0.0076910174, -0.14289175, -0.02238566, -0.018845633, -0.02703022, 0.022486374, -0.056684755, 0.1003435, -0.039022073, -0.058879618, 0.06729891, 0.12517802, 0.003658135) * inp_4_0_0; + result6 += M4(0.14659826, 0.08146107, 0.06869505, 0.05703236, -0.028249646, 0.17645714, -0.21517038, 0.0076926774, 0.1773575, 0.19912657, 0.011452382, -0.07637672, -0.25087115, -0.105868444, -0.09984039, 0.00850327) * inp_4_1_0; + result6 += M4(0.012133553, -4.635346e-05, -0.044151314, 0.0471454, 0.08650078, 0.013975081, 0.03158762, -0.011354539, 0.0780001, 0.06690665, 0.08589582, -0.01869028, -0.01677636, -0.12475332, 0.024094861, -0.0044213566) * inp_4_2_0; + result6 += M4(0.07298494, -0.15864012, 0.20889348, -0.021786392, 0.11997609, -0.14258158, 0.13700382, -0.02590116, 0.005856892, -0.022935728, -0.011136262, -0.12636122, -0.026897948, 0.09783801, 0.01365595, 0.08559514) * inp_4_0_1; + result6 += M4(0.008573796, 0.36784512, -0.09835621, -0.037670255, -0.022125605, 0.012232725, 0.017062489, 0.0096913, 0.055019606, -0.025391987, -0.022888258, -0.049804796, -0.105870776, -0.20554258, 0.14477159, 0.12848486) * inp_4_1_1; + result6 += M4(-0.030278437, -0.1380488, 0.114217125, 0.075079, 
-0.047917333, 0.050868314, -0.19001642, 0.03261282, -0.0044744117, 0.09962044, -0.04763892, 0.018165126, 0.034206823, -0.11597154, 0.11092557, 0.03325106) * inp_4_2_1; + result6 += M4(0.04633899, 0.03912767, -0.09579782, 0.060845785, -0.029730491, -0.06978176, -0.13629054, 0.023090914, 0.08038462, -0.18146084, 0.071845144, -0.0055421204, 0.09605012, 0.0964328, 0.013261676, 0.04259341) * inp_4_0_2; + result6 += M4(0.066784844, -0.14903262, 0.024951074, 0.075918905, -0.17786124, -0.09201577, 0.24612312, -0.013250502, 0.03977437, 0.02722111, -0.0096855955, -0.049702514, 0.22972526, 0.08658453, -0.18677714, 0.00039259586) * inp_4_1_2; + result6 += M4(0.04781108, -0.068694636, -0.10319322, 0.020910783, -0.04294151, -0.047346912, -0.15175053, -0.00068040827, 0.0031489204, 0.02630967, -0.09309033, 0.040807083, 0.09417282, -0.1022639, -0.005895056, 0.0477383) * inp_4_2_2; + result7 += M4(0.049177706, -0.030941142, 0.0070032566, -0.08539875, 0.021399044, -0.029841773, -0.0073910006, -0.0038321654, 0.06277513, 0.039198477, -0.030060902, 0.027599119, -0.042601507, 0.10326694, -0.012771646, -0.03979841) * inp_4_0_0; + result7 += M4(-0.078266025, 0.046536334, 0.033601347, 0.009142793, -0.034472767, -0.23237887, -0.041013196, -0.017589966, -0.0101782745, -0.08564077, 0.04426092, 0.00503341, 0.11267203, 0.26962793, -0.051341593, -0.034072153) * inp_4_1_0; + result7 += M4(0.06208209, -0.18352069, -0.004219006, -0.037164498, 0.027144313, -0.049438242, 0.013342793, 0.103080325, 0.029959202, -0.01693596, -0.004267126, -0.04411009, 0.01046045, 0.15092407, -0.030891724, 0.25189477) * inp_4_2_0; + result7 += M4(-0.036467325, -0.045477964, -0.011840119, -0.015907153, 0.013154312, -0.008553453, 0.008570545, 0.029735109, 0.044728443, 0.081235975, -0.04847781, -0.00295823, -0.12288811, -0.0010027557, 0.0066455165, -0.068108626) * inp_4_0_1; + result7 += M4(0.16969146, -0.100116886, 0.008268357, 0.10946563, -0.10654125, 0.06998944, 0.029377474, -0.015355576, -0.16766389, -0.20505778, 
0.017986748, 0.033132747, 0.10764003, -0.02415494, 0.034058247, 0.07083134) * inp_4_1_1; + result7 += M4(0.054632343, -0.018059323, 0.008385867, 0.017824594, 0.05275564, -0.034722816, 0.013699103, 0.13630769, -0.006114431, -0.076319136, 0.05666484, -0.015281957, 0.067867644, 0.05887549, 0.026778, 0.021443866) * inp_4_2_1; + result7 += M4(0.009649359, -0.0076094316, 0.04627633, -0.123604715, -0.023757117, 0.007498384, 0.0037702848, 0.0042312513, 0.044805396, 0.05304793, -0.017555103, 0.11178705, 0.020255571, 0.01510768, -0.011929654, 0.016395317) * inp_4_0_2; + result7 += M4(0.060495935, -0.075412564, -0.011714262, -0.028777624, 0.036349464, 0.010554533, -0.017276483, 0.014811549, -0.040656872, 0.097686425, 0.06282261, -0.09207576, -0.04596563, 0.07891032, 0.020275546, -0.24185641) * inp_4_1_2; + result7 += M4(0.0663436, -0.08257041, -0.008731263, 0.34673077, -0.08118538, -0.0046493784, 0.010682317, -0.15008071, 0.101572864, 0.062296055, 0.034948315, -0.010925607, 0.0053622792, 0.07923177, 0.009801937, 0.18502559) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.07869333, -0.00035128652, 0.022898614, -0.012425706, -0.04523789, -0.00554883, 0.035654984, -0.09758672, 0.17274638, -0.00078226364, 0.11401323, 0.22211851, -0.20208736, -0.017870452, -0.06545396, 0.08890102) * inp_5_0_0; + result0 += M4(-0.32873765, 0.0016164917, 0.01716955, 0.24452612, 0.3071801, -0.0024067913, -0.034127872, -0.06382891, 0.060509503, -0.005660867, 
0.15617707, 0.29242027, -0.03558213, -0.024359392, 0.06148011, 0.12935658) * inp_5_1_0; + result0 += M4(0.26454037, 0.00089075457, 0.018350126, 0.07323487, 0.68328065, -0.0024056665, -0.04161967, -0.18188752, -0.07905459, -0.023154857, -0.0092441635, -0.04956989, -0.2314631, 0.0039305864, -0.022860853, -0.07631401) * inp_5_2_0; + result0 += M4(-0.0038970276, -0.014908787, 0.0684872, -0.12164261, -0.5654355, 0.008098003, 0.02807298, 0.07976401, -0.2742832, 0.06580561, 0.012161846, 0.23362854, 0.3323281, 0.00038569167, -0.059329838, -0.14608262) * inp_5_0_1; + result0 += M4(-0.318843, -0.05809332, -0.0905257, 0.13430594, 0.1763401, 0.13379827, -0.05285944, -0.25087997, -0.25691295, 0.09705721, -0.0086598, 0.16804737, 0.16234742, -0.018796036, -0.0146961305, 0.012803926) * inp_5_1_1; + result0 += M4(-0.3687057, 0.027534785, 0.089020625, 0.048740935, 0.33015457, 0.055929296, 0.0423266, -0.00042862532, -0.65630263, 0.044620927, -0.042774618, -0.064371966, -0.07599462, -0.012021491, 0.050905824, -0.008724924) * inp_5_2_1; + result0 += M4(-0.18874244, 0.013953216, -0.03258164, 0.075005144, 0.025068179, -0.01680127, 0.02372482, 0.05022162, 0.11775188, -0.0077294754, 0.025189329, 0.08765877, -0.19321209, 0.011285351, -0.03456609, -0.07313599) * inp_5_0_2; + result0 += M4(-0.48788357, -0.050879117, -0.021839213, -0.07366132, -0.21457158, 0.040539674, 0.05531499, 0.08236575, 0.31520548, -0.041763797, 0.056597754, -0.113837786, -0.151603, 0.015293674, -0.047634486, 0.103072695) * inp_5_1_2; + result0 += M4(-0.0777336, -0.008974059, 0.014881637, -0.083502695, -0.1704324, 0.038487818, 0.06559258, 0.12768595, 0.15679763, 0.013372798, -0.030217202, -0.037186217, 0.02880897, 0.0055609215, 0.007871192, -0.033056986) * inp_5_2_2; + result1 += M4(-0.12952425, 0.03721746, -0.035637632, 0.011933187, -0.036226973, -0.06437253, 0.13445026, 0.03394418, 0.1516447, 0.035568077, 0.24680257, -0.15145738, -0.016980328, -0.085753605, -0.17648911, -0.0068147765) * inp_5_0_0; + result1 += 
M4(-0.078856885, -0.07582558, 0.10946699, -0.029691309, 0.059291027, -0.17677361, 0.08992794, 0.04016863, -0.00038459155, -0.29349446, 0.13076018, 0.15964578, 0.03102614, 0.044825442, -0.042552024, -0.017371753) * inp_5_1_0; + result1 += M4(-0.043538082, 0.04203705, -0.0026763624, 0.02145284, -0.08864483, 0.034567166, -0.059803315, -0.021143297, -0.03709001, 0.09168868, 0.08747861, 0.08939103, -0.11063337, -0.10472133, -0.038399506, 0.059378058) * inp_5_2_0; + result1 += M4(0.026306508, -0.09015751, -0.05076055, 0.049613666, -0.050214484, -0.110159375, 0.18269265, -0.10263938, 0.0027290583, 0.10587823, 0.2078708, 0.18030132, -0.013006935, 0.026716385, -0.05439159, -0.016593486) * inp_5_0_1; + result1 += M4(-0.0018730204, -0.12725502, -0.095247835, -0.18146436, -0.027124807, 0.24049643, 0.20137446, 0.071600236, -0.064398095, 0.019145656, -0.30381453, -0.1900997, 0.06479129, -0.10385521, 0.0926918, 0.10271915) * inp_5_1_1; + result1 += M4(-0.12086527, 0.06267545, 0.049382135, -0.11529424, -0.112643935, -0.034091912, -0.035225626, -0.016406411, 0.118374266, 0.030822283, 0.1584464, 0.08448635, -0.034706075, -0.21329069, -0.064829126, 0.0451281) * inp_5_2_1; + result1 += M4(0.039971948, 0.04942478, 0.031031318, -0.08522106, 0.13778934, -0.090367086, -0.07451306, -0.15202044, 0.02120986, 0.06494965, 0.047448635, 0.043437555, -0.09407728, -0.054798916, -0.0114540905, 0.12336493) * inp_5_0_2; + result1 += M4(0.035171557, -0.037406277, 0.027900036, -0.08886569, 0.021939408, -0.07062506, 0.0062860283, -0.12200291, 0.0012390914, -0.09562543, 0.1194021, 0.09370839, 0.02484605, -0.051458817, -0.03631423, -0.013663657) * inp_5_1_2; + result1 += M4(0.030942678, -0.08716443, 0.03165094, 0.10127806, 0.016895788, 0.065503776, -0.04853291, -0.12899692, -0.028207228, -0.014250527, -0.034553766, 0.03330464, 0.0475289, 0.038898353, -0.062322, -0.044877715) * inp_5_2_2; + result2 += M4(0.021333138, 0.013268967, -0.015901806, -0.046588786, 0.0034785832, 0.0831568, 0.043451313, 
0.0009396029, -0.06399435, 0.054420426, 0.0063771103, -0.027554097, -0.034235477, -0.023794109, 0.0054998253, 0.0046750433) * inp_5_0_0; + result2 += M4(-0.048246786, 0.22831313, -0.014618013, 0.008491458, 0.06813362, 0.10156819, -0.019818539, 0.07891646, 0.123127885, 0.16703428, 0.0045574415, 0.0676125, 0.02016334, -0.18210115, 0.009630271, 0.029004991) * inp_5_1_0; + result2 += M4(-0.01673904, 0.04105361, -0.03589782, -0.0071025356, 0.085280895, -0.006099745, 0.0333405, 0.023406666, 0.002361316, -0.030961443, 0.0341426, -0.037059058, 0.030845396, 0.010022956, -0.036231074, -0.08843495) * inp_5_2_0; + result2 += M4(-0.0046882043, -0.04331871, 0.0053232284, 0.022607893, -0.057038147, -0.08441694, 0.100728266, -0.044547223, -0.21838132, -0.09227369, -0.1598035, 0.102324896, 0.10879561, -0.08552537, 0.12732802, -0.062754355) * inp_5_0_1; + result2 += M4(-0.19478069, 0.069152564, 0.059341524, -0.08595255, 0.16276842, 0.1780508, 0.10221329, -0.032430016, 0.035120975, 0.0007167226, 0.024983447, -0.014336769, -0.027756715, -0.17439899, -0.041124605, 0.12268519) * inp_5_1_1; + result2 += M4(0.03140482, -0.032615893, -0.07159878, 0.019304452, 0.074276455, 0.096589126, 0.03794335, -0.029392608, 0.0015624304, -0.1876843, 0.02035078, 0.12729327, 0.05165021, 0.029002959, -0.08181941, 0.013726391) * inp_5_2_1; + result2 += M4(0.057264715, -0.020870764, -0.014013703, -0.006178171, -0.14789797, 0.06832935, 0.0068656513, -0.016575057, -0.05024657, 0.1306498, -0.07247172, -0.00039102216, -0.030370452, -0.09067211, 0.10256602, 0.04603874) * inp_5_0_2; + result2 += M4(-0.04731265, -0.0450603, 0.00024730418, 0.018841753, 0.012970629, -0.07924305, -0.09827355, 0.032717872, 0.1290668, 0.059932217, -0.007988637, 0.003939825, 0.062332142, -0.05914839, 0.018148884, -0.01327255) * inp_5_1_2; + result2 += M4(0.107830815, 0.013075259, -0.11039031, 0.052275967, 0.027585676, -0.043224003, 0.09770686, -0.13639812, -0.028442947, 0.00020570598, 0.019433506, -0.027970882, 0.0061857193, 
-0.037253305, -0.018408528, 0.0474903) * inp_5_2_2; + result3 += M4(0.015677845, -0.00671084, 0.019166647, -0.033845436, 0.060717802, 0.06417002, 0.090390675, -0.004397716, -0.16850543, 0.06244075, -0.07570655, 0.022061221, 0.022521907, 0.011098941, -0.024522034, -0.038981784) * inp_5_0_0; + result3 += M4(-0.021185506, 0.08965549, 0.039249115, 0.07136724, -0.080724545, -0.013874093, 0.07638509, 0.072556265, -0.19393668, 0.1401979, 0.034555063, 0.14185809, 0.09639788, -0.10919841, 0.086399354, -0.15379573) * inp_5_1_0; + result3 += M4(-0.17099692, -0.08714954, -0.03801139, -0.065560766, -0.09060775, 0.05145639, -0.09605068, 0.06911095, 0.07026578, 0.09323299, 0.05844946, 0.050781656, 0.085839376, 0.117615536, 0.102985196, -0.05098219) * inp_5_2_0; + result3 += M4(-0.002876606, -0.02218488, 0.060924545, -0.18816549, 0.1337594, -0.075137, 0.039093472, -0.003535261, 0.04947663, -0.080551505, -0.18947463, 0.13170737, -0.29970402, -0.0010217266, -0.08042049, 0.05852891) * inp_5_0_1; + result3 += M4(0.11629283, -0.052787248, 0.08910508, 0.011113786, 0.055172123, 0.060877237, 0.18369572, -0.12718171, -0.12961869, 0.2022103, -0.28783035, 0.11361625, 0.121732086, -0.19074959, -0.006026067, -0.074463435) * inp_5_1_1; + result3 += M4(0.07337377, 0.16794255, 0.13359612, 0.04595141, -0.24953586, 0.05813992, -0.17401415, 0.07559845, 0.094264, -0.1356181, 0.05777148, 0.027211571, 0.04444463, -0.009073971, 0.055189658, -0.037160527) * inp_5_2_1; + result3 += M4(-0.25800025, -0.12835032, -0.060990572, 0.08991051, 0.107343994, -0.01543463, 0.07718182, -0.028928423, 0.017609239, 0.020304795, 0.013512198, -0.06750834, -0.11718272, -0.048897132, -0.0774759, -0.013367303) * inp_5_0_2; + result3 += M4(-0.13356136, 0.22312234, 0.047576934, -0.011558663, 0.15920341, 0.021484494, 0.11451094, 0.11846407, 0.0022281893, 0.015195137, -0.066550754, -0.11097011, -0.14604366, 0.07637948, -0.020782305, 0.09131394) * inp_5_1_2; + result3 += M4(-0.040715873, 0.08183543, 0.14434236, -0.017248407, 
-0.055361044, 0.16718467, -0.15207382, 0.057854794, 0.0938, -0.14241678, 0.0013146093, -0.014982696, -0.029765692, -0.062207278, 0.060647294, 0.061205126) * inp_5_2_2; + result4 += M4(0.040047716, -0.03474733, -0.010585424, -0.13982292, 0.0058999523, -0.05611864, -0.020375658, 0.1171784, -0.13653414, -0.010510062, -0.23348054, 0.32841045, 0.085443914, 0.05582177, 0.17286402, -0.07536615) * inp_5_0_0; + result4 += M4(-0.105701044, 0.0055946168, -0.068424866, 0.28518826, -0.1419545, -0.0033480595, -0.15887958, -0.1284714, 0.092785075, -0.013294496, -0.13797504, -0.11374121, -0.05244038, -0.041745532, -0.044629905, 0.14592455) * inp_5_1_0; + result4 += M4(-0.039473385, 0.016667891, 0.0031978255, 0.22926466, -0.035728347, -0.0048006247, -0.037035193, 0.022211924, 0.075197875, -0.011515439, -0.0002350182, -0.110827066, 0.062430806, 0.08953754, -0.100933895, -1.0008845) * inp_5_2_0; + result4 += M4(0.04095642, 0.03523955, 0.021876441, 0.07468147, -0.03628491, -0.13145937, -0.026317293, -0.18755473, -0.09626215, -0.028636714, -0.0940683, -0.0022245885, 0.1907466, -0.0075104735, 0.08550026, -0.23362629) * inp_5_0_1; + result4 += M4(0.09143216, -0.1266632, 0.05783249, -0.25104415, -0.16001162, 0.1260253, -0.01635084, 0.14715743, -0.06203885, 0.31056342, -0.021755705, -0.15887757, 0.16263153, -0.047489706, 0.036556732, -0.49565074) * inp_5_1_1; + result4 += M4(-0.05200418, 0.123212405, -0.01685267, -0.2663876, 0.00015575066, 0.23154494, -0.05773033, 0.03588002, -0.06586105, -0.02152106, 0.06252535, -0.00962661, 0.015322261, 0.052863587, -0.013198681, -0.58656317) * inp_5_2_1; + result4 += M4(-0.00039269286, -0.052142624, -0.042898796, -0.018772414, 0.093489796, -0.10340082, 0.016464384, -0.032887347, 0.048430678, -0.031949352, 0.0027134572, -0.17016664, 0.052216176, 0.0075392616, -0.092704825, -0.33045995) * inp_5_0_2; + result4 += M4(0.11755991, -0.042255007, -0.017143914, -0.20726724, -0.08805177, -0.013268589, 0.055681717, 0.31767672, 0.101473354, -0.024414746, 
0.0074703894, -0.1769745, 0.029685616, 0.0989569, -0.005018177, -0.17162028) * inp_5_1_2; + result4 += M4(-0.008338706, 0.01324496, -0.067789726, -0.111777425, 0.002397612, 0.11389789, -0.002835333, -0.2839883, 0.0054740873, -0.020009434, 0.085438564, 0.019215684, 0.025188267, -0.039302133, 0.01737349, -0.45482114) * inp_5_2_2; + result5 += M4(0.011233528, -0.030370748, -0.0056033977, 0.1405769, -0.013632174, 0.1811034, 0.01791712, -0.0217345, -0.07560408, 0.075660355, 0.0057367035, 0.0065147276, 0.021670358, 0.11397549, -0.051262494, 0.06001228) * inp_5_0_0; + result5 += M4(-0.038376495, 0.052995272, -0.033120967, -0.08012776, -0.07851079, 0.19220532, 0.07857965, -0.059333064, -0.2307005, 0.052897662, -0.0027991813, 0.06745769, 0.28804463, 0.17595169, 0.08324931, 0.08291818) * inp_5_1_0; + result5 += M4(-0.00089322776, -0.12731972, 0.005975614, 0.021670679, -0.096803114, -0.13316235, 0.004712358, 0.026525665, -0.020871181, -0.09755728, -0.016133219, -0.071284294, -0.08137697, 0.21427888, 0.018336821, -0.33874258) * inp_5_2_0; + result5 += M4(0.03580351, 0.0019478424, 0.0070350426, 0.008283084, 0.045394633, 0.025900071, 0.042914424, 0.041449305, 0.045430068, -0.25429165, 0.06961166, -0.08076151, -0.065529324, 0.13570659, -0.057939768, -0.091177434) * inp_5_0_1; + result5 += M4(0.014707097, -0.14771028, -0.09050319, 0.037257493, 0.03551058, -0.072607145, -0.01910474, -0.16191821, 0.025728233, -0.033240207, -0.022957142, 0.027783198, 0.12536895, 0.24879834, -0.0027322322, -0.27055278) * inp_5_1_1; + result5 += M4(0.08564408, -0.096858606, -0.03321823, 0.00391585, -0.0714128, 0.09010456, 0.07945547, -0.017609628, 0.021018073, -0.10225811, -0.007876666, -0.052467708, 0.018096993, 0.33184934, 0.032097474, -0.104311384) * inp_5_2_1; + result5 += M4(-0.048686717, -0.06793839, 0.029256001, -0.008618766, -0.031727325, 0.026663907, -0.017281586, 0.022322832, 0.04476352, -0.16771935, -0.013644622, -0.0037746977, 0.01837814, 0.11802892, 0.02561466, -0.16415071) * inp_5_0_2; + 
result5 += M4(-0.04738057, -0.22266848, -0.057847474, -0.061348636, 0.09780719, 0.13411331, 0.047367968, 0.07509483, -0.10801688, 0.06818776, -0.006035024, -0.03861783, 0.038379334, -0.018639319, -0.04932617, -0.17377199) * inp_5_1_2; + result5 += M4(-0.024082847, 0.011026896, 0.011392431, -0.0006626239, -0.013934467, -0.026957529, 0.019667279, -0.081639156, -0.0017702146, -0.06961195, -0.021819504, -0.09337104, 0.03227134, 0.06111691, -0.035430565, 0.05397633) * inp_5_2_2; + result6 += M4(0.08723617, -0.15685703, -0.011420155, -0.011860816, -0.019349966, -0.17326365, 0.023602288, -0.0006519195, 0.18131952, 0.2316517, -0.008294209, 0.047665905, -0.08477736, -0.046739988, 0.011925728, 0.02837569) * inp_5_0_0; + result6 += M4(0.05739363, -0.08614754, -0.16947506, -0.0020167672, -0.15113881, 0.13837765, -0.076638274, -0.0018632106, -0.10137812, -0.0672288, 0.011497005, 0.016244607, -0.10425687, -0.2854549, -0.13122094, -0.029997258) * inp_5_1_0; + result6 += M4(-0.057944074, -0.030108927, -0.1373179, 0.014940308, 0.036806006, 0.067855015, 0.17665218, 0.015243376, -0.046586033, 0.09691151, 0.034589026, -0.0027722016, 0.120801926, 0.09981655, 0.06498883, -0.02791484) * inp_5_2_0; + result6 += M4(-0.1055818, -0.20216429, 0.07618889, 0.05045324, -0.124078676, 0.0971568, -0.083990894, -0.0037262768, -0.16862415, 0.17035407, -0.20748077, 0.074987166, 0.009541244, 0.052398782, -0.018709803, -0.0114659285) * inp_5_0_1; + result6 += M4(-0.15500383, -0.13540241, -0.04381884, -0.03180128, 0.17580117, -0.13147719, 0.15651031, -0.06405652, 0.22646862, -0.17062064, -0.0012268446, -0.03821348, 0.09470291, -0.039777637, 0.06915523, -0.085813634) * inp_5_1_1; + result6 += M4(0.08187127, -0.06517709, -0.10847888, 0.085252166, 0.16315693, -0.036993474, -0.22202265, 0.0655328, -0.10142412, 0.17265755, -0.023184417, -0.005069489, 0.06851217, -0.2839705, -0.07529304, -0.036122385) * inp_5_2_1; + result6 += M4(0.014243031, 0.0743126, -0.12589347, 0.024750315, -0.014277149, -0.086918235, 
-0.0027030325, 0.060844444, -0.023898343, 0.13895226, 0.02028287, 0.05840617, 0.09580089, -0.060213435, -0.012504373, -0.075233646) * inp_5_0_2; + result6 += M4(0.020566981, 0.0024632663, 0.057662457, -0.018373294, 0.06949214, 0.16002536, -0.106589325, -0.011401631, -0.0647302, -0.21078208, 0.15034719, -0.012464964, 0.06277858, 0.1289562, 0.015662557, -0.022599358) * inp_5_1_2; + result6 += M4(-0.05505452, 0.03801007, 0.15293477, 0.049188383, 0.079358615, -0.09684197, -0.20114851, 0.086659975, 0.013301751, 0.018846836, 0.023613641, -0.036579743, -0.0149609, 0.015458627, 0.0065408773, -0.030299045) * inp_5_2_2; + result7 += M4(0.09383784, -0.029282423, -0.0015916231, -0.028218687, 0.037501723, -0.090598546, -0.025329769, 0.032853372, -0.12469133, -0.13983399, 0.008903812, 0.05373196, -0.09197212, -0.0056824116, 0.03545236, 0.035810795) * inp_5_0_0; + result7 += M4(-0.120160215, -0.10225633, 0.058183365, 0.0026089968, -0.008311286, 0.050880123, -0.015544347, -0.04903525, -0.00052959606, -0.23820823, -0.030964691, 0.059779994, 0.09381282, 0.31728634, -0.07896495, 0.030616276) * inp_5_1_0; + result7 += M4(0.008316228, -0.014775666, -0.0074982387, -0.008071902, 0.018461678, -0.15894704, 0.020570362, -0.0845733, -0.044071596, -0.06492385, -0.018960292, -0.20498532, 0.0025616996, -0.06250713, 0.016197, 0.1513245) * inp_5_2_0; + result7 += M4(0.098134495, 0.024417605, 0.0019695126, 0.18716235, 0.15864988, -0.057607673, -0.05244622, 0.017549768, -0.21017174, 0.050304946, -0.07619447, -0.089705996, 0.108391434, -0.041835867, 0.041826982, -0.03904611) * inp_5_0_1; + result7 += M4(-0.08746314, -0.09396118, -0.022764442, 0.22329745, -0.18711771, -0.0009974316, 0.016967025, -0.13114603, -0.16269569, 0.10433014, 0.10256059, -0.13948326, 0.12696609, -0.04163431, -0.09377791, 0.047001574) * inp_5_1_1; + result7 += M4(-0.07977763, 0.19222559, 0.04622463, 0.207601, -0.014672887, -0.023854997, 0.06709907, -0.052483622, -0.037427552, 0.0782116, 0.0015768566, -0.15164335, -0.0064576617, 
0.07888817, -0.022705128, 0.28746942) * inp_5_2_1; + result7 += M4(0.04720968, 0.0049305507, 0.03612931, -0.028772319, 0.13834672, -0.0059638037, 0.02689541, 0.018205956, -0.08386549, -0.06962395, -0.024217827, 0.0055049807, 0.013359512, -0.02760608, -0.016856447, -0.032100037) * inp_5_0_2; + result7 += M4(-0.039101366, -0.08461363, 0.012724582, 0.04656306, -0.1325854, 0.13503754, 0.021149468, 0.05541479, 0.08042394, -0.018439054, 0.06391846, -0.012647834, -0.14745922, 0.010879956, 0.0025640684, -0.013240188) * inp_5_1_2; + result7 += M4(-0.02938828, -0.060744494, 0.009262373, 0.003389516, -0.004608473, 0.07026646, 0.06646974, -0.16484001, 0.052399166, 0.025905645, 0.00056221406, -0.1480289, 0.03031097, 0.041789845, -0.033455618, 0.21912785) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.16726878, 0.02337552, 0.077711836, -0.035303667, 0.28888148, 0.011903164, 0.009890893, 0.13408768, -0.014630918, -0.024531221, -0.14364067, 0.35552832, 0.051582493, -0.027729131, -0.008941915, -0.050198626) * inp_6_0_0; + result0 += M4(0.06031827, 0.01283958, -0.054500632, -0.29180694, 0.1926464, 0.046478286, -0.012953861, 0.028309867, 0.07338482, -0.09366655, -0.18952733, 0.4947672, 0.13597332, 0.029126797, 0.003940812, 0.022494985) * inp_6_1_0; + result0 += M4(-0.06131129, 0.0065805055, 0.03400541, 0.0868839, -0.47281447, -0.0378859, -0.0038852096, -0.13411734, 0.0014843142, -0.0239335, -0.12203969, 0.25322163, -0.3501995, 0.03919864, 
-0.028649045, -0.12838832) * inp_6_2_0; + result0 += M4(-0.057226177, -0.015708182, 0.029291067, -0.09890923, -0.8038662, 0.029186271, 0.031551156, 0.11095968, -0.18775234, -0.10426555, -0.21890208, 0.44498083, -0.35465837, 0.014768906, 0.04590378, 0.020186672) * inp_6_0_1; + result0 += M4(-0.1810541, -0.05556737, -0.02345663, -0.019031838, -0.18267672, -0.0110956505, 0.059411153, -0.1799912, -0.42325044, -0.046144508, -0.3669907, 0.41050506, -0.03827697, 0.43151984, 0.060965925, 0.037502024) * inp_6_1_1; + result0 += M4(-0.25076795, -0.040769655, 0.014912258, 0.062949985, 0.62499535, 0.040447697, 0.13525623, 0.024621977, -0.0022891725, 0.047021404, -0.14613773, 0.12370907, -0.31843406, -0.056210525, 0.107680835, 0.0869449) * inp_6_2_1; + result0 += M4(0.075500175, -0.04237024, 0.0061615417, 0.014606728, 0.20219068, -0.037102263, -0.01404636, -0.14407852, 0.25612894, -0.03724413, -0.1371565, 0.05132959, 0.11178826, 0.013937922, -0.078624934, -0.08033157) * inp_6_0_2; + result0 += M4(-0.37913552, 0.033618778, 0.0004890857, 0.06519555, -0.018196115, 0.0033920875, 0.050734352, -0.030579861, -0.64095217, -0.009908416, -0.22201966, -0.0823433, 0.14061137, 0.09472235, -0.069085084, -0.018985178) * inp_6_1_2; + result0 += M4(-0.12943813, -0.03931841, 0.013589274, -0.009239447, -0.040991627, 0.0061563873, 0.013980528, 0.04348537, -0.028306589, -0.02088455, -0.118037865, 0.041151322, -0.5478752, -0.047780987, -0.07446175, 0.051432613) * inp_6_2_2; + result1 += M4(-0.008555478, 0.04565402, -0.20191152, 0.08482234, 0.028767552, -0.12927094, 0.061445545, 0.08831772, -0.11385296, -0.12331531, -0.17769542, 0.05100599, -0.058694936, 0.050537553, 0.09582638, -0.019451087) * inp_6_0_0; + result1 += M4(0.22051308, 0.22837734, -0.074975744, -0.07225254, -0.100266196, 0.07685327, -0.07391262, 0.17098041, -0.032100398, -0.3787696, -0.26682273, -0.02349713, -0.013915506, 0.035658278, 0.18581918, 0.010441641) * inp_6_1_0; + result1 += M4(0.058614206, -0.21317482, 0.022746429, 
-0.14420031, -0.0020425997, 0.11044943, -0.032726903, -0.17901061, -0.0031252138, 0.006142974, -0.024956953, -0.10176778, -0.0004878129, 0.01368177, 0.11592114, 0.041805103) * inp_6_2_0; + result1 += M4(0.19395952, -0.060396094, 0.07851155, -0.13842146, -0.066420026, -0.06402058, -0.07195997, -0.19818011, -0.081449166, -0.09736735, -0.24441877, 0.07259191, 0.053844456, -0.027458532, -0.07396858, 0.018261602) * inp_6_0_1; + result1 += M4(-0.03908553, 0.08431586, 0.1502409, -0.17488427, 0.0420161, 0.0352037, 0.005702128, 0.019561678, 0.49739978, -0.3714236, -0.48853144, -0.4776428, 0.16517457, 0.0024230934, -0.17026031, 0.24317311) * inp_6_1_1; + result1 += M4(0.041106287, 0.069029324, -0.051005654, 0.15695803, -0.07960427, -0.08153068, 0.009307281, 0.083104655, 0.05567405, -0.36288092, -0.06000766, -0.44933298, -0.09430687, -0.10819884, 0.08357422, -0.013167584) * inp_6_2_1; + result1 += M4(0.068717465, -0.017653326, -0.0044030654, -0.14711158, -0.012968301, -0.22838975, -0.038133487, 0.06696954, 0.0026133382, 0.14791167, -0.04691662, -0.08854464, -0.006476051, 0.0850852, -0.010678731, 0.03420895) * inp_6_0_2; + result1 += M4(-0.008083416, -0.034217224, 0.04163466, 0.013660057, 0.0340068, -0.013922894, 0.039221708, -0.08806377, -0.03705716, 0.05893824, -0.04710652, -0.51105094, 0.06246556, 0.0031851276, -0.0036289543, -0.012623156) * inp_6_1_2; + result1 += M4(0.050628018, 0.05477649, -0.012073569, 0.020351788, 0.030532775, -0.0074954936, -0.03253457, -0.027320608, -0.03623883, -0.098306954, -0.05111786, -0.106320605, 0.0041741705, 0.0805276, -0.0028842492, 0.031043177) * inp_6_2_2; + result2 += M4(-0.051816043, -0.08162155, -0.035834722, 0.04149071, -0.017222058, 0.1202846, -0.02230568, -0.021887813, -0.107688256, -0.14901721, 0.32219905, -0.051110163, 0.020707764, -0.077505805, -0.00611336, 6.571097e-05) * inp_6_0_0; + result2 += M4(-0.13764429, -0.16772093, -0.1534153, -0.17853442, 0.04130026, -0.074790895, -0.02435289, -0.08679415, -0.06861776, -0.10177034, 
0.39531022, -0.18689139, 0.015560553, -0.03354407, -0.09339321, -0.083455384) * inp_6_1_0; + result2 += M4(-0.033349402, 0.15530822, -0.019670071, -0.11229556, -0.08714364, -0.17163718, 0.035208836, -0.120149784, -0.003269507, 0.21157314, 0.16743843, -0.19911668, 0.064635165, -0.11787982, 0.042104848, 0.08591811) * inp_6_2_0; + result2 += M4(-0.03812131, 0.18001193, 0.08615761, -0.08233446, -0.011098239, 0.00524373, 0.030241583, 0.0036737868, -0.10505102, -0.30685636, 0.30573812, -0.029944759, -0.008553355, 0.0051635103, -0.03841724, 0.023594452) * inp_6_0_1; + result2 += M4(-0.024761254, -0.05848222, -0.032456666, 0.01979826, 0.050810054, -0.1760262, 0.04564554, 0.10715419, -0.8558648, -0.38139126, 0.86497164, -0.09869271, -0.09056967, 0.24813749, -0.37562025, 0.050213464) * inp_6_1_1; + result2 += M4(-0.0031948248, -0.14299113, 0.03162738, 0.1303994, 0.03930452, -0.018447455, 0.029013438, -0.06324793, -0.026344039, -0.026901193, 0.2294999, -0.15878648, -0.044261668, 0.0896783, 0.19630735, -0.21652722) * inp_6_2_1; + result2 += M4(-0.10854681, 0.07352848, 0.0009575898, -0.07184708, 0.07462978, 0.23633583, -0.018467274, 0.020680806, -0.046588037, -0.14631374, 0.16218774, -0.02519933, 0.00081205636, -0.03667594, 0.00037472384, 0.014701852) * inp_6_0_2; + result2 += M4(-0.012597556, 0.040239267, -0.1545256, 0.04088659, -0.0071228, 0.029709334, -0.07729832, 0.029503794, 4.3520216e-05, -0.3444901, 0.14977348, -0.0904957, 0.09486538, -0.056630686, -0.04801506, -0.0655883) * inp_6_1_2; + result2 += M4(-0.032831248, -0.095781, -0.08001119, 0.07166758, -0.044561706, -0.02722725, -0.0078305295, -0.055165008, 0.0053979997, -0.0075720716, 0.04506346, -0.0030553632, 0.056965515, -0.15107843, 0.08087521, -0.016785566) * inp_6_2_2; + result3 += M4(-0.011304765, 0.042982396, 0.07333254, -0.15808621, -0.010596216, 0.024228621, -0.06672704, 0.01127709, -0.11750455, 0.048861068, -0.031668387, -0.045650184, -0.03780641, -0.019473178, 0.0013867359, -0.04830007) * inp_6_0_0; + result3 
+= M4(-0.0046306285, -0.10906396, 0.13108574, -0.22441192, -0.034656122, 0.07466032, 0.051100947, -0.04088952, 0.0022658426, 0.022575997, 0.053428896, -0.2216837, -0.04348988, -0.06219343, 0.032726657, -0.10037727) * inp_6_1_0; + result3 += M4(-0.15779862, -0.13251221, -0.014556472, -0.09607967, 0.2680997, -0.15307818, -0.22778739, -0.00489924, 0.12760034, 0.011123271, 0.14743617, 0.029021882, 0.022585029, -0.10740373, -0.055735435, 0.15033849) * inp_6_2_0; + result3 += M4(-0.1484505, -0.017671613, -0.0032535237, 0.06376863, 0.009464662, -0.049705524, -0.11347451, 0.052946683, -0.1362056, -0.058462933, -0.0800612, -0.021057282, 0.084422134, -0.0019610696, 0.040895924, 0.059515502) * inp_6_0_1; + result3 += M4(-0.15065177, -0.12641229, 0.068029374, -0.0946125, -0.45817226, -0.1478491, -0.02126277, -0.031390682, -0.09608857, -0.1526375, 0.16725342, -0.2977865, 0.10580002, 0.068876594, 0.18560548, -0.19339715) * inp_6_1_1; + result3 += M4(0.03611996, -0.15198688, 0.120738015, -0.029970955, -0.20053011, -0.29047492, 0.020352677, -0.04749614, 0.16482808, 0.07731309, 0.2239227, -0.3563899, 0.0051016877, 0.19389103, -0.18571039, -0.078352235) * inp_6_2_1; + result3 += M4(-0.0422524, 0.034567285, -0.0154731395, -0.0010164597, -0.06711847, 0.14366814, 0.042417593, -0.15601753, -0.394073, 0.02146194, -0.06259202, 0.0063437214, -0.040900424, -0.06296466, -0.055456385, -0.0039197397) * inp_6_0_2; + result3 += M4(-0.27073866, -0.044074923, -0.026710993, 0.040608283, -0.06941842, -0.3380804, -0.0075574806, 0.08325098, -0.34815624, -0.26169232, 0.12886062, 0.07943478, -0.07662732, -0.029616397, -0.016310096, 0.05584229) * inp_6_1_2; + result3 += M4(0.027694073, -0.11943827, 0.022466535, 0.036501616, 0.0016555354, 0.18194753, 0.046705216, 0.020957671, -0.11640241, 0.007398838, 0.20677792, -0.029324407, 0.05397739, -0.0072574904, 0.0914181, 0.070041664) * inp_6_2_2; + result4 += M4(0.07863554, -0.036211852, 0.07442452, 0.065366924, -0.04510162, 0.0030608699, -0.0056208484, 
-0.28072548, 0.16514198, -0.011676702, 0.25184974, 0.04918739, 6.7890556e-05, -0.022788605, -0.05768242, 0.002378575) * inp_6_0_0; + result4 += M4(0.11896412, 0.048449878, 0.115514375, -0.069473594, 0.07949468, 0.122040115, -0.0037255713, 0.112943925, 0.19794042, -0.18011995, 0.10669835, -0.110208444, 0.0076629603, -0.005969908, -0.042079974, -0.2219789) * inp_6_1_0; + result4 += M4(0.0261149, 0.044957407, 0.0017095043, -0.23372293, 0.00072821684, 0.04222988, -0.02462424, -0.009386419, 0.18656869, -0.034705825, 0.09576087, -0.13062485, 0.034064356, 0.04706837, 0.0108686825, -0.4326083) * inp_6_2_0; + result4 += M4(0.1909092, -0.109210275, -0.025459444, 0.066925555, 0.040790316, 0.04747867, 0.13884526, 0.023584604, 0.013651083, -0.306847, 0.28757414, 0.050726544, 0.002901525, 0.032665133, -0.0086309025, 0.07343837) * inp_6_0_1; + result4 += M4(-0.022420825, -0.20841351, -0.08048325, 0.12100547, -0.21724851, -0.07345898, -0.0106133735, 0.0895624, 0.2022069, -0.39320457, 0.071119554, -0.0863043, -0.10923801, 0.079745725, -0.1292732, 0.20092624) * inp_6_1_1; + result4 += M4(-0.06487443, 0.019293578, 0.093959495, -0.11587859, 0.1920757, -0.054173063, 0.072559506, -0.105986014, 0.123024404, -0.20599556, -0.12720715, -0.2572074, 0.2344029, -0.1650412, 0.012668855, 0.2621401) * inp_6_2_1; + result4 += M4(0.03779558, -0.024345582, -0.04235648, -0.28064886, 0.10811407, -0.05817636, -0.011114456, -0.23404925, 0.20522195, -0.116229795, 0.011712314, 0.052991785, 0.02051668, 0.008213255, -0.0801853, -0.034602016) * inp_6_0_2; + result4 += M4(0.002073337, 0.09030672, -0.025383666, 0.26505256, 0.05167131, -0.05913865, -0.02019792, 0.05260761, 0.07007701, -0.23771165, -0.09253976, -0.076662965, 0.040042397, 0.027673334, -0.1385559, 0.025858862) * inp_6_1_2; + result4 += M4(-0.060122848, -0.017264307, 0.03408162, -0.037669934, -0.0051638624, 0.060466327, -0.051729687, 0.061894096, 0.06570809, 0.020399906, -0.02639405, -0.32674098, 0.03620623, -2.700061e-05, 0.057435904, -0.16229191) 
* inp_6_2_2; + result5 += M4(0.019151725, -0.00067892525, 0.01249173, -0.025109585, -0.057257466, 0.09643532, 0.032189075, 0.0030910573, 0.09102012, 0.13997632, -0.076211736, -0.049396016, 0.0758233, -0.04184735, 0.041656617, -0.023186633) * inp_6_0_0; + result5 += M4(0.12635179, -0.20093161, -0.041765526, -0.15793595, -0.020173667, -0.21873972, -0.0035302062, -0.026682058, 0.1779854, -0.12745951, 0.0244154, -9.597553e-05, -0.03827408, -0.15596522, 0.09020815, -0.109819844) * inp_6_1_0; + result5 += M4(-0.00075776194, 0.11454285, 0.01392678, 0.121896744, 0.030620914, -0.0029977555, 0.013663747, 0.00084922696, 0.07865007, -0.049442574, 0.021680849, 0.042142052, -0.020498823, -0.22637348, 0.0614096, -0.04863722) * inp_6_2_0; + result5 += M4(-0.035151657, -0.042745184, -0.055083673, 0.047766786, 0.1135874, 0.08016404, -0.07168598, 0.005107598, 0.11475242, -0.10980326, -0.050768673, -0.042571474, 0.010000346, 0.12790751, 0.033862002, 0.11367156) * inp_6_0_1; + result5 += M4(-0.041150346, -0.07492101, 0.12285059, -0.03447812, -0.020447701, -0.03266682, 0.021030348, -0.09602725, 0.1304616, -0.06513713, -0.083017, 0.13124208, 0.044711158, 0.23591313, 0.21460588, -0.11631257) * inp_6_1_1; + result5 += M4(0.029400103, 0.043555398, -0.013762911, 0.073865004, -0.07119288, -1.0364439e-05, 0.0126738325, 0.14511266, 0.19465037, 0.0013221118, -0.016896866, -0.03914429, 0.09753666, 0.17093673, -0.1356848, -0.14183028) * inp_6_2_1; + result5 += M4(-0.025005903, 0.010155256, -0.025936427, -0.0405672, -0.02723638, 0.06003205, -0.031763673, 0.012658598, 0.005140826, 0.025754128, -0.08343783, 0.10173264, -0.017245816, -0.06569329, 0.0026540714, 0.047640856) * inp_6_0_2; + result5 += M4(-0.034346513, -0.16129138, -0.009168271, 0.11254457, -0.010352256, 0.1587262, 0.014414777, -0.08211211, 0.1135565, -0.07931767, -0.017976725, 0.033258602, 0.031663466, -0.036053393, 0.21427007, 0.046158317) * inp_6_1_2; + result5 += M4(-0.09185946, -0.14098816, -0.0015973342, 0.09322096, 0.045175068, 
0.07779206, 0.0012580156, 0.028436018, 0.10802001, -0.10910535, 0.003451664, -0.043159433, 0.031708997, -0.1731695, 0.041159328, -0.15916665) * inp_6_2_2; + result6 += M4(-0.0958679, -0.26637122, -0.026185092, 0.055466387, -0.04198706, -0.020821463, -0.09545562, 0.03068713, -0.20666893, 0.12167395, 0.026612062, -0.08212436, -0.0040794667, -0.086372055, -0.08609278, -0.02917526) * inp_6_0_0; + result6 += M4(0.18580501, 0.017033009, 0.110363975, -0.0418414, -0.025084877, -0.12840068, 0.07177904, 0.0127869, -0.43072087, 0.043192487, 0.010066773, -0.11958247, -0.13177611, 0.0924337, 0.06621749, 0.012264197) * inp_6_1_0; + result6 += M4(-0.015664237, -0.013518279, -0.111916706, 0.03054919, 0.12574184, 0.18625127, 0.15648505, -0.009408972, -0.0780395, 0.06971044, 0.0397292, -0.053990994, -0.013551904, 0.18145713, 0.07709254, 0.051109567) * inp_6_2_0; + result6 += M4(-0.05058331, -0.12537445, 0.050288465, -0.035371277, 0.13732839, -0.5179359, 0.017640235, 0.03727855, -0.3730922, 0.1254433, -0.05149198, -0.036945563, 0.022061089, -0.07633489, -0.047491677, -0.0004574731) * inp_6_0_1; + result6 += M4(0.0029672752, -0.0951583, 0.19591388, 0.0049881227, -0.13086346, -0.73776966, -0.22234154, 0.056313418, -0.27, -0.30227312, 0.3365131, 0.321545, 0.25795555, 0.015529492, 0.05726952, 0.03807587) * inp_6_1_1; + result6 += M4(-0.09282181, -0.08185934, 0.107564256, 0.0097432, -0.09269917, 0.09159919, -0.04614701, 0.06642886, 0.089561746, -0.10309312, 0.16146429, -0.09713908, 0.032345425, -0.037576836, -0.20319611, -0.15360212) * inp_6_2_1; + result6 += M4(0.032014478, -0.13974293, 0.052892286, 0.020222604, -0.16960494, -0.2826723, 0.29836568, 0.025542576, -0.04915736, 0.24182443, 0.042811643, -0.0973593, -0.060745683, 0.08006753, -0.014213451, -0.04268057) * inp_6_0_2; + result6 += M4(0.06054807, 0.062498067, 0.013407407, 0.061428536, 0.1297064, -0.22709037, -0.04131349, -0.06487632, 0.07992309, 0.21329872, -0.10006117, -0.092103615, -0.06569273, -0.1263074, -0.053103503, 
-0.0495854) * inp_6_1_2; + result6 += M4(-0.077612616, -0.022991799, 0.06686076, 0.00031374677, 0.059132006, 0.036846858, -0.0721737, 0.035311807, 0.1696031, 0.21869786, 0.14040108, -0.12660657, -0.17465432, 0.12630653, -0.009293485, -0.03878277) * inp_6_2_2; + result7 += M4(0.05440344, 0.031686533, -0.020907454, 0.10951271, 0.040619228, -0.15170762, -0.014436217, 0.004299437, 0.0035665198, 0.038972534, 0.01877531, -0.0003444911, 0.05165928, 0.03648476, -0.0172968, 0.00632726) * inp_6_0_0; + result7 += M4(0.17325996, -0.14213556, -0.028062949, 0.18187171, 0.019167548, -0.044269823, -0.004191864, 0.002324773, 0.040318165, 0.17592503, -0.06979839, 0.011143587, 0.02297659, -0.11920922, -0.048505023, -0.025443109) * inp_6_1_0; + result7 += M4(0.08409119, -0.015401151, 0.03091349, 0.037520166, -0.051030744, 0.06852024, 0.037610646, -0.042096093, 0.07281579, 0.12589635, -0.03785591, 0.18377404, 0.021303631, -0.22469413, -0.029890792, -0.13206983) * inp_6_2_0; + result7 += M4(0.14067635, -0.036883865, -0.0025350545, 0.033165004, -0.08287977, 0.1829904, 0.010653497, -0.043646075, 0.038258407, 0.052552413, 0.0017300351, 0.016791333, 0.005788829, 0.04430054, 0.01148681, 0.017427737) * inp_6_0_1; + result7 += M4(0.044377204, -0.2762078, 0.015994258, 0.06664877, 0.090133816, 0.07393251, -0.060353596, 0.23897074, 0.6179383, 0.15073742, -0.12735355, 0.16166665, -0.29235646, 0.10062159, -0.023016633, 0.043823622) * inp_6_1_1; + result7 += M4(0.17045426, 0.018254476, -0.05128312, 0.06370928, -0.0019476673, -0.24873239, -0.008143482, -0.22970337, 0.113136314, -0.048174266, -0.034583163, 0.17667745, -0.18698286, -0.3460756, -0.09774891, -0.3594588) * inp_6_2_1; + result7 += M4(0.04260384, -0.029794449, 0.0069529004, -0.019075565, 0.16143136, -0.0505453, 0.008099726, 0.26149747, 0.10733593, 0.04892239, -0.03790028, -0.18737046, 0.0594152, -0.0020483532, -0.02393423, 0.041325405) * inp_6_0_2; + result7 += M4(-0.04716326, -0.0848431, -0.009930468, 0.09281659, -0.0010374289, 
0.015504248, 0.033682622, 0.053844802, 0.17517996, 0.027516868, -0.046616595, 0.11026857, -0.043579206, -0.0022518858, 0.013194802, 0.16172068) * inp_6_1_2; + result7 += M4(0.05315299, 0.051655922, -0.011361677, 0.00078263704, -0.012073149, 0.0028341622, -5.791313e-05, -0.020606972, 0.063796036, 0.04006447, -0.00550045, 0.36251128, 0.06067084, 0.005258376, -0.0012393355, -0.31838936) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.13234818, 0.024140459, 0.02059781, 0.06852567, -0.43825418, 0.018238941, -0.122793674, 0.3793741, -0.45896035, 0.016663015, -0.07337706, 0.5490679, -0.017448904, 0.012453136, -0.16871272, -0.2665986) * inp_7_0_0; + result0 += M4(-0.08695993, 0.02502302, 0.11226634, -0.056313213, 0.0063000424, 0.029156705, -0.030290717, 0.23947251, -0.25632492, -0.029924147, 0.017257797, -0.13141802, -0.2502964, -0.10639868, -0.1390605, -0.26825) * inp_7_1_0; + result0 += M4(0.04827805, 0.0064410353, 0.0142085375, -0.029163508, -0.63364595, 0.008122169, -0.016164683, 0.089902334, 0.26723737, -0.010226287, -0.080133036, -0.013090045, 0.27368426, -0.010752454, 0.02717971, 0.09543269) * inp_7_2_0; + result0 += M4(-0.2704793, 0.1909402, 0.10042331, 0.040969882, -0.38325265, -0.032312315, 0.031240776, 0.15624237, -0.2482152, -0.024394402, -0.10327549, 0.15105595, 0.03178416, -0.08104968, 0.083295025, -0.102572456) * inp_7_0_1; + result0 += M4(-0.46608293, 0.2581852, -0.038559817, 0.097761236, 0.40059385, 0.028512845, 
-0.07379742, -0.011084663, -0.46189255, 0.063741334, 0.067148454, -0.0013313569, 0.33348557, 0.1115847, 0.030679429, 0.18109667) * inp_7_1_1; + result0 += M4(0.13822377, 0.04204411, 0.020339737, -0.0012192341, -0.16125815, -0.013855569, -0.03607968, 0.124595635, -0.10623776, -0.005419131, -0.07400978, 0.04839035, -0.21052846, -0.025509095, -0.065525725, 0.011313502) * inp_7_2_1; + result0 += M4(-0.24804014, -0.01698101, -0.021685282, -0.1646782, -0.77832264, -0.014908361, -0.19158065, -0.028142458, 0.4732883, -0.0567988, -0.07517578, 0.114466675, 0.008870034, 0.0071364488, 0.033320315, -0.029111737) * inp_7_0_2; + result0 += M4(0.3797558, -0.0031718987, 0.040338196, -0.12195105, -0.04232809, 0.0067141633, -0.098415874, -0.012539671, -0.3970521, 0.043328803, -0.0860958, 0.15677075, -0.10516383, 0.0012027385, -0.027895002, 0.08783902) * inp_7_1_2; + result0 += M4(-0.051467173, 0.0086186575, 0.0026782842, -0.07827038, -0.24736173, 0.017300595, -0.058101714, -0.04303714, -0.47835463, -0.0074044233, 0.002885336, 0.02689168, 0.07279945, 0.009417397, 0.024617016, -0.03448469) * inp_7_2_2; + result1 += M4(0.120639876, 0.020868301, -0.034151245, 0.01596658, -0.036627162, 0.05034021, 0.020224286, 0.19381411, 0.083688706, 0.16616055, 0.049868044, 0.08023313, -0.09315864, 0.014191121, -0.014214762, 0.1224369) * inp_7_0_0; + result1 += M4(0.07042414, -0.118559286, 0.0019590901, 0.09782385, 0.02881862, -0.4078902, -0.18111974, -0.081410505, -0.08575127, -0.019851848, 0.009251313, -0.20036396, -0.02814018, 0.1724281, -0.016811747, -0.13820945) * inp_7_1_0; + result1 += M4(0.00832213, 0.006434059, 0.039778367, 0.033260122, 0.086187065, 0.049207654, -0.10078501, -0.0166481, 0.0032611024, 0.14055222, -0.010150389, 0.073782206, -0.06512125, -0.101720855, -0.035533793, -0.06191057) * inp_7_2_0; + result1 += M4(0.053763367, -0.069144346, -0.20957503, -0.008475853, 0.11309106, -0.05643106, -0.057507116, -0.1396303, 0.05890346, -0.21478657, -0.038411908, -0.08232966, -0.011029945, 
-0.13585196, -0.003445853, -0.07545529) * inp_7_0_1; + result1 += M4(-0.019711347, 0.20943874, -0.21868145, 0.0804203, 0.29745734, 0.16547026, 0.085580975, 0.19694416, 0.112818934, -0.034139078, -0.028760202, -0.19049959, 0.043886617, 0.04856925, 0.055728722, 0.17125185) * inp_7_1_1; + result1 += M4(0.016649177, 0.00501597, -0.012714835, -0.017148575, 0.026360888, 0.08068654, 0.011417158, -0.035976347, -0.047410972, 0.13938464, 0.024304058, -0.05510768, -0.051847547, 0.06317871, -0.06413971, -0.091084) * inp_7_2_1; + result1 += M4(0.1454137, 0.042932123, 0.11815033, -0.059083346, 0.028317006, 0.10444435, 0.01732113, 0.028499572, 0.19098248, -0.12168602, -0.117420115, -0.18469682, -0.02500652, 0.006244789, -0.003142881, 0.04107069) * inp_7_0_2; + result1 += M4(-0.0016273146, -0.26632673, 0.08947516, -0.04918196, 0.07012229, -0.15446419, -0.12814572, -0.13558093, 0.12853512, 0.17451707, -0.08464202, -0.059710413, 0.021987932, 0.048532978, -0.067074046, -0.07095954) * inp_7_1_2; + result1 += M4(0.12174815, 0.017727569, -0.0016656194, 0.0651322, -0.0042228177, -0.09287039, -0.08434903, 0.09181954, 0.055689488, -0.10255101, -0.12400715, -0.41026542, 0.028954132, -0.024644546, 0.03617046, 0.03233503) * inp_7_2_2; + result2 += M4(0.020622054, 0.106160074, -0.07232268, 0.088880114, 0.04194982, -0.073700055, -0.0018225019, 0.03528085, -0.05522113, -0.12694271, 0.11073129, 0.24080318, 0.031235753, -0.09278874, 0.041168455, -0.05719343) * inp_7_0_0; + result2 += M4(0.061155282, 0.13887388, -0.07663722, -0.0007587725, 0.042244315, 0.055959538, -0.030442063, -0.027642366, 0.05914553, 0.27082765, -0.096839264, -0.023224281, -0.16004892, -0.22175674, 0.09217488, -0.13198678) * inp_7_1_0; + result2 += M4(0.020568248, -0.12714969, -0.02009391, 0.07749078, 0.017737765, 0.0045806, 0.0045985733, 0.030062703, -0.09190093, -0.058277532, 0.027318913, 0.020496784, 0.009242568, 0.16957264, 0.020597862, -0.05769434) * inp_7_2_0; + result2 += M4(-0.071334586, 0.08517156, -0.09522769, 
0.04766956, -0.013629994, 0.12580644, 0.15124352, -0.10273451, 0.04600422, -0.0019151275, -0.015777286, 0.07841785, -0.07107558, -0.005298428, 0.036940023, -0.042208157) * inp_7_0_1; + result2 += M4(0.028360212, -0.22684225, -0.009063659, 0.21087845, -0.040492717, -0.21401477, -0.019912632, 0.08306076, -0.08369832, 0.15740356, -0.027352918, 0.10341503, 0.108977176, 0.1241696, -0.2058242, -0.058593374) * inp_7_1_1; + result2 += M4(0.04030781, -0.0015453289, -0.080386624, -0.073584706, 0.06508918, 0.06421752, 0.020496856, -0.01442261, -0.018723447, -0.11739721, 0.05159809, 0.0510422, -0.038075637, -0.08721064, 0.11245838, -0.01027726) * inp_7_2_1; + result2 += M4(0.123719096, -0.086290866, -0.02953306, 0.012487517, 0.058338538, -0.28617778, 0.06058064, 0.04701797, -0.12604283, 0.2627012, 0.005426399, -0.02776385, 0.035178278, -0.09496975, -0.03458914, 0.022614961) * inp_7_0_2; + result2 += M4(-0.043985445, 0.20527525, 0.1133241, 0.015265315, 0.0043510045, 0.020892188, -0.021317627, -0.030664029, -0.05490803, -0.060274836, 0.10031827, 0.17601359, -0.040775437, 0.0023056045, 0.07625351, -0.020901848) * inp_7_1_2; + result2 += M4(-0.027881717, 0.052852046, -0.08201233, 0.004607959, -0.0041412394, -0.06508582, 0.06523831, 0.054485995, -0.015364985, 0.17650962, 0.084719524, -0.039732866, 0.037317257, 0.058177054, -0.031347405, -0.016701564) * inp_7_2_2; + result3 += M4(-0.079142794, 0.020865908, -0.025012389, 0.061442696, 0.00046456518, -0.0076775257, -0.08181043, -0.22849555, -0.04719709, -0.07264326, -0.110643126, -0.14200874, 0.19270246, -0.047899306, 0.031535115, -0.18195975) * inp_7_0_0; + result3 += M4(0.0014382731, 0.01902578, 0.036787193, -0.050848518, 0.037131432, 0.07913654, 0.057818256, -0.23181073, -0.017667694, -0.014536636, 0.11511683, -0.06638014, 0.05730292, -0.013213898, -0.041609623, -0.32897407) * inp_7_1_0; + result3 += M4(-0.012513578, -0.03199077, -0.011343825, 0.108299285, 0.08520598, 0.03587075, 0.055777445, -0.18219969, 0.020219756, -0.022256203, 
-0.0034907956, 0.077401996, -0.018888174, 0.07118487, -0.07521588, -0.05902322) * inp_7_2_0; + result3 += M4(-0.18665208, -0.031329613, -0.052610084, -0.0202129, -0.12930258, 0.056678157, 0.0035870606, -0.10903017, -0.22052027, -0.21295534, 0.0641488, 0.006575033, 0.23252448, 0.02751876, 0.2414994, -0.18703108) * inp_7_0_1; + result3 += M4(0.27316484, -0.18469532, -0.05333985, 0.14527515, -0.004299906, -0.16162455, -0.051801134, -0.0697147, 0.16622977, 0.1762794, 0.012692535, -0.099797025, -0.23517591, 0.07453538, -0.3477133, 0.15215652) * inp_7_1_1; + result3 += M4(-0.08222191, -0.0924424, -0.13454486, 0.024854574, -0.033335134, 0.15770987, 0.09670961, 0.03560501, 0.030030804, -0.12069965, -0.004479698, -0.23019435, 0.06902405, 0.0485293, 0.06832267, 0.008212818) * inp_7_2_1; + result3 += M4(-0.12941474, -0.088538855, -0.16145591, 0.04118807, -0.11231108, 0.0038192105, -0.06965243, -0.022071244, 0.077731125, 0.15280017, 0.0040792474, -0.027544567, 0.09617461, -0.017672416, 0.0022583858, 0.06582279) * inp_7_0_2; + result3 += M4(-0.030117944, -0.12556112, 0.07855222, -0.07041124, -0.09424343, -0.016811552, -0.06816887, -0.008770295, 0.08754525, -0.16535464, 0.06419486, 0.03041267, 0.0097553395, 0.041041676, -0.0650508, 0.026939217) * inp_7_1_2; + result3 += M4(-0.033823106, -0.11061437, -0.03672665, -0.043687828, 0.016310422, 0.112685375, -0.021530747, 0.010922581, -0.17197768, 0.13647681, 0.031206718, -0.07963588, -0.02933936, 0.008593718, 0.028987492, -0.06305942) * inp_7_2_2; + result4 += M4(-0.047512725, 0.024654962, 0.004643964, 0.26897344, 0.070306435, 0.112824, 0.053099077, -0.1434266, 0.03842663, -0.03992556, 0.033379946, 0.107225664, 0.13365781, -0.037673056, 0.21686989, -0.53475374) * inp_7_0_0; + result4 += M4(0.030065678, 0.083722286, -0.05224997, -0.21260102, 0.010389271, -0.06578777, -0.057258826, -0.10819672, -0.04085065, 0.071403295, -0.04003213, 0.07820922, -0.02843226, -0.23045602, 0.14640798, 0.21712236) * inp_7_1_0; + result4 += M4(0.029375335, 
0.01530824, 0.052318417, -0.037822567, 0.07263983, -0.013356238, -0.094286054, -0.096665934, -0.0056734295, -0.037345275, 0.04929006, 0.107552186, -0.014330267, -2.1985888e-05, -0.05051373, 0.08536556) * inp_7_2_0; + result4 += M4(0.008718212, 0.009928445, 0.00046487228, 0.022819841, 0.09483474, 0.030926187, -0.011275541, 0.13425766, 0.184821, -0.066433184, 0.10382169, -0.099208705, 0.035321396, -0.09237296, 0.21718387, 0.1294959) * inp_7_0_1; + result4 += M4(-0.047972325, 0.07110202, 0.11825178, 0.06483475, 0.08112725, -0.10962242, 0.03660568, 0.26444703, 0.15646888, -0.041350093, -0.060285214, -0.1307824, -0.059748475, 0.22015378, -0.17793809, 0.01958505) * inp_7_1_1; + result4 += M4(-0.0012753924, 0.0862962, 0.0026247662, -0.09131616, -0.018739192, 0.071253836, -0.05191729, 0.21759342, -0.06978092, -0.04853693, 0.106194675, 0.29386562, -0.0040828367, -0.023282863, -0.019179676, -0.11184075) * inp_7_2_1; + result4 += M4(0.11370803, 0.031004118, -0.028854689, -0.1002713, 0.014114363, -0.023677448, -0.05228997, 0.035635523, -0.02329999, -0.054726932, 0.043629427, -0.03266707, -0.046005413, 0.034397162, 0.049573578, 0.110119104) * inp_7_0_2; + result4 += M4(0.21991117, -0.08071918, 0.12767422, 0.033683427, 0.050345413, 0.020746185, -0.1031993, 0.27932635, -0.008108492, -0.056558486, 0.08301507, 0.44316688, 0.0068652625, -0.034775894, -0.0100502, -0.08829247) * inp_7_1_2; + result4 += M4(-0.045197904, -0.0039110426, 0.008551729, 0.074192815, 0.034783233, 0.005694333, 0.029502572, 0.046073496, 0.06818265, 0.0034356776, -0.10520141, -0.029901898, 0.025677385, 0.004649126, -0.014201963, -0.009314913) * inp_7_2_2; + result5 += M4(-0.0152262505, 0.04112893, -0.012193331, 0.09269423, 0.045208376, 0.14724231, -0.014657305, -0.061980486, 0.18461047, -0.043901265, 0.029602895, 0.10525452, 0.10954091, -0.11964209, 0.0033518581, -0.24894364) * inp_7_0_0; + result5 += M4(-0.12376315, -0.11762766, 0.0038412586, -0.043043792, 0.03970286, 0.2391605, 0.0028833454, 0.06441764, 
-0.12192651, -0.2876178, 0.02315545, 0.12040522, 0.242298, -0.06216442, -0.04319146, -0.18767585) * inp_7_1_0; + result5 += M4(-0.009807402, -0.06350806, -0.018244635, 0.0036108517, 0.046721287, -0.01664753, 0.022530906, 0.06195682, 0.08243953, -0.2068215, 0.0010408794, 0.012249968, 0.0011985519, 0.17430706, -0.01604266, 0.05597206) * inp_7_2_0; + result5 += M4(0.0331121, 0.2132486, 0.018717118, 0.08270584, 0.058101498, 0.12564899, 0.0088256635, 0.031151576, -0.027145183, -0.16707194, -0.020464635, 0.18196811, 0.02538494, 0.24251193, 0.08546804, -0.2179097) * inp_7_0_1; + result5 += M4(-0.102173194, 0.16821802, -0.034983687, 0.16153032, -0.035508722, 0.4272775, 0.044508364, 0.1498723, 0.060956605, -0.2567921, -0.032972004, -0.07443882, -0.012709201, -0.078562036, 0.32701463, 0.22750773) * inp_7_1_1; + result5 += M4(-0.005661811, -0.04283017, 0.030498324, -0.08435541, 0.043476727, 0.23815215, 0.037590496, 0.035874996, -0.0168875, -0.10105766, -0.009729588, -0.01862814, -0.0022954084, -0.10926876, 0.06535011, 0.008848365) * inp_7_2_1; + result5 += M4(0.053151302, -0.20101906, -0.06660011, 0.06758124, 0.06296126, 0.026565203, -0.04855645, 0.10597188, -0.084681444, -0.06543283, -0.039568894, 0.002655453, 0.020315137, 0.09464992, -0.0031060046, -0.016402066) * inp_7_0_2; + result5 += M4(-0.016726276, 0.26303118, -0.052008346, -0.13394625, 0.117321774, 0.22990148, -0.033415716, -0.10480937, 0.0890672, -0.16193764, 0.07916709, 0.15453972, 0.041005164, -0.042691853, 0.038163647, 0.0322729) * inp_7_1_2; + result5 += M4(-0.027041586, -0.03554421, -0.015481368, 0.077423766, 0.030307984, -0.027284933, -0.019532818, 0.018685386, 0.075268984, -0.333208, 0.014211208, -0.00033899894, -0.005806998, 0.03051582, -0.008191966, -0.02886768) * inp_7_2_2; + result6 += M4(-0.014872829, -0.02321414, 0.00489583, 0.01924416, -0.15218875, -0.04618979, 0.07350328, -0.008297021, -0.4236741, -0.05810434, -0.063896775, -0.029798493, -0.15132132, -0.0416993, 0.044762846, -0.104156815) * inp_7_0_0; 
+ result6 += M4(0.022956135, -0.0023403126, -0.047048185, 0.017426884, -0.014484376, -0.03440669, -0.16587481, -0.021950213, -0.0460931, -0.041721676, -0.14123705, -0.02087679, 0.11961106, 0.10613775, 0.12240612, -0.061052103) * inp_7_1_0; + result6 += M4(0.005877017, 0.025301978, 0.05443906, 0.06069619, 0.052617826, -0.10428248, 0.099501655, -0.039056007, -0.17485978, 0.076176606, -0.00089645135, -0.0003865021, 0.047758367, -0.13440448, -0.04847185, -0.029566327) * inp_7_2_0; + result6 += M4(0.007236993, -0.102605596, -0.05802096, 0.036356803, 0.16754487, -0.16840936, 0.16197258, 0.043191057, -0.24089858, -0.0012793159, -0.21263, 0.03682201, 0.17951293, -0.10115861, 0.16826086, -0.18623632) * inp_7_0_1; + result6 += M4(-0.036979362, -0.0062729586, 0.28175145, 0.08105705, -0.24217941, -0.0317539, 0.0013010842, 0.0139259845, -0.048095934, -0.10652068, 0.36398926, -0.009815652, -0.055901844, 0.16276228, -0.32601035, 0.31223118) * inp_7_1_1; + result6 += M4(0.120920025, 0.11975834, -0.11491352, -0.021084255, 0.05748386, -0.08073311, -0.07892196, 0.010723322, 0.023018999, 0.09767648, -0.087181315, -0.008482152, -0.077214934, -0.034772787, 0.026836116, -0.011319538) * inp_7_2_1; + result6 += M4(-0.18652977, 0.07718767, -0.114250064, 0.036094118, -0.12500831, 0.092108615, -0.084842, -0.034727436, -0.04290265, -0.16524102, 0.21705121, -0.0062293923, 0.056003887, -0.020803714, -0.038386784, -0.046298534) * inp_7_0_2; + result6 += M4(-0.031938035, -0.31181517, 0.13145946, -0.012869959, 0.26267383, -0.008760284, -0.027948705, -0.05201039, -0.23893741, 0.15011923, 0.042576697, -0.048681576, -0.02999273, 0.0630577, -0.074624844, 0.052970782) * inp_7_1_2; + result6 += M4(-0.036090072, 0.042140193, 0.05210011, 0.069158755, -0.06686733, -0.02453599, 0.0010439788, -0.009910277, 0.054839734, -0.24132515, -0.20682353, 0.021605317, 0.013303519, -0.03426659, 0.03487262, -0.014674249) * inp_7_2_2; + result7 += M4(-0.02102193, 0.0035500196, 0.016372157, 0.013960896, 0.039535347, 
0.014720616, 0.011953596, -0.028945958, -0.13731441, 0.14999218, 0.019043447, -0.056968886, 0.14384778, 0.077612296, -0.047982696, -0.0096788565) * inp_7_0_0; + result7 += M4(0.025285816, 0.17647319, 0.00147858, -0.06293042, 0.07901491, 0.008939415, 0.005800431, 0.07993876, 0.026949039, -0.13902293, 0.012317744, 0.04698391, 0.12897827, -0.29269418, 0.04207743, -0.037707347) * inp_7_1_0; + result7 += M4(-0.024639513, -0.012540064, 0.000104586776, -0.08256717, -0.08135283, 0.037238933, 0.034043007, 0.061925434, 0.043009643, 0.048277095, -0.014939118, -0.041639775, 0.03691335, -0.06905864, 0.0010431814, 0.16429694) * inp_7_2_0; + result7 += M4(-0.09154465, 0.07758772, 0.030311756, -0.074405074, -0.015287525, 0.019609263, 0.012912235, -0.10051786, 0.13249321, -0.036514886, 0.05441133, 0.105387226, 0.049750704, 0.0023911544, 0.0657314, -0.011020473) * inp_7_0_1; + result7 += M4(0.16349766, 0.21930553, 0.25630805, -0.09835134, -0.064368404, 0.050222535, 0.008777958, -0.015757414, -0.08548143, -0.013160285, -0.0025046426, -0.09314837, -0.1415013, 0.07129445, 0.43791455, -0.012009919) * inp_7_1_1; + result7 += M4(-0.038309116, 0.1674021, 0.048630405, -0.020286104, 0.0031749187, -0.06025599, 0.035346877, 0.19861764, -0.0027232647, 0.02493601, 0.07113758, 0.04787715, 0.0060196156, -0.00339514, 0.014146109, 0.010153284) * inp_7_2_1; + result7 += M4(-0.015669102, 0.065125085, 0.02909808, -0.098975055, -0.036952786, -0.0011229445, -0.005792147, -0.07868097, 0.062462553, -0.06982226, 0.03999935, 0.005694036, 0.010188598, 0.07394883, 0.014077988, -0.04385791) * inp_7_0_2; + result7 += M4(-0.060688168, -0.09090148, 0.09340644, -0.06260428, -0.07208855, -0.024901878, -0.009066221, 0.06757054, -0.04243263, 0.081757195, 0.017139152, -0.16694625, -0.014496033, -0.012155245, 0.040567834, 0.023896586) * inp_7_1_2; + result7 += M4(0.09606695, -0.0035116659, 0.040588666, 0.06580704, -0.0073454226, 0.032742504, -0.016482571, -0.025873497, -0.026671821, -0.043061186, 0.033182908, 
-0.11756651, -0.019081619, -0.02530556, -0.026103446, 0.016588146) * inp_7_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 0), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 0), max(result3, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result4, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result5, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 1), max(result6, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 1), max(result7, V4(0.0))); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-4-ReLU) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND conv2d_3 +//!SAVE conv2d_4 +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, 
input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_3_mul * texelFetch(conv2d_3_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(-0.016542107, -0.012679774, -0.017688308, 0.0048230723); + V4 result1 = V4(0.002919079, -0.0065332386, -0.060906243, -0.015134616); + V4 result2 = V4(-0.01801499, -0.0032619475, -0.0062636537, 0.004419572); + V4 result3 = V4(-0.0059241373, -0.013414753, 0.015237642, -0.008156484); + V4 result4 = V4(0.0011550249, -0.032338362, -0.012596041, -0.009159248); + V4 result5 = V4(-0.04556048, 0.0011225869, -0.021639528, -0.02443676); + V4 result6 = V4(0.024590693, -0.02941249, -0.0149086, -0.023160407); + V4 result7 = V4(0.0007290187, -0.010429996, -0.06336649, -0.011101873); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.050084125, 0.011325267, 0.03905409, 0.28082657, 0.075469054, -0.008193264, 0.034493946, 0.013142418, -0.02122179, -0.027524106, -0.1729417, -0.08972137, 0.07738356, 0.009138024, 0.0071516414, 0.1854231) * inp_0_0_0; + result0 += M4(-0.01855109, 0.024444751, -0.070182405, 0.058751844, -0.08322817, -0.021590779, 
-0.1341947, 0.3573937, -0.108749315, 0.041122083, 0.10334136, -0.14147314, -0.08528963, -0.0050656125, 0.045218155, -0.4296871) * inp_0_1_0; + result0 += M4(0.0035430503, 0.018665286, 0.015904365, 0.03131911, -0.046010375, 0.059393555, 0.21222147, -0.16424854, -0.13312043, -0.07158205, -0.18523844, -0.52106565, 0.07094656, 0.0021211952, -0.06564686, 0.16554663) * inp_0_2_0; + result0 += M4(0.017739372, 0.0023111654, -0.1251821, -0.19510305, 0.08178124, -0.0031667405, 0.0593662, 0.15396512, -0.015187601, -0.028620917, -0.290968, -0.056516875, 0.0332856, 0.010859935, -0.080543876, -0.0037281413) * inp_0_0_1; + result0 += M4(-0.025135472, 0.023864137, -0.057448756, -0.03442884, 0.11550942, -0.10850868, 0.29050592, -0.005255575, -0.03386252, 0.006812388, -0.353441, 0.07509677, -0.096932195, -0.00842387, 0.10004468, -0.036403757) * inp_0_1_1; + result0 += M4(0.009376374, 0.0029212954, -0.070137, -0.2663141, 0.14669581, 0.23949608, 0.034024604, 0.08857758, -0.23379914, -0.15621044, -0.0400368, -0.54812866, 0.013621858, 0.02337291, -0.06899478, -0.06675567) * inp_0_2_1; + result0 += M4(0.06399371, 0.010321662, 0.009413287, 0.08853818, 0.06916661, 0.02321199, -0.18504642, 0.17936738, -0.07753787, -0.041417316, 0.0033812264, -0.16644792, 0.0023637733, -0.012235416, -0.08722863, 0.10052439) * inp_0_0_2; + result0 += M4(-0.07459823, 0.030876542, 0.07654594, 0.13852786, -0.1404074, -0.053831626, 0.22613738, 0.20265292, -0.124435894, -0.01632648, -0.14340241, 0.04823094, 0.089095764, 0.033899773, 0.02491223, 0.20127468) * inp_0_1_2; + result0 += M4(0.04396496, 0.011924869, -0.029322898, 0.04432441, 0.06990681, 0.06408676, -0.05587314, 0.10004018, 0.06642851, -0.014157152, -0.07679483, -0.18803637, -0.07471932, -0.01494545, 0.038381, -0.1822777) * inp_0_2_2; + result1 += M4(-0.017871566, -0.041596025, 0.32224208, 0.016512657, 0.00508703, 0.048751228, 0.12879516, 0.045008127, 0.09034886, -0.038664747, 0.10238643, -0.066557266, -0.02791805, -0.054194644, 0.086112715, -0.031732492) 
* inp_0_0_0; + result1 += M4(-0.003704424, -0.020565212, -0.3136572, -0.037200455, -0.1784549, -0.09110337, 0.029692614, -0.09057145, -0.010382863, -0.07367683, -0.087211154, -0.10693934, -0.0014508942, 0.09694302, -0.15624073, -0.01370392) * inp_0_1_0; + result1 += M4(-0.008113902, -0.0014286042, 0.42281562, -0.045003124, 0.041234497, 0.062886186, 0.122424535, 0.02314279, -0.001083323, -0.01264907, 0.009040765, -0.01429229, -0.00010829072, -0.016989667, 0.14959723, 0.006822573) * inp_0_2_0; + result1 += M4(-0.0066052354, -0.007328133, -0.05545804, -0.028420491, -0.062478587, -0.031995762, -0.14429249, -0.116246946, 0.026747463, -0.041652326, -0.04969374, -0.0667569, 0.05258227, 0.018456772, -0.18474315, 0.013049629) * inp_0_0_1; + result1 += M4(-0.0037995127, -0.03843067, 0.10581279, 0.013679892, -0.020294208, 0.13637277, 0.02544319, 0.15271997, 0.0071817287, -0.04525665, 0.23252755, -0.10723104, 0.01890405, -0.03340116, 0.16292317, 0.023409538) * inp_0_1_1; + result1 += M4(0.006661697, -0.0094777, -0.064126715, 0.0017646403, -0.002192948, -0.030412296, 0.19438899, -0.011306443, -0.00104239, -0.052301046, -0.18872653, 0.024933362, 0.0031348662, 0.023994213, -0.2035901, -0.017689131) * inp_0_2_1; + result1 += M4(0.018339697, 0.009256576, 0.22590935, -0.06576637, 0.037864428, 0.009654998, -0.005438166, 0.0059928983, 0.008466759, 0.003179748, -0.022330668, -0.04849996, 0.0022550432, -0.01399647, -0.02096306, -0.041134126) * inp_0_0_2; + result1 += M4(0.006801038, 0.011600131, -0.22520253, -0.03621297, 0.0069761374, -0.0030935777, -0.036739305, -0.0013867997, -0.0103504, -0.007979353, 0.027838033, 0.0050616497, 0.005577895, 0.03348561, 0.014656373, -0.0050173285) * inp_0_1_2; + result1 += M4(0.00035079816, 0.0030824412, 0.28137797, 0.00095397764, -0.0058895512, 0.025194025, -0.033050053, -0.004739523, -0.0026151284, 0.018386485, 0.0008312886, -0.020002274, 0.0004895481, -0.0016054516, -0.034663394, 0.013620786) * inp_0_2_2; + result2 += M4(-0.025834234, 0.004361098, 
0.011241019, -0.018341137, 0.0022237708, -0.000808556, -0.019275058, 0.024911843, -0.0021157733, 0.011792845, 0.018057384, -0.010296266, -0.0074022426, 0.0032578576, -0.00897053, -0.012268648) * inp_0_0_0; + result2 += M4(-0.0594218, -0.027025925, 0.014039617, -0.02184239, -0.09020728, -0.0022100045, 0.0042070947, -0.030025607, -0.033037934, -0.035481334, 0.022689689, -0.02616385, -0.012762042, 0.041177, -0.002869835, 0.0006208272) * inp_0_1_0; + result2 += M4(-0.012530844, -0.02094423, -0.00437871, -0.0138727315, 0.060289416, 0.06659194, -0.10565998, 0.009702638, -0.07174413, -0.040633556, 0.0386967, 0.0041002557, 0.03822132, -0.017502738, -0.0052290238, -0.00036737192) * inp_0_2_0; + result2 += M4(-0.028754015, 0.016205607, 0.005112095, 0.0239719, -0.08401191, -0.037812985, -0.039320022, 0.049222887, -0.0021033597, -0.048998397, 0.0076606683, 0.01361554, -0.043039523, -0.027094271, -0.005291174, -0.010883237) * inp_0_0_1; + result2 += M4(0.01627023, -0.00762941, -0.00080632005, 0.021211404, 0.20159216, 0.17768899, 0.21231668, 0.24435699, -0.093186125, -0.042097103, 0.061804675, 0.101889156, 0.09773501, -0.03514878, -0.0011517085, 0.031506952) * inp_0_1_1; + result2 += M4(-0.040042855, -0.015471295, -0.015428241, 0.039255697, 0.030589487, -0.07444299, -0.07285818, -0.038294997, -0.054270312, -0.02890017, -0.034612767, 0.03797289, -0.036023382, 0.021515746, -0.0041990154, 0.01738835) * inp_0_2_1; + result2 += M4(-0.12061757, -0.009343633, -0.00081862457, -0.008557594, 0.0157209, 0.07520143, -0.0057730125, -0.037164804, -0.023208179, -0.026747117, 0.02937458, -0.02085094, -0.019180479, -0.001153464, -0.0123294825, 0.00057600276) * inp_0_0_2; + result2 += M4(-0.07491442, 0.0012998895, -0.003791768, -0.0018487296, 0.011851669, -0.04956705, -0.04037895, 0.0035907337, 0.011612738, 0.051951934, 0.02765865, 0.03238063, -0.024823004, 0.031854708, 0.0016208817, 0.010899303) * inp_0_1_2; + result2 += M4(0.03014621, -0.042644065, 0.006469791, -0.017715499, -0.015943421, 
0.02756462, -0.0066749803, 0.038881935, -0.020365236, -0.010369052, 0.016093656, 0.0077305282, 0.049845703, -0.030355452, -0.0064737713, -0.018258851) * inp_0_2_2; + result3 += M4(-0.078773834, -0.016008634, -0.007935509, -0.001396128, 0.054233056, 0.0035843593, 0.015553826, 0.0026222363, -0.05675569, 0.006963015, -0.016199075, -0.007500399, 0.04218557, -0.009065071, -0.0028575014, 0.0016697721) * inp_0_0_0; + result3 += M4(-0.096383415, 0.010926693, -0.028683553, -0.007648038, -0.024882574, 0.023757296, 0.038190883, 0.0096803475, -0.06872187, -0.09900396, 0.022616332, 0.01139855, -0.21759689, 0.027885599, 0.022720288, -0.0060495557) * inp_0_1_0; + result3 += M4(-0.05951591, 0.026032036, -0.009158509, 0.0063456916, -0.024268983, -0.06693157, 0.04884325, 0.02376814, -0.08697725, -0.025094235, 0.008715934, -0.014071452, -0.038649008, -0.021583658, 0.0088210525, 0.0007642979) * inp_0_2_0; + result3 += M4(0.05229015, 0.032827277, 0.004427977, 0.01396573, 0.05961745, 0.008633765, 0.014677919, -0.013303794, 0.011513263, -0.051826224, -0.029732209, 0.011103, 0.0019684895, 0.027300525, 0.01646766, 0.0023945945) * inp_0_0_1; + result3 += M4(0.026070546, -0.113941304, -0.0002405115, 0.002818134, 0.31538942, 0.014483092, 0.025939906, -0.035604917, 0.03252292, -0.0068924283, 0.035239175, 0.0012859845, 0.16931184, -0.09490419, 0.06653527, -0.015014678) * inp_0_1_1; + result3 += M4(0.03613594, -0.036518693, 0.004710271, 0.0033459312, 0.056379013, 0.052322853, -0.07846089, -0.25096613, -0.006002274, -0.19779839, 0.010680657, -0.0020964164, 0.052844316, 0.047519457, 0.009496485, 0.010146979) * inp_0_2_1; + result3 += M4(-0.058442213, -0.018870808, 0.0011031982, -0.0015571571, -0.0010916296, -0.0033068894, 0.027714644, -0.015485217, -0.059925172, -0.0061753164, 0.0014754878, -0.009641381, -0.05915063, 0.010575672, -0.0035367615, 0.0002553907) * inp_0_0_2; + result3 += M4(-0.10965299, 0.03346314, 0.0015841913, -0.012393825, 0.10672976, -0.052294686, -0.053476516, -0.052087646, 
0.033924025, -0.049459033, -0.0037261224, -0.055700976, -0.027407493, 0.013178274, -0.021325173, -0.0065716277) * inp_0_1_2; + result3 += M4(-0.023626707, -0.054254208, -0.0025664438, 0.057461217, -0.06782892, 0.060140558, 0.032029916, -2.0816886, -0.04932835, -0.041099142, 0.018772643, 0.012928383, -0.04103815, -0.03920651, -0.020854194, 0.015807824) * inp_0_2_2; + result4 += M4(-0.01289379, -0.0070452425, 0.007505676, 0.008018532, 0.00627048, 0.017560653, -0.06317347, -0.008233337, 0.02157538, 0.033503562, -0.02323948, 0.006499736, -0.00054582214, 0.023411544, -0.002362799, -0.005648069) * inp_0_0_0; + result4 += M4(-0.0050366605, -0.012969378, -0.018873924, -0.01141787, 0.039177284, 0.052830983, 0.13202119, -0.0842506, -0.039367992, -0.09508656, -0.019069986, 0.047900178, -0.001291695, -0.0015365388, 0.0045803576, -0.024888445) * inp_0_1_0; + result4 += M4(-0.0032193027, 0.004804373, -0.01857103, 0.004124962, 0.04113418, -0.029371548, -0.017747998, -0.08516284, 0.0012016459, -0.014943191, -0.07220075, 0.03819413, -0.006938766, -0.0014203513, 0.009422985, 0.004410304) * inp_0_2_0; + result4 += M4(0.042007565, 0.031422462, -0.035660017, 0.04698539, 0.015569978, 0.015705317, 0.081193365, -0.04071247, -0.023311192, -0.019290227, 0.039105233, -0.03195655, 0.0017112943, 0.043241616, 0.023499122, -0.032004416) * inp_0_0_1; + result4 += M4(0.015962446, 0.015347915, -0.051607084, 0.005601069, 0.32964543, 0.12579475, 0.04610197, 6.200917e-05, 0.0716747, 0.023456257, -0.11930905, -0.030191997, 0.027482346, -0.03263236, 0.023119524, 0.004183345) * inp_0_1_1; + result4 += M4(0.03917032, 0.0056261914, -0.05610095, 0.009960206, 0.015520569, 0.06267059, 0.16553426, -0.02010012, -0.024812296, -0.020280052, -0.13751085, -0.013581094, 0.004869674, 0.014552553, -0.07951488, 0.009768775) * inp_0_2_1; + result4 += M4(-0.014322015, 0.08621455, -0.04344676, 0.009875786, 0.0026412352, -0.0077130427, 0.020648358, -0.016539896, 0.0036327185, -0.015483406, -0.0538694, 0.0053454577, 
-0.019284973, -0.054858893, -0.01628997, -0.0070626675) * inp_0_0_2; + result4 += M4(-0.016621089, 0.0081797615, -0.10295796, -0.005728805, 0.05631096, -0.086629316, -0.017370053, -0.042710636, 0.008218702, 0.13222654, 0.10951487, 0.017404452, -0.017342474, 0.043236215, -0.018527396, -0.03745143) * inp_0_1_2; + result4 += M4(-0.022747595, 0.06096653, -0.059444312, 0.0038460172, 0.01158954, 0.014732194, 0.02134244, 0.051906865, -0.0296352, 0.026961008, -0.053348456, -0.03643577, 0.0074761016, -0.028639847, 0.107226305, -0.019053055) * inp_0_2_2; + result5 += M4(-0.058057223, -0.039166585, 0.016640013, 0.015895281, -0.008452976, 0.017194986, 0.012341754, -0.015883062, 0.06288335, -0.047669325, -0.03428946, -0.025943978, -0.086632036, 0.024514856, 0.012214399, -0.0005448519) * inp_0_0_0; + result5 += M4(0.108249374, 0.016742574, 0.027921552, 0.018645188, 0.04553082, 0.059700355, -0.20957518, 0.1510889, -0.18399017, -0.039760534, -0.14547798, -0.16409859, 0.15494652, -0.014586802, 0.0361119, -0.021014791) * inp_0_1_0; + result5 += M4(-0.0333254, -0.009196911, -0.006961476, 0.021157758, -0.06481886, 0.0057613165, 0.12950577, -0.061620865, -0.14778855, -0.029510964, -0.029036159, 0.05396873, -0.021684581, -0.01220097, 0.012617503, 0.035705253) * inp_0_2_0; + result5 += M4(0.072661586, -0.021702189, -0.04158937, -0.012955859, 0.21056259, 0.02581396, -0.012816757, -0.04235959, -0.14589727, 0.043966237, -0.004286118, 0.020072805, -0.06324599, -0.026485743, 0.013703415, -0.0018785495) * inp_0_0_1; + result5 += M4(0.11000013, -0.041045997, -0.032035988, 0.007968857, 0.32520214, -0.15416919, 0.22168629, 0.31035063, -0.8326168, -0.05459754, -0.12952703, -0.18654208, 0.06105866, 0.041240346, -0.055467404, -0.026087457) * inp_0_1_1; + result5 += M4(-0.028301246, -0.056161396, -0.004700935, -0.028534684, 0.06380836, 0.21001332, 0.034014743, -0.11567242, 0.1396275, -0.19471501, -0.33776173, -0.023274034, -0.1089506, -0.029636431, 0.038700502, 0.00016737756) * inp_0_2_1; + result5 
+= M4(-0.024325654, -0.011601796, -0.096013404, 0.012228482, 0.10135071, 0.02378393, -0.01687777, -0.0575494, -0.16002157, -0.04933964, -0.05483927, -0.037313033, 0.050847594, 0.0064098234, -0.021452649, -0.0054918393) * inp_0_0_2; + result5 += M4(0.015146107, -0.09046074, -0.0039179586, -0.033066064, -0.3870267, 0.11426056, 0.14134352, -0.051078025, -0.20435314, 0.005509383, -0.20035794, -0.021291165, -0.0027239271, -0.05983914, 0.05280896, 0.04786474) * inp_0_1_2; + result5 += M4(-0.06103365, -0.032689698, 0.0016097855, 0.02102138, 0.2968155, -0.062097516, -0.104581796, 0.041469987, -0.12192299, -0.0065730982, -0.092781015, 0.0981968, 0.011944244, 0.013649742, 0.022564681, -0.021659542) * inp_0_2_2; + result6 += M4(0.11077963, 0.0011563837, -0.020882158, -0.0020795912, -0.0786811, 0.014214256, 0.015662903, 0.016882181, -0.30587372, 0.033704683, 0.012865511, 0.014549307, 0.04320479, 0.020851586, -0.024538603, -9.427432e-05) * inp_0_0_0; + result6 += M4(0.040177345, 0.0134358285, -0.029296411, 0.067432664, 0.19949926, -0.02194099, -0.02440344, 0.08097038, -0.041496076, 0.04633682, 0.062154904, -0.05480727, -0.24887241, 0.05525719, 0.07487823, 0.04832519) * inp_0_1_0; + result6 += M4(0.20286922, 0.0057481565, -0.016141923, 0.035026092, -0.050194476, 0.063432954, 0.13011551, 0.0523196, -0.092645906, 0.02987317, 0.05786584, -0.15279952, 0.09147116, 0.0019088131, 0.0058786185, 0.010905708) * inp_0_2_0; + result6 += M4(0.22396933, -0.03834644, 0.02748083, -0.06860154, 0.12852079, -0.04496647, 0.0844889, 0.030927813, -0.33666012, -0.005711643, 0.03257282, -0.03837854, -0.0011762482, -0.025935419, -0.013378392, -0.015012171) * inp_0_0_1; + result6 += M4(-0.18189368, -0.15784307, 0.025255619, 0.029570572, 0.11988644, 0.17366901, 0.2352522, 0.16982158, 0.09998576, -0.06848574, 0.055721313, -0.002694097, -0.06832549, -0.20364797, 0.090322375, 0.0009486827) * inp_0_1_1; + result6 += M4(-0.021874918, -0.021511186, -0.007370704, 0.0023035852, -0.058854107, -0.0037493664, 
0.026673635, -0.0057249884, 0.011881192, -0.1349753, -0.021164447, -0.14210021, 0.007355388, 0.011178779, 0.026148302, 0.0056277495) * inp_0_2_1; + result6 += M4(0.25154752, 0.024832219, 0.006589518, -0.0057187276, 0.04539431, 0.037196115, 0.016173976, 0.0051059304, -0.17792349, 0.011545101, 0.0026983162, 0.04348514, -0.013908699, -0.010357224, -0.025162924, -0.02410551) * inp_0_0_2; + result6 += M4(-0.2870902, 0.0020163858, 0.021209292, 0.025311703, 0.099115975, -0.052700743, -0.053314462, -0.03868319, 0.09428621, 0.017449796, 0.024728855, 0.008780251, 0.049800154, -0.00546953, 0.0131761655, 0.038137753) * inp_0_1_2; + result6 += M4(0.10019241, 0.026749019, 0.021972235, -0.0031393464, -0.07198951, -0.037454784, -0.0085364105, 0.027606621, -0.10679027, 0.035117567, -0.0023179913, -0.06936379, -0.07426625, -0.06542811, -0.0021566902, 0.0019493703) * inp_0_2_2; + result7 += M4(0.016778281, 0.027244873, 0.1785118, -0.028542737, -0.02158157, 0.0018936591, 0.044226184, 0.005454867, 0.006133459, -0.0022196944, 0.05522412, 0.0016904869, 0.010006922, 0.0077003897, 0.14999124, 0.018117785) * inp_0_0_0; + result7 += M4(0.0027752982, -0.0011517212, -0.11453347, -0.006889162, 0.0013214573, 0.014642321, -0.009536182, 0.06629019, 0.014946253, -0.01821599, -0.036175184, -0.027156498, -0.008841768, 0.042829454, -0.012587802, -0.038321946) * inp_0_1_0; + result7 += M4(0.0029785964, 0.03305846, 0.20846348, -0.016032532, 0.016099088, 0.0047752312, 0.21619861, 0.009659423, -0.013535722, 0.03346688, -0.014527106, -0.124695465, -0.00046251842, 0.012625537, 0.12431096, -0.00020890926) * inp_0_2_0; + result7 += M4(0.0024013943, -0.052964713, -0.09795327, 0.04927752, -0.00896287, -0.033386085, -0.17224927, 0.022460157, -0.035059433, -0.027771607, -0.061376143, 0.009803232, 0.042268053, -0.008064652, -0.021386102, -0.019951392) * inp_0_0_1; + result7 += M4(0.0030796481, -0.025629131, 0.060133893, 0.02577895, 0.16429196, -0.061604384, 0.27389398, 0.24194263, -0.11225831, -0.0100386245, 
0.08777596, 0.11811642, -0.0058315797, -0.049185995, -0.08956391, -0.06419162) * inp_0_1_1; + result7 += M4(-0.0013952986, -0.014312465, 0.0081506325, 0.060935892, -0.004787767, 0.026864463, -0.037531868, -0.086743966, 0.019121658, -0.17381035, -0.35539955, 0.059250716, -0.0075980066, -0.0065173106, 0.034874164, -0.047306087) * inp_0_2_1; + result7 += M4(-0.003411818, 0.03353024, 0.24050865, -0.010094028, 0.011867048, 0.014723875, -0.019341152, 0.016229203, -0.008229837, 0.0034855935, 0.06604283, -0.0018945972, -0.009332319, -0.0042675044, -0.007325845, -0.014454763) * inp_0_0_2; + result7 += M4(0.0003701205, 0.021963142, -0.26295194, 0.075434074, -0.026853768, -0.0359465, 0.037549775, -0.107349336, 0.007897477, 0.077532426, 0.095322214, 0.014742816, 0.017885676, 0.039552286, -0.07062351, 0.06477598) * inp_0_1_2; + result7 += M4(-0.0053137187, 0.0039010711, 0.26665658, 0.0011285796, 0.0138741415, 0.069002256, -0.03234969, -0.03120307, -0.0027824824, 0.030501414, 0.13849977, -0.005607998, 0.010689414, 0.026879018, -0.04614842, 0.012998317) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.069759585, -0.01573197, -0.019362776, 0.23598818, -0.04912704, -0.013924066, 0.04628924, -0.12344715, -0.020282255, -0.021566777, -0.048429627, -0.34257057, -0.08174711, -0.0009847737, 0.06897319, 0.019713469) * inp_1_0_0; + result0 += M4(-0.029824898, -0.0070922943, 0.048803955, -0.10334113, 0.024044944, 0.005320066, 0.09797858, -0.20305471, 
0.059991308, -0.00934283, -0.098593146, 0.25650647, 0.001406327, -0.024399182, -0.042362742, -0.31486136) * inp_1_1_0; + result0 += M4(0.07022933, 0.022159398, -0.020647798, 0.6392809, 0.031926244, -0.044625495, -0.19889951, -0.19427465, -0.011934095, -0.002966804, -0.089966506, 0.04981931, -0.019965818, 0.0019160038, -0.07461672, -0.14302221) * inp_1_2_0; + result0 += M4(0.027679078, -0.014971468, 0.012308202, -0.081432745, 0.11803643, 0.0120128, -0.16855171, 0.25168505, -0.12739635, -0.020168182, 0.0064175962, -0.10148978, 0.02268503, 0.05391281, 0.05604633, 0.10306229) * inp_1_0_1; + result0 += M4(0.030125475, 0.027856808, 0.15825862, 0.08692091, -0.25286105, -0.015990704, -0.06339778, -0.008698826, 0.07821253, 0.022914948, -0.037823234, -0.18075646, -0.09930718, -0.01728723, -0.068361096, -0.06910528) * inp_1_1_1; + result0 += M4(0.08636643, 0.10044524, -0.012154737, 0.23643473, 0.09127728, 0.06186279, -0.26712304, 0.24551098, -0.0482596, -0.022057222, 0.047239028, -0.09296678, -0.0068342444, 0.09386074, -0.1275545, 0.20772336) * inp_1_2_1; + result0 += M4(-0.074230246, -0.008949588, -0.0043404317, -0.28251222, 0.076502964, 0.0046890667, -0.25128037, 0.06507089, -0.066883706, -0.035244968, -0.013487795, -0.20238803, 0.104889385, -0.006779997, -0.05340542, -0.11138533) * inp_1_0_2; + result0 += M4(0.12301065, -0.008550837, -0.0516488, 0.19054751, -0.17213024, -0.013116637, 0.095610835, -0.44067273, 0.013825274, 0.02581849, -0.037420906, -0.10775812, 0.13375175, -0.063953236, 0.015891433, -0.3149349) * inp_1_1_2; + result0 += M4(-0.067207485, 0.031286363, 0.02840882, -0.40900674, -0.0082170395, 0.021382434, -0.03838344, -0.19516744, -0.036277033, 0.00034281323, -0.07211101, -0.2361534, -0.03302797, 0.01692043, 0.114838436, -0.11760255) * inp_1_2_2; + result1 += M4(-0.029706296, -0.05248761, -0.33545738, -0.12596764, -0.015084135, -0.052900173, -0.21451795, -0.09247048, 0.09419264, 0.0156194465, 0.03142249, -0.038329862, 0.07068911, 0.019921113, 0.04984978, 
0.1038811) * inp_1_0_0; + result1 += M4(-0.012716611, -0.04260189, -0.25355944, -0.018495861, 0.009794862, 0.06644613, -0.14286776, 0.09717802, 0.016163072, -0.11943416, -0.28763446, -0.07038638, 4.5881323e-05, 0.08324362, -0.026893144, 0.03285746) * inp_1_1_0; + result1 += M4(-0.008414961, -0.043285243, -0.08509111, -0.00172135, -0.00911804, -0.11219939, -0.16589727, -0.002465509, -0.0068474705, -0.04103227, -0.62504536, -0.014356414, -0.014680181, -0.015523176, 0.4186634, 0.0031351268) * inp_1_2_0; + result1 += M4(-0.01396166, 0.024831569, -0.089373894, -0.1036001, -0.03851702, -0.067040466, -0.1321764, -0.111300245, 0.031170268, -0.040760603, -0.097344846, -0.052310213, -0.0155425845, 0.07169252, -0.08741599, 0.13948059) * inp_1_0_1; + result1 += M4(-0.004784282, -0.11388955, -0.3687792, -0.0014438336, 0.008865337, 0.06712148, -0.11676311, 0.010888562, 0.038391903, -0.0058718063, 0.18395917, -0.04148364, -0.012247986, -0.025193544, -0.41034153, -0.0660706) * inp_1_1_1; + result1 += M4(-0.007774285, -0.011684829, -0.1261301, -0.008266488, 0.004665687, 0.01296363, -0.07926099, 0.00039324735, -0.003218291, -0.03723256, -0.023750132, 0.01778312, -0.008515377, 0.042133063, -0.22591662, -0.02799224) * inp_1_2_1; + result1 += M4(0.0009856308, -0.04092987, -0.042002074, -0.0023758663, 0.005487486, 0.014913833, -0.04651767, 0.023761598, -0.01015791, -0.01038192, -0.0594634, -0.056171156, -0.015122081, 0.009180416, 0.03187551, 0.016158033) * inp_1_0_2; + result1 += M4(-0.006504527, 0.0012869429, -0.040399574, -0.055316262, 0.002899159, -0.006958559, -0.06554664, -0.009679741, -0.010512587, -0.015364673, -0.026660308, 0.0017851419, -0.0008710558, -0.010404262, 0.11519802, -0.01665407) * inp_1_1_2; + result1 += M4(-0.007862216, 0.0003762563, -0.036025226, 0.027081454, -0.0072422125, -0.0019626904, -0.07563435, -0.002883421, 0.0001578607, -6.29984e-05, -0.1759683, -0.026070148, 0.0032333322, -0.039243754, 0.10713396, 0.014173934) * inp_1_2_2; + result2 += M4(-0.018290471, 
-0.008456612, 0.014321202, -0.015954705, 0.04432792, 0.049570207, 0.015845405, 0.002891528, -0.0062128846, -0.019229969, -0.0013510644, 0.0030160812, 0.17636502, 0.0477721, 0.008577081, -0.023127135) * inp_1_0_0; + result2 += M4(-0.068967335, -0.067173734, 0.020672966, -0.016111633, 0.0168461, 0.10798353, -0.049942844, 0.032419384, -0.013251344, -0.043575652, 0.0065951026, 0.015024389, -0.03153569, -0.05764462, -0.004872319, -0.06236922) * inp_1_1_0; + result2 += M4(-0.049503498, 0.018817697, -0.0205654, 0.0070158853, -0.0017866828, -0.055189367, 0.0030540507, -0.013144511, -0.07728904, 0.0059341067, 0.024631834, -0.00017130763, 0.09031055, -0.008405811, 0.00959548, 0.018110791) * inp_1_2_0; + result2 += M4(-0.031645045, -0.007563045, 0.04191059, 0.0135494415, -0.14752215, -0.032768063, -0.015438905, 0.013153754, -0.011449229, -0.02259906, 0.020613346, 0.0066561773, -0.044300422, -0.0073168925, -0.057878617, 0.002732759) * inp_1_0_1; + result2 += M4(-0.18678784, -0.09959061, 0.011212419, 0.05955596, 0.026348552, 0.16489275, 0.31075048, 0.073002934, -0.182382, -0.09003974, 0.06571621, 0.06007381, 0.1871938, -0.0865607, 0.044542335, 0.023401545) * inp_1_1_1; + result2 += M4(-0.013724682, -0.009321084, 0.011152485, -0.0033966685, -0.043078344, 0.036416885, 0.015623447, 0.055957038, -0.01849877, -0.072857074, -0.01046809, 0.026011404, -0.06919331, 0.091046415, -0.04164453, 0.046394613) * inp_1_2_1; + result2 += M4(0.0012422197, -0.002631582, 0.003743998, 0.015123382, -0.015633993, -0.035724614, 0.026706185, -0.017725002, -0.06825478, -0.00901042, 0.00061856484, -0.0063771904, 0.13396682, -0.033139773, -0.009686248, -0.03838249) * inp_1_0_2; + result2 += M4(-0.09512716, -0.08837415, 0.018194735, 0.008871673, 0.062261507, -0.065781176, -0.055187, 0.027707918, -0.0053967116, -0.044796087, 0.010361364, -0.008945669, -0.061361406, 0.008197509, 0.047274556, -0.005719721) * inp_1_1_2; + result2 += M4(0.029693535, -0.017528165, -0.007855424, -0.0074159503, -0.01266465, 
0.025099238, -0.006872992, 0.019218933, -0.04778084, -0.06347614, 0.03295207, 0.00090956315, 0.02077793, -0.062143005, -0.034944285, -0.024958752) * inp_1_2_2; + result3 += M4(-0.09974788, 0.020605205, -0.0024725075, 0.0028876564, 0.038388405, -0.020979702, 0.017852712, -0.0020744698, -0.008816921, 0.038277615, 0.0064083883, -0.004805702, -0.021744244, -0.013467642, 0.014029597, -0.00802205) * inp_1_0_0; + result3 += M4(-0.29090038, -0.07220626, 0.003039927, 0.00031529332, 0.081712596, -0.053949203, 0.0560472, -0.019879429, 0.04487666, -0.07840531, 0.022384407, 0.0037922375, -0.12139882, 0.058006596, -0.07355735, -0.002001135) * inp_1_1_0; + result3 += M4(-0.12707077, 0.0029293671, 0.002925028, -0.011142545, 0.0012060722, -0.0059201643, -0.022559587, 0.0047758655, -0.012047067, 0.006398406, -0.00014037399, -0.007924496, -0.08267729, 0.03089181, -0.011231169, 0.010514431) * inp_1_2_0; + result3 += M4(-0.016742278, -0.007793414, -0.020882057, -0.0062197475, -0.029902719, -0.054846365, -0.027987752, 0.0056060706, -0.034713805, -0.047086217, 0.004880524, 0.01464124, -0.012823535, 0.025803465, -0.031325895, -0.0010646778) * inp_1_0_1; + result3 += M4(-0.27933434, -0.14838761, -0.11952433, 0.0036372135, 0.058186408, 0.06696874, -0.06479991, -0.010031049, -0.13002986, -0.01275557, 0.016198829, -0.009882386, 0.089558944, -0.079711266, -0.08013397, 0.065905005) * inp_1_1_1; + result3 += M4(0.023724329, 0.03271399, 0.0075594573, 0.015919626, 0.01905627, 0.036951147, 0.029244334, -0.023265809, -0.11982203, -0.07621513, -0.007814278, 0.024171054, 0.11532883, 0.05751838, 0.04637661, 0.017592529) * inp_1_2_1; + result3 += M4(-0.03479878, -0.022777118, 0.012533797, 0.007029099, -0.0046606115, -0.027692024, 0.039454233, 0.0031962066, -0.07223084, 0.023742193, 0.011920917, -0.0152232265, -0.037636317, 0.03351182, 0.003346064, -0.004711423) * inp_1_0_2; + result3 += M4(-0.15771055, -0.076403245, 0.013966556, 0.0042798854, 0.05392789, -0.10186627, -0.021976942, 0.013428745, 
0.0008405691, -0.0656948, 0.0028464287, 0.030519322, -0.16605647, 0.1102983, 0.04253903, -0.029273903) * inp_1_1_2; + result3 += M4(-0.024137326, -0.008258713, -0.011959554, -0.65658355, 0.05886992, 0.0021063786, -0.0040613245, -1.4775715, -0.004617782, -0.01655899, 0.044767484, -0.44391325, -0.030074531, -0.100835845, -0.00067998114, -0.6768125) * inp_1_2_2; + result4 += M4(-0.0019363825, -0.043588802, 0.054561615, 0.0024997436, -0.016966254, -0.034322012, 0.1413046, -0.018009556, -0.001101635, -0.02704994, -0.07043372, -0.02230024, -0.0015380388, 0.005272876, -0.037090015, 0.006166373) * inp_1_0_0; + result4 += M4(-0.0050472687, -0.07574829, -0.15483479, 0.043677237, 0.023145339, -0.0086202165, -0.0049951524, -0.0060210736, -0.017921211, -0.05777129, -0.048439827, 0.026267895, -0.100406535, -0.061962795, 0.09865183, 0.055020455) * inp_1_1_0; + result4 += M4(-0.0055961697, -0.04754439, -0.0017440156, -0.005986155, -0.030325167, -0.021534791, 0.084809996, 0.023918811, 0.017858705, -0.022967286, -0.095544815, 0.0074437135, 0.019627845, -0.019305013, -0.01984569, 0.040462747) * inp_1_2_0; + result4 += M4(0.048991658, -0.13385503, -0.046927042, 0.016631545, -0.029064609, 0.0006330952, 0.008242063, 0.028124796, 0.0060957284, -0.040064096, -0.032486413, 0.013428372, -0.08499794, -0.006317721, -0.12359131, 0.058705498) * inp_1_0_1; + result4 += M4(-0.006022805, -0.1837393, -0.12978028, -0.0013139789, -0.055542786, -0.13720812, 0.23876561, -0.053139366, 0.15966879, 0.008683597, -0.14635624, 0.0126981875, 0.32272208, 0.06236775, -0.10698612, 0.14063711) * inp_1_1_1; + result4 += M4(-0.009701131, -0.03646291, -0.037340086, 0.039884623, 0.009189008, -0.0064634443, -0.0565141, -0.0011173718, -0.019694382, -0.04803177, 0.069370545, 0.050015707, -0.05899881, -0.003470957, -0.20582588, 0.05659334) * inp_1_2_1; + result4 += M4(0.013319271, -0.21169075, -0.040460724, -0.007307999, 0.025113398, -0.13337378, 0.062859945, -0.014940971, 0.009030944, -0.015980482, -0.052400064, 
-0.005603718, -0.015142185, 0.105756275, -0.005185126, 0.03659301) * inp_1_0_2; + result4 += M4(0.029834945, -0.24019423, -0.059754893, 0.01608155, -0.050190847, -0.07629842, -0.036545094, -0.033685338, -0.04057415, -0.1007561, -0.03597081, 0.02017857, 0.021963967, 0.15769747, 0.012509617, 0.071566634) * inp_1_1_2; + result4 += M4(0.0071591125, -0.081908636, -0.23059505, 0.0007022638, 0.0049481234, 0.06784498, 0.14878985, 0.02515274, 0.015787132, -0.054703876, -0.17242855, -0.0075456346, -0.05905788, -0.035373684, -0.027502216, -0.050735876) * inp_1_2_2; + result5 += M4(0.1399075, -0.011689272, -0.019618753, 0.07614495, 0.09006709, 0.08453059, 0.013071986, 0.04905171, -0.046357352, -0.037395712, -0.04851694, -0.031871088, -0.22293495, -0.09758526, 0.027082501, -0.07850271) * inp_1_0_0; + result5 += M4(0.12827924, -0.07307409, 0.009706256, 0.037915763, -0.023452701, -0.056642782, 0.09213479, -0.16854583, -0.010336425, -0.019925116, -0.019452507, -0.027321696, 0.15007468, 0.028512416, -0.14916861, 0.060340323) * inp_1_1_0; + result5 += M4(0.0071526146, -0.012299189, 0.01801723, -0.05339408, 0.18717697, 0.0010336664, -0.035712525, 0.06225803, -0.06730897, -0.048067704, -0.01911119, -0.025771273, 0.0284756, -0.01424645, -0.049994357, 0.07865) * inp_1_2_0; + result5 += M4(0.054180637, -0.030158587, 0.028763872, 0.011243639, -0.11195821, 0.048051868, -0.036910217, -0.121535614, 0.034089345, -0.010673306, -0.118964724, 0.006967483, -0.43662754, 0.10253554, 0.19969112, -0.09384508) * inp_1_0_1; + result5 += M4(0.17829208, -0.017263798, 0.095714435, 0.015920453, 0.047719326, 0.27315283, 0.06549526, 0.034134313, -0.107288554, -0.07971154, 0.023380052, -0.1049888, 0.07676816, -0.1270428, -0.30297834, -0.016645133) * inp_1_1_1; + result5 += M4(-0.080704, -0.04045251, 0.057528976, -0.060223106, 0.030582413, -0.029517375, -0.035083197, 0.13772357, 0.11981866, -0.0055306703, -0.05157847, 0.019871347, -0.31669575, -0.10019969, 0.05156495, 0.13592085) * inp_1_2_1; + result5 += 
M4(-0.07726804, 0.010888947, 0.0045093806, -0.031755887, 0.069382794, -0.114867374, -0.027609147, 0.007948753, -0.05999028, -0.0076457877, -0.022484811, -0.034255974, -0.040651836, -0.03269805, -0.09060754, 0.020044835) * inp_1_0_2; + result5 += M4(-0.22580162, -0.026431922, 0.0066301497, -0.083136596, 0.036208548, 0.038507033, 0.033245984, 0.0031778018, -0.06463218, -0.002233673, -0.047485773, -0.055477843, 0.24420127, -0.12433101, -0.15715355, 0.0033607255) * inp_1_1_2; + result5 += M4(0.18169144, -0.117782086, -0.049622487, -0.007055393, -0.2349688, 0.045167558, 0.06171585, -0.032344848, -0.086783715, -0.12275233, -0.040596236, 0.016874569, -0.28013673, 0.041738532, 0.076820694, -0.038521003) * inp_1_2_2; + result6 += M4(0.4646428, -0.106396586, -0.008314068, 0.04745663, -0.025684066, -0.0687092, 0.004304384, -0.012457071, -0.10869589, -0.0013894064, 0.0054308963, -0.034909822, -0.04161765, -0.069621116, -0.062489342, -0.052697487) * inp_1_0_0; + result6 += M4(-0.13566065, -0.19315332, -0.011638345, -0.07154829, 0.09162782, -0.063815884, 0.088597, 0.040585265, 0.17736122, -0.09628029, 0.049993422, -0.039434943, -0.23161477, 0.03393691, -0.03461162, -0.09007837) * inp_1_1_0; + result6 += M4(0.096893504, -0.073935166, 0.013661386, 0.1132911, 0.025515532, -0.027286345, -0.0048642736, 0.037666928, -0.048467107, -0.08495862, 0.020949233, -0.088655114, -0.029095348, 0.0017143011, 0.046989925, 0.0054008774) * inp_1_2_0; + result6 += M4(0.21191326, -0.042432927, -0.005542918, 0.0049734917, -0.08363724, 0.012624439, -0.01816311, 0.00029272735, -0.12316026, -0.038396236, 0.017166546, 0.012600694, -0.087789804, 0.055348933, 0.032430384, -0.15191323) * inp_1_0_1; + result6 += M4(0.05356737, -0.19634083, -0.044354584, -0.15601216, -0.29275194, 0.15823555, 0.08218647, -0.12905455, -0.0021870707, -0.017191757, 0.008696628, -0.016767973, -0.2398507, -0.017669896, -0.004906887, 0.0259101) * inp_1_1_1; + result6 += M4(0.033864714, -0.018132137, -0.033162106, 0.0486692, 
-0.0010737425, 0.058966868, 0.032421466, 0.064478435, -0.038641904, -0.005040093, 0.009166323, -0.061544646, 0.17484759, 0.029496586, -0.04968734, 0.05957608) * inp_1_2_1; + result6 += M4(-0.4815216, -0.07188454, -0.012073379, 0.009241282, -0.28480425, -0.013349487, -0.0076810173, 0.04503337, -0.36490703, 0.0014258957, -5.720579e-05, -0.08018242, 0.07554508, 0.065987855, 0.0073008398, 0.029608311) * inp_1_0_2; + result6 += M4(0.27818504, -0.24485376, -0.0066393493, -0.062494364, 0.064903826, -0.055958327, -0.0057145157, -0.1297167, 0.0024186247, -0.08357713, 0.0039343257, -0.039283898, -0.18243206, 0.06448699, 0.028300015, 0.09711386) * inp_1_1_2; + result6 += M4(-0.1664957, -0.09776599, -0.016569579, -0.034156576, -0.05563782, -0.052336413, 0.022353496, -0.00014532752, -0.010451572, -0.05604475, 0.008415247, -0.06049494, 0.077859275, 0.019115182, 0.0045760144, -0.019009842) * inp_1_2_2; + result7 += M4(0.0055705504, -0.026394561, -0.1139865, -0.044170834, 0.019989682, -0.018016277, -0.23643732, -0.008260699, 0.0014235481, -0.0050782706, 0.026109695, -0.03192164, 0.0016869969, -0.043272555, -0.03469904, -0.026431138) * inp_1_0_0; + result7 += M4(0.004675645, -0.11380706, -0.016251858, -0.16694085, -0.010026139, -0.14811772, -0.16526401, 0.1084492, 0.005308494, -0.02474828, -0.14797011, 0.0033176611, 0.015307528, 0.058559656, 0.15691474, -0.1340313) * inp_1_1_0; + result7 += M4(-0.0028032598, -0.05997547, -0.121733114, -0.09554267, -0.0004986317, -0.049930423, -0.1273882, 0.013951515, 0.00014469973, -0.002117326, -0.28851274, -0.032613505, -0.0025998768, 0.05574168, 0.07926589, 0.0036856018) * inp_1_2_0; + result7 += M4(-0.005603397, -0.036351632, -0.11528746, -0.022929851, -0.016323281, 0.027111532, -0.06355817, -0.102257326, 0.0077102194, 0.033174835, 0.12208106, -0.07609491, -0.12240418, 0.0012740727, -0.08517984, 0.045448177) * inp_1_0_1; + result7 += M4(0.026478117, -0.047482636, -0.24134436, -0.19304702, -0.020660242, 0.003701428, -0.24806923, 0.07357205, 
-0.040037777, 0.017275618, 0.06370994, -0.09546771, -0.054608576, -0.023270067, -0.14147069, 0.082173534) * inp_1_1_1; + result7 += M4(-0.0056879753, -0.0789688, -0.036169644, -0.08457389, -0.005534551, 0.03795418, 0.12144431, 0.06957072, -0.0027520072, -0.049243074, -0.114631444, -0.15805164, 0.006229704, 0.054365523, -0.0737803, -0.07932503) * inp_1_2_1; + result7 += M4(-0.0027459075, -0.0031624225, -0.2853663, -0.016258257, -0.004350614, -0.006499531, -0.07625435, 0.019749388, -0.0043036724, 0.0026062243, -0.034052182, -0.0254773, -0.007793149, 0.0050190384, 0.014368649, -0.008314004) * inp_1_0_2; + result7 += M4(-0.012016951, -0.14817005, -0.37908626, 0.0062397486, 0.022265838, -0.031428758, -0.18387163, -0.065556504, -0.013573682, -0.010420115, -0.05035488, -0.034537543, 0.016361326, 0.09706439, 0.12125735, 0.08310228) * inp_1_1_2; + result7 += M4(-0.0032962672, -0.057069913, -0.2866559, 0.01628468, 0.012958846, -0.06301743, -0.14468633, -0.052856874, -0.0067473697, -0.021823918, -0.32554987, -0.012471529, 4.9743405e-05, -0.011773439, 0.039131045, 0.028107878) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.06259104, -0.007911529, -0.033087455, 0.09226988, -0.07786077, -0.01577213, -0.08678229, -0.24408747, -0.039184645, -0.02137133, 0.015986593, -0.118641235, 0.01882303, -0.024270365, -0.16987392, -0.15344885) * inp_2_0_0; + result0 += M4(0.14670405, 0.04385066, -0.0486158, -0.006886528, 0.06561302, 0.010654134, 
-0.25718275, 0.11941544, 0.014750529, -0.024777737, -0.06386406, 0.114893936, -0.119082555, -0.00048255626, 0.15127754, -0.06443381) * inp_2_1_0; + result0 += M4(0.073016174, -0.008870542, 0.19351654, -0.09719472, -0.11198074, 0.0290701, 0.023286037, -0.057860527, 0.014365183, -0.0026683658, 0.0041949, -0.02270391, -0.0044946442, -0.06463224, -0.08278831, -0.10824213) * inp_2_2_0; + result0 += M4(0.07936937, 0.014984422, 0.09283034, 0.12912495, -0.19152328, -0.060032662, 0.120669484, -0.29279032, -0.01796172, -0.0113306595, 0.114664845, -0.13806632, -0.15837833, -0.07952474, -0.09303139, -0.084077515) * inp_2_0_1; + result0 += M4(-0.65202504, -0.0027762896, -0.33984727, -0.18644305, 0.075471565, 0.02684578, -0.22864924, -0.19950864, -0.17015947, 0.07735234, -0.43614385, -0.6078004, -0.00021246736, 0.072867185, -0.33468452, -0.15514167) * inp_2_1_1; + result0 += M4(0.14552318, -0.2215449, 0.045654118, -0.017868856, -0.14882736, -0.05951145, 0.123094864, -0.23920804, 0.0658428, -0.26702496, -0.055465832, 0.25096157, -0.099843405, -0.13427813, 0.03559234, -0.21518996) * inp_2_2_1; + result0 += M4(0.15783593, -0.0041399, 0.0020199376, 0.31567332, -0.21559085, -0.013718181, 0.06864336, 0.10989995, -0.09445197, 0.0027337098, 0.068018034, -0.03058095, -0.16046366, -0.017405983, -0.06688804, -0.40090325) * inp_2_0_2; + result0 += M4(-0.21699506, 0.011274276, 0.123575896, -0.6198383, 0.086284466, 0.0052944883, -0.30053416, -0.12883341, -0.03160203, 0.011840349, 0.026714055, -0.12557992, -0.13357289, -0.05784815, -0.09033823, -0.031946022) * inp_2_1_2; + result0 += M4(-0.016761016, 0.018148478, -0.040655173, 0.5077567, -0.035978027, 0.017774666, -0.12156969, -0.37683502, 0.039764706, -0.046592835, -0.0076407106, -0.13444586, -0.047292627, -0.089782365, 0.010468214, -0.49796557) * inp_2_2_2; + result1 += M4(0.20441686, 0.105641656, -0.57313365, 0.039662212, -0.056281734, -0.0032463258, 0.12104667, 0.08683196, -0.19730814, 0.05890102, -0.41860288, 0.05867849, -0.017145434, 
0.001774893, -0.25436202, 0.039173983) * inp_2_0_0; + result1 += M4(-0.0038675999, -0.13757882, -0.42988667, -0.07135995, 0.007278631, -0.083656915, 0.058825217, -0.099255435, 0.006978729, -0.2647683, -0.28938037, -0.03733833, -0.037920482, -0.06694141, -0.40598732, -0.01538189) * inp_2_1_0; + result1 += M4(0.009998102, 0.020497074, -0.18007217, 0.023767253, 0.008274002, 0.054186467, -0.08604311, 0.037877038, -0.009494318, -0.06919818, -0.13998544, 0.02897189, 0.0011283894, 0.038402133, -0.357374, -0.02176028) * inp_2_2_0; + result1 += M4(-0.0067111147, -0.038228486, 0.35508108, -0.3360015, -0.016141115, 0.0339894, 0.08852273, 0.03516315, -0.019841066, 0.030301504, 0.01180214, -0.3614631, 0.07711318, -0.009658857, -0.26690215, -0.30690867) * inp_2_0_1; + result1 += M4(0.003324947, 0.006942956, -0.03625221, 0.14541042, 0.01747195, -0.119628154, -0.22727552, -0.021256894, -0.058296442, -0.034491703, -0.10815976, 0.10701775, -0.012522395, 0.14182894, -0.08321797, 0.0030181266) * inp_2_1_1; + result1 += M4(0.0007243287, -0.03981442, 0.14314127, -0.011543288, -0.0016491759, -0.034187082, 0.015851242, 0.005562158, -0.0025102352, 0.021291113, 0.11228219, -0.0025074272, 0.006264527, 0.012934666, 0.03688195, 0.028460085) * inp_2_2_1; + result1 += M4(0.003825073, 0.0053533437, -0.052753773, 0.13051084, -0.019932156, -0.01216888, -0.101206355, -0.047114212, 0.0030692355, 0.0016778547, 0.03255571, 0.081206575, 0.03073618, -0.016007476, -0.15195127, -0.050261617) * inp_2_0_2; + result1 += M4(-0.00061310123, 0.0029938128, -0.076946884, -0.04023276, -0.0059665437, -0.0036570185, -0.058270033, -0.043692518, -0.008154179, 0.025144642, 0.077070415, -0.04914022, 0.012160264, 0.008769339, -0.27849194, 0.018670456) * inp_2_1_2; + result1 += M4(-0.0018538286, -0.020888457, -0.14603226, 0.004458962, -0.0051186327, 0.005187376, -0.088105775, -0.023515442, 0.0015456943, -0.02115476, 0.061274562, 0.008745916, -0.00017942826, 0.0014278735, 0.0021558965, -0.02485254) * inp_2_2_2; + result2 += 
M4(0.04387733, 0.011177, -0.013155367, 0.0038707254, 0.033662025, 0.07323885, 0.014289165, 0.020749439, 0.014215851, -0.04377387, 0.02840525, 0.023437489, -0.069018185, 0.029670266, -0.0093726795, 0.037346628) * inp_2_0_0; + result2 += M4(-0.1662737, 0.014679469, -0.03971628, 0.03979063, -0.09359844, -0.10326178, 0.042040948, -0.017902981, 0.048015613, 0.07861354, -0.05978879, 0.01613378, 0.0764324, 0.059389252, 0.0019603793, 0.0019048663) * inp_2_1_0; + result2 += M4(0.07047738, 0.012104223, 0.010471003, 0.016561575, -0.014056279, 0.052423958, -0.004780873, 0.008856081, -0.03842137, -0.029917346, -0.017814208, 0.016944503, -0.07138358, -0.04974661, 0.0056911004, -0.021948488) * inp_2_2_0; + result2 += M4(-0.02167664, 0.058325823, 0.00016128928, -0.00394003, 0.0980444, 0.082544304, 0.038742963, -0.042758625, 0.064785205, 0.027517313, 0.0054561617, -0.017314855, -0.14048225, 0.03143404, 0.01539274, -0.07431104) * inp_2_0_1; + result2 += M4(-0.3627822, -0.2677452, -0.07767445, -0.06756611, -0.0081676245, 0.1942054, 0.09633285, 0.3299528, -0.3213503, -0.3397066, -0.12813206, -0.12383137, 0.02204129, -0.068835855, -0.027104858, -0.040614042) * inp_2_1_1; + result2 += M4(0.028998533, 0.034165263, 0.01882919, 0.022605037, 0.010741659, -0.08068657, 0.040684298, -0.044681616, 0.07946782, 0.08955503, 0.020676995, 0.017162135, -0.014604344, 0.025126308, -0.01885885, 0.04648592) * inp_2_2_1; + result2 += M4(0.031499267, 0.010798005, -0.024340192, 0.0053935014, -0.03673988, -0.03745097, -0.028180122, -0.010525879, -0.0043634507, -0.008282364, 0.012158862, -0.007480346, 0.003468437, -0.10743966, -0.04802061, 0.013861989) * inp_2_0_2; + result2 += M4(0.015782064, 0.05101154, 0.013595114, 0.0018728715, -0.09477508, 0.033218864, 0.054674916, 0.007754477, 0.06362434, -0.0034073882, -0.0074852365, 0.0217853, 0.01791608, 0.042523008, 0.025429696, -0.023894863) * inp_2_1_2; + result2 += M4(-0.055626452, 0.0052463147, -0.0025686221, 0.019014176, -0.03757351, 0.035200834, 0.013226553, 
0.04271463, 0.0337667, -0.023146713, 0.022220766, -0.014187415, 0.04665612, 0.009068524, 0.028105063, 0.0009911516) * inp_2_2_2; + result3 += M4(0.02311099, -0.015033379, -0.014415912, 0.007996471, -0.11714304, -0.025033528, 0.014787917, 0.00031632956, 0.036097407, -0.0062593, 0.0008023568, 0.0004291088, -0.058643885, 0.027261145, -0.00373395, -0.0106300535) * inp_2_0_0; + result3 += M4(-0.25627783, 0.014724077, -0.0031693468, -0.012934334, -0.14009495, 0.04730234, -0.07532691, 0.017501894, 0.17639922, 0.04749578, -0.030031111, 0.00010847835, -0.14200123, 0.013962472, 0.0012221021, 0.007009478) * inp_2_1_0; + result3 += M4(0.06224593, 0.053510256, -0.013872289, 0.016935157, -0.0507928, -0.014157633, 0.039609414, -0.016739354, 0.07427419, -0.092689894, 0.01857107, 0.0059409305, 0.057695348, -0.011191513, -0.0154221505, -0.010002582) * inp_2_2_0; + result3 += M4(-0.15928954, 0.04469865, 0.013059807, -0.014103501, 0.057253107, -0.03000104, 0.060849454, -0.008835153, -0.05975281, 0.03099963, -0.022080095, 0.008955542, -0.10001169, -0.02306701, 0.077677965, 0.017762778) * inp_2_0_1; + result3 += M4(-0.7209511, -0.33367357, 0.22877729, 0.0061251954, 0.088426866, 0.03677022, -0.08787391, -0.017562442, -0.6404437, -0.1710262, -0.28416404, 0.011668628, -0.26956356, -0.077434845, 0.07234901, -0.012213251) * inp_2_1_1; + result3 += M4(-0.029024111, -0.06502331, -0.011149307, 0.011200875, 0.012817251, -0.053123422, -0.029780958, -0.0075182803, 0.0239775, 0.016467577, -0.008465127, -0.0021384323, 0.019587008, -0.020116564, -0.025568662, -0.0240682) * inp_2_2_1; + result3 += M4(0.10459938, 0.0138568925, -0.010416794, 0.013563447, -0.00088927144, -0.021339059, -0.02198659, 0.0025771253, 0.059850562, -0.01238115, -0.004079428, 0.0014808591, -0.008280608, -0.0142796645, -0.00029255965, -0.03438513) * inp_2_0_2; + result3 += M4(-0.056060266, -0.10531251, 0.015185159, -0.024719283, -0.11129147, 0.026094018, 0.046266057, -0.018299006, -0.10789085, 0.009946776, -0.038517643, 
0.0032327347, 0.08875372, -0.06078948, -0.008161181, 0.010793295) * inp_2_1_2; + result3 += M4(-0.04116976, -0.00475276, -0.011068314, -0.9719308, -0.100531764, -0.06516781, 0.0069025243, -0.22409818, -0.031182699, -0.009395091, -0.056300312, -1.0057682, 0.015271213, 0.0041449284, -0.013503556, -1.2952812) * inp_2_2_2; + result4 += M4(-0.0010569907, 0.037784833, 0.09058641, 0.00082357554, -0.009851633, -0.0206631, 0.02837604, 0.0010502184, 0.02194765, -0.009642023, -0.0026158122, 0.017715322, 0.025873099, 0.06527135, -0.042106256, -0.015425125) * inp_2_0_0; + result4 += M4(-0.013039143, -0.00092544657, 0.051402394, -0.073085226, -0.015918039, -0.017300375, 0.056266524, 0.0017518857, 0.015943771, 0.0051748073, 0.069561206, 0.038211856, 0.04274, -0.0036364659, 0.11233605, -0.027552709) * inp_2_1_0; + result4 += M4(0.026801294, 0.058651876, -0.08943758, 0.0057815216, 0.0014140977, 0.005042935, -0.13145381, -0.02659785, 0.019952124, -0.0039740773, -0.06676227, 0.02837083, -0.008902661, -0.02823108, -0.050232675, -0.0055570873) * inp_2_2_0; + result4 += M4(0.012736761, -0.076623105, -0.13613585, -0.0010271526, 0.001768636, -0.022922553, 0.10797487, -0.078531064, 0.0011252342, 0.020363344, 0.0037479124, 0.022272632, 0.0015242241, -0.0706725, 0.004770372, -0.018829994) * inp_2_0_1; + result4 += M4(-0.055683408, -0.07893092, -0.28381112, 0.001254962, 0.04472634, 0.0785131, -0.06490618, -0.05510835, -0.14655365, 0.061543383, -0.20277788, -0.038100597, -0.08800601, 0.03669007, -0.20510712, -0.029635012) * inp_2_1_1; + result4 += M4(0.041054245, -0.01956224, 0.21626267, -0.02382071, -0.0013260319, -0.08335329, 0.07006225, -0.016757535, -0.007988418, -0.0040367995, -0.067163855, 0.029561952, 0.022996977, -0.06787791, 0.026121844, -0.0044194665) * inp_2_2_1; + result4 += M4(0.009216556, -0.07813361, 0.08760252, 0.012415527, -0.030264309, 0.014184212, -0.089587666, -0.02850281, 0.004826943, -0.04655235, 0.022605399, 0.016589975, -0.034731586, -0.52998376, -0.09905967, 
-0.041101467) * inp_2_0_2; + result4 += M4(-0.037874702, -0.35465613, -0.26578254, -0.009551241, 0.014520269, 0.094988525, 0.095908746, -0.0032020216, 0.015690498, 0.006354517, 0.06937414, -0.004596613, 0.060183756, -0.29521805, -0.108245134, -0.03682771) * inp_2_1_2; + result4 += M4(0.01502931, 0.050048694, 0.12765224, 0.026397388, 0.0032798718, -0.03649024, 0.019652147, 0.0033454793, -0.004857356, 0.0051806583, 0.013952992, 0.020540467, 0.020426799, -0.056183644, 0.017993515, 0.01699833) * inp_2_2_2; + result5 += M4(0.06332271, -0.023084689, 0.032270726, 0.030445438, 0.18853442, 0.06726671, -0.04710401, 0.10672021, 0.10711485, 0.032424342, 0.0026893164, 0.09738551, 0.24309203, -0.035328314, -0.059811164, 0.0035163194) * inp_2_0_0; + result5 += M4(-0.031312633, -0.028656557, 0.060663447, -0.02233647, 0.038305853, 0.04246763, 0.05070555, 0.047282346, 0.022795606, 0.010903942, -0.1032557, -0.15654396, -0.008885978, 0.052279137, 0.06697581, 0.05159628) * inp_2_1_0; + result5 += M4(0.081875764, -0.01453514, -0.0054250895, -0.029229179, -0.15769237, -0.0713213, 0.071340404, -0.03371788, 0.008936784, -0.021031775, 0.06703637, 0.014112684, -0.028089365, -0.0071306084, -0.03943905, 0.0019693028) * inp_2_2_0; + result5 += M4(0.037231147, 0.08544815, 0.023376346, -0.020104773, 0.10020539, -0.015085355, -0.0060485243, 0.080421075, 0.15664357, 0.07094089, -0.07145073, 0.09701311, 0.24878515, -0.12589175, -0.1816692, -0.13067612) * inp_2_0_1; + result5 += M4(-0.12882102, -0.24260274, -0.43471512, 0.01938544, 0.11010322, 0.13329925, 0.115565196, 0.06456029, -0.31028664, -0.24667418, -0.26054385, -0.09559916, -0.67517704, -0.07482172, 0.071183324, 0.04955354) * inp_2_1_1; + result5 += M4(0.06611156, 0.15018785, 0.054557666, 0.017349077, -0.0818607, 0.06388472, 0.03500259, -0.14694388, -0.030318553, 0.06897548, 0.06355376, 0.11583515, 0.09560257, -0.0022927609, -0.10419371, 0.032708354) * inp_2_2_1; + result5 += M4(0.09569397, -0.027850833, 0.05960813, 0.0046952227, -0.13313407, 
0.027086373, 0.11578828, -0.022797415, 0.048064835, 0.0027774738, 0.0049024625, 0.058362234, -0.2263547, 0.020394979, 0.0572644, -0.029309602) * inp_2_0_2; + result5 += M4(-0.050434433, 0.107525654, 0.117903136, 0.059306815, 0.10257986, -0.04112016, 0.03624714, 0.06940063, -0.1844857, 0.042563245, -0.08704364, -0.09770156, -0.25283772, -0.06382317, -0.14003965, -0.07532586) * inp_2_1_2; + result5 += M4(-0.025616704, 0.04303626, 0.0703198, -0.016617738, 0.046424564, 0.042200685, -0.051435344, 0.007989153, -0.147374, 0.005222426, 0.050844256, -0.036575984, 0.04505599, -0.023205958, -0.04365487, 0.029482046) * inp_2_2_2; + result6 += M4(0.16323288, -0.07697494, 0.0036021718, -0.018482288, 0.07922852, 0.031661283, 0.04610719, 0.090015285, -0.19198969, 0.0022031656, 0.012363241, 0.006750837, -0.12190212, 0.118119456, 0.04309471, 0.15813415) * inp_2_0_0; + result6 += M4(0.030367097, 0.087709054, -0.019422337, 0.08742913, -0.03249268, 0.01943231, -0.09225626, 0.10421135, -0.07407643, 0.030260053, -0.04976755, -0.09395393, -0.15528789, 0.049084287, 0.044716276, -0.036950078) * inp_2_1_0; + result6 += M4(-0.14495733, -0.0033047767, -0.030252518, 0.049959883, -0.06735904, -0.071782365, 0.00432423, -0.014054759, 0.01710648, -0.048354227, 0.065480836, 0.002764397, 0.06308667, -0.06444245, -0.021439746, -0.0625157) * inp_2_2_0; + result6 += M4(0.13954696, 0.015149074, 0.01400249, 0.04257805, -0.09718105, 0.0357621, -0.0113757625, 0.0772206, 0.21321023, -0.07966299, 0.04483856, 0.073616624, -0.29049397, -0.15661527, -0.048223075, 0.06354912) * inp_2_0_1; + result6 += M4(-0.17682892, -0.32434925, -0.058441192, 0.009955925, 0.2313231, -0.06718312, -0.11039461, -0.15741758, -0.026655002, -0.5290647, -0.055935364, -0.11362352, 0.2593133, -0.16837834, 0.12212712, -0.16563371) * inp_2_1_1; + result6 += M4(-0.0765633, -0.0022757533, -0.0030445922, 0.04933367, -0.09522646, 0.01708325, 0.018829428, -0.03566491, 0.083820574, 0.009320629, 0.004601883, -0.013381807, -0.07618723, 
0.023810752, -0.03849788, -0.0015569695) * inp_2_2_1; + result6 += M4(0.12340713, -0.035633143, -0.000730753, 0.039920222, -0.13694862, 0.025033863, -0.0047767838, -0.039701987, -0.17719546, -0.0033921285, 0.020795459, 0.0026577634, -0.23769258, -0.05419352, 0.0007649054, -0.012916516) * inp_2_0_2; + result6 += M4(-0.18191607, -0.016308228, 0.013017699, 0.0013568805, -0.07645262, 0.019816648, 0.004391781, -0.014893658, -0.039497644, 0.08922314, -0.02652472, -0.01703181, 0.19856219, -0.096463844, 0.006254947, -0.030607205) * inp_2_1_2; + result6 += M4(0.05397833, 0.030990133, 0.002806348, 0.016910397, -0.04133647, 0.012163248, -0.014821759, 0.06565339, 0.06255686, 0.01559677, -5.922529e-05, -0.068239056, -0.12171919, -0.09679009, 0.033463333, -0.0014853496) * inp_2_2_2; + result7 += M4(0.04146421, -0.012865749, -0.009707601, 0.027850294, 0.013585483, -0.022817992, 0.07336379, -0.0074528162, -0.0016996431, 0.013874952, -0.08006178, 0.020839715, -0.005113131, 0.021290349, 0.24516137, 0.0037921611) * inp_2_0_0; + result7 += M4(0.028129315, 0.0075063645, 0.18359877, -0.02147192, 0.008527542, 0.10667993, 0.16808704, -0.10862029, 0.024802713, -0.047098104, -0.18204574, 0.16109203, -0.007077818, 0.038010005, -0.01702178, -0.07948193) * inp_2_1_0; + result7 += M4(0.009913939, 0.03263535, 0.18109964, 0.013029601, -0.013681817, 0.05438949, -0.12543575, -0.05536285, -0.007107966, 0.010420662, 0.055783633, 0.07936553, -0.008366168, 0.0051002456, -0.12116985, -0.09176514) * inp_2_2_0; + result7 += M4(-0.0039965436, 0.013184399, 0.017582629, 0.03430134, 0.12803346, 0.030973611, -0.14719161, -0.025845028, -0.011929984, -0.03815087, -0.30388555, -0.01967596, 0.028990403, -0.04263259, -0.4578903, -0.1594504) * inp_2_0_1; + result7 += M4(0.008504513, -0.15613689, -0.92339265, -0.011249895, 0.07949582, -0.051825784, 0.028209334, 0.00655686, -0.003414628, -0.02872148, -0.45489213, -0.009449394, -0.0744571, -0.10714275, -0.27856743, -0.24656865) * inp_2_1_1; + result7 += M4(0.008009527, 
0.021199463, -0.11994805, 0.011137968, 0.0041203573, -0.09547085, -0.087147444, 0.029765243, -0.02127172, 0.057646498, 0.06545404, -0.0025877974, 0.004377491, -0.056918643, -0.11158697, -0.020177836) * inp_2_2_1; + result7 += M4(0.048053, 0.039475646, -0.042274997, 0.009786394, 0.0028160515, -0.0037620077, -0.10746224, -0.036494777, 0.017574804, -0.04649511, -0.03779512, -0.009219406, -0.051743623, -0.076405086, -0.106107414, 0.04329679) * inp_2_0_2; + result7 += M4(0.0118290065, -0.06250438, -0.13289489, -0.07007109, 0.010890779, 0.034959443, 0.101750456, 0.061163537, -0.0028765078, -0.054626506, 0.08974447, 0.015254667, -0.012915041, -0.11506801, -0.4121583, -0.04415781) * inp_2_1_2; + result7 += M4(0.0024066872, -0.091722414, -0.12651238, 0.016087336, -0.0007628652, 0.08666506, -0.057445258, -0.0046896227, 0.006538677, -0.071827024, 0.0032424238, 0.00068183034, 0.015331278, -0.060188826, 0.1724857, -0.0058465926) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.01884821, 0.02225298, 0.0609312, 0.26772645, 0.010304153, -0.025359716, -0.124975115, -0.101660624, 0.039085135, -0.0012123106, 0.0376473, -0.1736828, 0.029522952, 0.019022364, 0.0065592313, 0.0016020348) * inp_3_0_0; + result0 += M4(-0.009566287, -0.06439758, 0.03587801, 0.31137368, 0.052976143, -0.00045283034, -0.0732186, -0.19127107, 0.017481882, -0.010848177, -0.17232758, -0.062315885, 0.063886866, -0.016843708, -0.03020957, 0.0970365) * inp_3_1_0; + result0 += 
M4(0.062872596, 0.062106118, -0.029959345, 0.1910304, -0.03332523, 0.034179598, 0.12184684, 0.087091975, -0.05155777, -0.054864924, -0.09164668, 0.05479193, -0.021929933, 0.043209106, 0.031430453, 0.013835954) * inp_3_2_0; + result0 += M4(0.14966221, 0.039149858, -0.018892152, 0.04979894, -0.15222071, -0.013965407, -0.13854334, 0.08704429, 0.032250788, -0.023581238, 0.03958956, 0.13200888, 0.09045509, 0.08314211, -0.115738794, 0.3736751) * inp_3_0_1; + result0 += M4(-0.025297886, -0.05312454, 0.18119511, -0.13896842, 0.12201004, -0.06974543, 0.009590841, -0.1759535, -0.42742318, -0.036296893, -0.023707138, -0.02932279, 0.057680465, -0.06070717, 0.0047926847, -0.26466325) * inp_3_1_1; + result0 += M4(-0.012135449, 0.14930926, 0.13740848, -0.23095651, 0.08305027, 0.061010078, -0.01396914, 0.042804472, 0.096340165, 0.13279516, -0.19360799, 0.16441306, -0.052142918, 0.07423331, 0.22432159, 0.20987682) * inp_3_2_1; + result0 += M4(0.014316071, 0.03874188, -0.042387724, 0.33908868, -0.04863518, -0.0328775, 0.038263336, -0.3184205, 0.08507752, -0.013796855, -0.11221604, -0.08596128, -0.010760439, -0.0015378286, -0.05118684, 0.14045839) * inp_3_0_2; + result0 += M4(0.09434496, -0.05842221, -0.059500962, 0.23325484, 0.106550224, 0.03946791, 0.12929924, 0.45724982, -0.29787195, -0.013933312, 0.050397996, -0.46583217, 0.046672523, -0.081212655, -0.08685097, -0.2800335) * inp_3_1_2; + result0 += M4(-0.0013050294, 0.042344168, 0.052031405, 0.26614693, 0.01395185, -0.0017289019, -0.035085235, -0.00588513, 0.036729053, 0.048423328, -0.07941932, -0.040365215, 0.028111415, 0.06112914, -0.09793375, -0.1132537) * inp_3_2_2; + result1 += M4(-0.06250671, 0.012309623, 0.1481295, -0.0020055398, 0.049955696, -0.065890044, -0.54642016, -0.023447255, 0.0030096937, 0.043713823, -0.034119286, -0.019435098, 0.033844166, -0.040153492, 0.25838697, -0.10927334) * inp_3_0_0; + result1 += M4(0.027105171, 0.0014346655, -0.4046152, -0.01299009, 0.021844005, -0.012008094, 0.014106283, -0.03993987, 
-0.003289567, -0.04379177, 0.020796522, -0.0063147615, -0.029618349, 0.042246055, 0.34788325, 0.106097095) * inp_3_1_0; + result1 += M4(0.010641735, -0.09698625, -0.102795415, -0.00017856473, 0.009379015, 0.04438752, 0.3853207, 0.011924211, -0.00039226655, -0.0039059813, -0.16610676, 0.009873127, 0.013944055, -0.010356517, 0.31021017, -0.0005584608) * inp_3_2_0; + result1 += M4(-0.024330674, -0.014041768, 0.013623545, 0.0087550925, -0.02536001, 0.0022383442, 0.04521856, 0.045863442, 0.036882702, 0.005205646, -0.168819, -0.22588225, -0.016948085, 0.044146243, 0.28415143, 0.28309682) * inp_3_0_1; + result1 += M4(0.022651544, -0.030680181, 0.035747916, -0.03521948, -0.017953519, 0.054650687, -0.00035218126, 0.06687334, 0.011700043, 0.012629784, -0.13795328, 0.06381413, -0.0016056991, 0.06598586, -0.15195106, -0.008760848) * inp_3_1_1; + result1 += M4(-0.006826481, 0.048955724, 0.13722718, 0.0025277198, 0.003250822, -0.018708214, -0.07780324, -0.008313009, -0.00716623, -0.018976055, -0.22579159, -0.008596183, -0.009374258, -0.009971103, 0.3956088, -0.0034246633) * inp_3_2_1; + result1 += M4(-0.0095452, 0.02172935, -0.085909374, -0.014317445, 0.0016978491, -0.010642444, 0.09447157, -0.05678749, 0.0009725698, -0.019332105, 0.057287097, 0.07546865, 0.019813916, 0.024594069, 0.01624759, 0.14962631) * inp_3_0_2; + result1 += M4(0.0033371202, -0.005898891, -0.08099478, 0.019843815, -0.0043270085, -0.03385353, -0.060939293, -0.018619116, 0.0059468923, 0.006402152, 0.124421105, 0.0016647028, -0.00082514866, -0.08626113, 0.100049764, -0.043861367) * inp_3_1_2; + result1 += M4(-0.003957271, -0.0014693633, 0.038502783, 0.0005841569, 0.0011435278, -0.005467989, 0.047523648, 0.0011898798, -0.0055441153, -0.0037178195, -0.00010545709, -0.012234697, -0.004670635, 0.008560715, -0.051418226, 0.010909083) * inp_3_2_2; + result2 += M4(-0.010705484, -0.01650546, -0.03246215, 0.0055108117, -0.104894646, -0.088077545, 0.0036809004, -0.04068051, 0.023358036, 0.06055789, 0.0037449882, 
0.014770061, -0.013959497, -0.072800525, 0.009345961, -0.025399605) * inp_3_0_0; + result2 += M4(0.04424502, -0.0010698559, 0.0073272446, 0.02035995, 0.01310611, 0.02774244, -0.026604129, 0.026129542, -0.04380847, 0.053310756, 0.010456372, 0.014191831, 0.06798116, 0.005584759, -0.021483535, 0.03465087) * inp_3_1_0; + result2 += M4(-0.06981241, 0.009179036, -0.007089444, 0.017998978, 0.033409934, -0.0010209056, 0.009835712, -0.01610797, 0.027777841, -0.02542095, -0.021839399, 0.006255029, -0.015071021, 0.0113992775, 0.0005979145, 0.014408419) * inp_3_2_0; + result2 += M4(-0.021173203, 0.03255849, -0.007509637, -0.0014215419, -0.030343855, -0.027915409, 0.015587552, -0.06947983, -0.013560703, -0.04733876, -0.010759031, 0.051037107, 0.06359524, 0.08342158, -0.0065136985, -0.024240833) * inp_3_0_1; + result2 += M4(-0.06390198, 0.0067974203, -0.014299631, -0.0330741, 0.07374566, -0.049495887, -0.03310458, 0.11702922, 0.055769373, -0.17010662, -0.029184362, -0.048500344, -0.06861463, -0.123462, 0.04641681, -0.092642166) * inp_3_1_1; + result2 += M4(0.03394884, 0.023914674, 0.001027905, -0.013558634, -0.018708143, -0.023531381, 0.03330786, -0.039130103, -0.054672997, 0.02905047, 0.0028177788, 0.022127794, 0.08353726, -0.025451906, 0.02043948, -0.030153554) * inp_3_2_1; + result2 += M4(0.02741172, -0.0044080904, -0.01745032, -0.0046453015, 0.022975057, -0.0059091668, -0.0013712894, 0.029681692, 0.0044574183, 0.020697022, -0.001904999, -0.0069700526, 0.13211533, 0.013961191, 0.015293953, -0.00871585) * inp_3_0_2; + result2 += M4(-0.015452823, 0.00926378, 0.009741526, -0.01230558, -0.029600343, -0.030560542, 0.014431204, 0.035062976, -0.073340975, 0.060812566, -0.014831958, 0.024725016, -0.08529233, -0.0006856377, -0.03570654, 0.12063796) * inp_3_1_2; + result2 += M4(0.0365202, 0.020286338, -0.011979078, 0.02199579, -0.01317772, 0.034260873, -0.011521621, -0.027682288, -0.0009087675, -0.07905871, -0.0034417368, -0.009568027, -0.0463178, 0.022884985, -0.0015075009, 
0.04794616) * inp_3_2_2; + result3 += M4(0.040243845, 0.020009438, -0.022967605, -0.005078967, -0.001594309, 0.05022829, 0.017403048, 0.0021964486, 0.08951761, 0.019662904, 0.00875745, -0.00035708013, 0.01922627, -0.030730775, -0.012931215, 0.0025635688) * inp_3_0_0; + result3 += M4(0.14607942, -0.014502504, 0.05937585, 0.01516785, -0.06510718, -0.077533536, -0.014252629, -0.01605195, 0.093539715, 0.031601768, -0.010872191, 0.022814253, 0.08808098, -0.050142072, -0.00042278145, -0.008262899) * inp_3_1_0; + result3 += M4(0.110871136, 0.008590263, -0.02233829, -0.031699177, -0.0490625, -0.01637946, 0.0047087697, -0.0010593381, -0.03551471, -0.011482322, 0.0006708069, -0.013692782, 0.019284317, 0.047920547, 0.0062774224, -0.004485404) * inp_3_2_0; + result3 += M4(0.009341054, 0.012021308, -0.021828284, 0.018237026, -0.15594478, -0.07180854, 0.029837968, 0.015278842, -0.08246709, -0.045936767, -0.0018548577, -0.019593865, 0.06280897, -0.022976711, -0.024260508, -0.0090077) * inp_3_0_1; + result3 += M4(-0.18668243, -0.044478036, 0.054378722, -0.027900947, 0.02033037, 0.10561459, 0.002562161, -0.0351626, -0.23726769, -0.17712243, -0.050947964, -0.003436438, 0.052377757, 0.16239664, -0.017259536, 0.046880163) * inp_3_1_1; + result3 += M4(0.015096582, -0.03987804, -0.025625862, -0.0031193558, 0.072353065, 0.008608825, 0.03284955, 0.046854686, -0.042063735, 0.022962196, 0.02525136, 0.022712387, 0.03157628, -0.03814462, -0.03217625, -0.03147913) * inp_3_2_1; + result3 += M4(0.017976282, -0.0019546675, -0.009366877, -0.009684881, 0.010940719, 0.018178592, 0.0053218855, 0.016856434, -0.023441786, 0.016724804, 0.005823601, 0.01591395, 0.119048, 0.005636123, 0.0003508919, -0.0065224557) * inp_3_0_2; + result3 += M4(0.043224, -0.022490898, -0.0318398, 0.0662153, -0.036592364, -0.081410274, -0.040130008, -0.043861974, 0.010291703, 0.03139131, 0.0077008577, -0.078571044, 0.15903676, 0.09245416, 0.012083053, 0.013685362) * inp_3_1_2; + result3 += M4(0.036334466, -0.0030910447, 
0.0054326546, -0.2346665, -0.0027534284, -0.016249357, -0.0113077955, 0.11272883, -0.06895104, 0.02666235, 0.027947282, -0.60318786, 0.089082755, -0.008126287, -0.000207589, -1.1350799) * inp_3_2_2; + result4 += M4(-0.029548187, -0.013966757, -0.008829929, 0.003102979, -0.037540227, -0.02307922, 0.0052571394, -0.1140597, 0.024680968, 0.03634128, -0.029496174, 0.0036431698, -0.01264313, -0.044854958, 0.051910926, 0.004404255) * inp_3_0_0; + result4 += M4(0.016480023, -0.0033210155, -0.071480766, 0.033374444, 0.010757276, -0.022202821, 0.08354359, 0.081340596, 0.025887804, 0.009548545, -0.039751876, -0.009907633, 0.008462095, 0.008830086, -0.103166394, 0.019572519) * inp_3_1_0; + result4 += M4(0.0020512184, 0.053157315, 0.025247136, -0.042039078, 0.026559286, 0.023869678, -0.040236153, -0.040763464, -0.010120602, 0.004665955, 0.008478423, -0.034106277, -0.023226656, -0.04557557, 0.0031924895, -0.008834393) * inp_3_2_0; + result4 += M4(-0.011608415, 0.061025925, -0.041336574, 0.0128027545, 0.0009278712, -0.006532636, -0.16649033, -0.02779791, 0.0066272365, -0.015011618, -0.028866014, 0.056353964, -0.03133743, -0.023878438, -0.124563724, 0.036416247) * inp_3_0_1; + result4 += M4(-0.0039392044, 0.05639322, 0.15169688, -0.0026368015, -0.07996431, 0.007413352, -0.004271802, 0.041610185, 0.013149139, -0.04214141, 0.053484872, -0.07891855, -0.12922476, -0.055902585, 0.18590944, 0.086027175) * inp_3_1_1; + result4 += M4(0.003076728, 0.06658513, 0.0014087419, -0.027857183, 0.02210675, -0.029139476, 0.039626084, 0.02102879, -0.010810135, -0.03377696, -0.119157836, -0.016692212, -0.036642957, 0.014692644, -0.0742418, -0.009270793) * inp_3_2_1; + result4 += M4(-0.020245697, -0.034442406, 0.05797367, -0.022118598, 0.029425234, 0.022680778, 0.016676152, 0.022658339, 0.0071033794, -0.06422739, 0.123738706, -0.005134058, 0.0004977546, 0.20787615, 0.105217434, 0.024816323) * inp_3_0_2; + result4 += M4(-0.006777237, -0.025886461, -0.11807061, 0.026512923, 0.0007593673, 0.014026958, 
0.0249759, -0.012121091, -0.0019108102, -0.10819494, -0.17732982, 0.030663192, 0.18832111, 0.08630976, -0.01657824, 0.068553194) * inp_3_1_2; + result4 += M4(-0.018167648, -0.03997246, -0.013433306, -0.017634757, -0.012371488, 0.023017474, 0.0016603069, 0.018851371, 0.011730141, -0.014452896, 0.018975778, 0.031780776, 0.012363704, 0.108077295, -0.062828265, 0.022595907) * inp_3_2_2; + result5 += M4(0.0145915765, -0.045400243, 0.073935665, -0.034597788, -0.23691322, -0.021288719, -0.1574719, -0.011355033, -0.145868, 0.025925312, -0.072244376, -0.06409915, -0.18273768, 0.022524066, -0.04140903, -0.03942252) * inp_3_0_0; + result5 += M4(0.107767306, -0.0021494434, 0.038669072, 0.08293106, 0.19135106, -0.06582466, -0.04842468, 0.11317694, -0.138321, -0.03875345, 0.05869516, -0.06852802, -0.05094979, -0.055154055, 0.01619824, 0.01852071) * inp_3_1_0; + result5 += M4(0.14048418, 0.008264727, -0.0042425888, 0.02912613, -0.050939154, 0.017133055, 0.061310638, -0.07764296, 0.05216904, -0.00859254, -0.024114585, 0.06240051, 0.09720164, -0.0038485967, -0.015042794, -0.00055489194) * inp_3_2_0; + result5 += M4(0.056485083, 0.0018631028, 0.052851774, -0.012058202, -0.20219888, -0.039547462, 0.03850607, 0.023425415, 0.051048644, 0.040121235, -0.017586619, -0.077584416, -0.35448, 0.03971185, 0.2152446, -0.04790976) * inp_3_0_1; + result5 += M4(0.15629588, -0.045338333, -0.012678156, 0.07396085, 0.0480755, 0.054410193, 0.024967624, 0.123384476, -0.23930879, -0.0009900838, -0.31708395, -0.17032936, 0.30256245, 0.11198592, -0.09638942, 0.082779706) * inp_3_1_1; + result5 += M4(0.14274575, 0.035344955, -0.033423383, 0.0021479705, -0.1311837, 0.013131482, 0.031113813, -0.03752862, -0.09714721, -0.031091178, -0.015206765, 0.089015365, 0.024627196, -0.033424858, 3.3462973e-05, -0.032662988) * inp_3_2_1; + result5 += M4(0.026727347, 0.05133357, 0.044563908, 0.03557109, 0.059456248, -0.028536018, -0.08496481, 0.04663098, 0.12366748, -0.028286988, -0.015779838, -0.05601998, -0.047197193, 
-0.064062975, -0.029679319, 0.02629866) * inp_3_0_2; + result5 += M4(0.053813867, -0.030096482, -0.0156154195, 0.06651504, -0.02930628, -0.010030458, 0.090722345, 0.034194693, -0.03799409, -0.006204306, -0.10783034, -0.038356468, 0.18142909, 0.093396164, -0.07819175, -0.0790709) * inp_3_1_2; + result5 += M4(0.084904894, -0.01936723, 0.012884307, 0.01079485, 0.13136025, -0.0028572613, -0.02520937, -0.067924984, -0.3820122, -0.0013870555, 0.08223087, 0.026284024, -0.050817117, -0.03537573, 0.04668999, 0.011017071) * inp_3_2_2; + result6 += M4(0.2575977, 0.010964673, 0.008924867, -0.081447475, -0.048979428, -0.12353753, -0.063453056, 0.034469236, -0.042514462, -0.013070628, 0.0045871357, 0.012448431, 0.14621142, -0.09512812, -0.02290356, -0.044323735) * inp_3_0_0; + result6 += M4(0.19578551, -0.15015762, 0.07775376, -0.0056468034, -0.031699214, -0.0033966932, 0.0032211933, 0.047410674, -0.16827974, -0.04243024, -0.081694946, -0.18510474, 0.12526773, -0.09593631, 0.0045592147, -0.0120100165) * inp_3_1_0; + result6 += M4(0.02321155, -0.0012054921, -0.016785277, 0.11251173, -0.032332707, 0.07800903, 0.0018862602, 0.0065808785, 0.052115206, 0.020399416, -0.01715928, 0.051596902, -0.11143815, -0.039698903, -0.023331625, -0.011376851) * inp_3_2_0; + result6 += M4(0.04101079, 0.005097226, -0.010333197, -0.009281498, -0.117112294, 0.0644846, -0.025808629, -0.05194357, -0.023917366, -0.026221342, 0.009081462, -0.00026552044, 0.07379806, 0.07338241, 0.05444282, -0.06932964) * inp_3_0_1; + result6 += M4(0.04542431, 0.15359387, 0.015007861, 0.012507759, -0.052328404, 0.03981155, 0.027189463, 0.09547719, -0.14972119, -0.057026792, 0.015331038, -0.03261109, 0.03163613, 0.1932335, 0.10518103, 0.08578725) * inp_3_1_1; + result6 += M4(-0.019297699, 0.08715985, 0.0109084025, 0.060195714, -0.02296073, -0.07364316, 0.0067465403, 0.04858355, 0.036142863, -0.12773067, -0.016158149, 0.12716506, -0.053368356, 0.06778647, 0.08765144, -0.0062067686) * inp_3_2_1; + result6 += M4(0.26197362, 
-0.019081198, -0.008743975, 0.048327573, 0.102703765, -0.0080702845, 0.008677162, -0.0031994798, -0.12507248, -0.03463628, -0.021783654, -0.021980956, 0.11624361, 0.07184015, 0.01349438, 0.049611583) * inp_3_0_2; + result6 += M4(0.15259522, -0.06820844, 0.0061506326, -0.022589752, 0.10179859, -0.021071019, 0.0005125368, 0.043334063, -0.20909151, -0.021796664, -0.013409315, -0.06586106, -0.14444274, 0.07329714, -0.0595393, -0.097062066) * inp_3_1_2; + result6 += M4(0.015401729, -0.036891527, 0.008934082, 0.08003983, -0.07095628, 0.006754855, 0.012062694, 0.023313662, 0.11078438, 0.018024879, 0.011048344, -0.10227341, 0.06207329, 0.11343193, -0.029054716, 0.026508108) * inp_3_2_2; + result7 += M4(0.001332309, 0.008496888, -0.04085346, 0.03902241, 0.0175806, 0.022650866, -0.105883494, -0.051471643, -0.015511705, -0.042901974, -0.059724472, 0.038504463, 0.0004971406, -0.0295719, -0.16592711, -0.027845114) * inp_3_0_0; + result7 += M4(0.0066125807, -0.053711805, -0.16609953, 0.19058682, 0.05513127, -0.058335137, -0.01801092, -0.048993565, -0.0038444567, 0.010192278, -0.04772477, 0.018794794, -0.0049104164, -0.07499136, -0.07840126, 0.14432356) * inp_3_1_0; + result7 += M4(0.0018919223, -0.018218946, 0.07316231, 0.13501935, -0.012945283, 0.07542135, 0.20659958, -0.012889675, -0.0013052122, 0.005058418, -0.037553705, -0.021615338, 0.0014601327, -0.06847536, -0.061825827, 0.038802728) * inp_3_2_0; + result7 += M4(0.041981738, 0.005597128, 0.11018467, 0.0032644204, 0.07530397, -0.05951611, 0.07450283, -0.005922322, 0.036117464, 0.011094838, -0.02793344, -0.004478613, -0.01604977, 0.017032115, 0.35127386, 0.09251453) * inp_3_0_1; + result7 += M4(0.066794336, 0.07097917, 0.015864775, -0.13579993, 0.037443314, -0.009019754, -0.06436591, -0.008693444, 0.014885683, -0.05455319, -0.07293119, -0.055708934, 0.044612657, 0.17219391, 0.28060448, 0.15946048) * inp_3_1_1; + result7 += M4(0.0049949894, 0.09829119, 0.18719345, -0.023272216, -0.004434824, -0.033500746, -0.06961843, 
-0.03294643, -0.020013694, -0.052665558, -0.15829746, -0.10578164, 0.004096447, 0.14796317, 0.3790023, 0.10108945) * inp_3_2_1; + result7 += M4(-0.0045376658, -0.022875838, -0.037856285, -0.026642285, 0.007010922, 0.018420387, 0.15169138, 0.05360536, -0.036082547, 0.043787856, 0.06766086, -0.001375816, 0.027911961, 0.050982665, 0.3339394, -0.015187151) * inp_3_0_2; + result7 += M4(0.0029686706, -0.0013550227, -0.04827626, -0.023147695, -0.0058941836, -0.007722708, 0.020669388, -0.004416151, -0.001527503, -0.045378324, -0.010862972, -0.008204876, 0.006345512, 0.18554237, -0.15723045, -0.13058613) * inp_3_1_2; + result7 += M4(-0.0006688145, 0.017388795, -0.023427669, -0.034102734, 0.00031701455, 0.022926936, 0.16746669, 0.04390338, -0.028491322, -0.045772992, -0.18151388, 0.023017827, -0.005325638, 0.17508554, 0.23028685, -0.0021354717) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.023859713, 0.004455244, -0.002377918, -0.13685068, 0.04832673, -0.020542728, -0.069400765, 0.16850239, -0.021624798, -0.030256521, -0.12316566, -0.30301347, 0.06703788, 0.031297717, -0.093510635, 0.45338058) * inp_4_0_0; + result0 += M4(0.014708575, 0.004094363, 0.1738236, -0.13215998, -0.010963995, 0.020334357, 0.13969354, -0.47183305, 0.14020021, 0.016115865, -0.037026897, 0.25319436, -0.052121464, -0.07727695, 0.20109044, -0.29890946) * inp_4_1_0; + result0 += M4(-0.009991341, 0.013138874, -0.112630226, -0.31813458, 0.06638714, -0.022273874, 
-0.07118327, 0.25611976, -0.02931166, -0.047314268, -0.0612468, 0.2157666, -0.015947148, 0.046236917, -0.25237247, -0.019552069) * inp_4_2_0; + result0 += M4(0.11330945, -0.000864947, -0.12717432, 0.18417744, -0.086828135, -0.02315802, -0.028860042, -0.37922463, -0.20862983, -0.05426192, 0.10147666, -0.3109466, -0.061471142, -0.030394116, -0.19532241, -0.20670058) * inp_4_0_1; + result0 += M4(-0.2607493, -0.046044532, -0.24980219, -0.07620337, -0.21202587, 0.039140634, -0.12970094, -0.49645844, 0.21316975, 0.031200308, -0.29867926, 0.1266121, -0.09478635, -0.030060625, -0.092912465, 0.18421893) * inp_4_1_1; + result0 += M4(-0.050291248, -0.077760756, 0.067675576, -0.043119945, 0.05872864, -0.057585012, -0.0858208, 0.10962405, 0.059937954, 0.007578836, -0.2438118, 0.15389061, -0.020469157, 0.087004155, -0.23853436, -0.13583867) * inp_4_2_1; + result0 += M4(-0.020880964, -0.004678778, -0.15380706, 0.028993685, -0.014578469, -0.008724125, 0.038938, -0.05063669, -0.057933625, -0.033926018, 0.09626932, -0.21451063, -0.08264, 0.008077987, -0.043677248, -0.024457106) * inp_4_0_2; + result0 += M4(-0.085743085, -0.009369179, -0.29852355, -0.5998807, -0.0038788326, 0.057073753, -0.0017683671, -0.19511129, 0.051573887, 0.036944892, -0.08212776, 0.13903797, -0.22563867, -0.011816562, 0.11828972, -0.1958442) * inp_4_1_2; + result0 += M4(-0.032265928, -0.07938842, 0.025272928, -0.2576814, 0.013718613, 0.034285318, 0.10671524, 0.030972904, 0.027826209, 0.0003211338, 0.0022470127, 0.19050935, 0.032751035, 0.0523657, -0.19224732, 0.42710903) * inp_4_2_2; + result1 += M4(0.15124603, -0.026941005, -0.44718397, 0.108720444, -0.04649959, -0.0007690393, 0.21924922, 0.14684929, 0.18426548, -0.014624747, 0.00083363935, -0.10960432, 0.013218476, -0.038135085, 0.13330173, -0.059721634) * inp_4_0_0; + result1 += M4(-0.019207804, 0.11822485, -0.6380687, 0.09257789, 0.0023504647, -0.06687477, -0.31443894, 0.01878101, 0.04603227, -0.06783463, -0.0916639, -0.006227829, -0.010663166, 0.15866677, 
-0.04842553, -0.04404028) * inp_4_1_0; + result1 += M4(-8.069056e-05, -0.019805213, -0.2719378, 0.009419326, -0.0063420287, -0.074358396, -0.35171902, -0.03408413, 0.004589689, 0.06414359, 0.07358375, 0.009688882, -0.0017543485, -0.026901478, 0.5281173, 0.006985629) * inp_4_2_0; + result1 += M4(-0.030180238, 0.024072908, -0.58140194, 0.020893931, -0.021975895, -0.05850558, -0.035511117, -0.5192421, -0.020530628, -0.025253527, -0.11308856, 0.15836221, -0.021790039, 0.024110956, -0.15462653, -0.09588735) * inp_4_0_1; + result1 += M4(-0.028668966, -0.07700054, -0.39094114, 0.019754864, 0.026636409, -0.04527157, -0.026282465, -0.08171292, -0.05002831, 0.048063282, -0.15509962, 0.037119415, 0.010990413, -0.033768933, 0.31064925, 0.06266823) * inp_4_1_1; + result1 += M4(0.010557531, 0.06177348, 0.09497353, 0.0057446286, -0.00158716, 0.05495757, -0.08581388, -0.0123871965, -0.010037563, -0.048436042, -0.18572886, -0.035327513, 5.6554294e-05, -0.04835167, -0.6870528, -0.027399777) * inp_4_2_1; + result1 += M4(0.00034220816, -0.011041973, 0.1542877, 0.036416434, -0.013598769, -0.020497307, 0.05451107, 0.042456426, -0.0066677406, -0.005100653, 0.028958762, -0.027084077, 1.0284521e-05, 0.026825996, 0.06796177, -0.11522354) * inp_4_0_2; + result1 += M4(0.012229485, 0.05228846, 0.055574104, 0.036745057, -0.0033466492, 0.03923544, 0.0794358, 0.032911297, -0.0038450863, 0.016761316, 0.020559635, -0.004080305, 0.0026956282, -0.011313599, -0.01703021, 0.0006629756) * inp_4_1_2; + result1 += M4(0.0021817288, 0.0034975926, -0.00988273, 0.0029229533, -0.0015326847, 0.008841427, 0.11833992, 0.009737943, -0.001636571, 0.0012688697, 0.1972416, -0.00500852, 0.006666943, 0.018024994, 0.4365644, 0.04244845) * inp_4_2_2; + result2 += M4(0.070601925, -0.014832522, -0.005291692, -0.012599502, -0.044300884, 0.04914395, 0.001796133, 0.00759639, -0.040950056, -0.045874655, 0.021728046, -0.016460735, -0.046293322, 0.011460647, -0.0027610336, -0.011529388) * inp_4_0_0; + result2 += M4(0.08101221, 
0.040676136, 0.016204886, -0.007073004, 0.13636649, 0.040680025, 0.009403601, 0.019096185, -0.0256713, -0.019710507, -0.029215112, 0.018300094, 0.019002156, -0.038342085, 0.020993775, 0.00044086654) * inp_4_1_0; + result2 += M4(-0.0028851593, -0.009202628, -0.025044741, -0.015088186, -0.058316752, -0.07177227, 0.0020192324, -0.043514576, 0.026148524, -0.02090211, -0.020344133, -0.005242076, -0.0013512422, -0.012045611, -0.0029308465, -0.015209391) * inp_4_2_0; + result2 += M4(-0.028822146, -0.05558955, -0.019578548, -0.030242875, 0.08117146, -0.02399579, 0.042416006, -0.03383768, 0.08046571, -0.03797942, 0.036127154, -0.027143223, 0.034858666, -0.02404033, -0.02131069, -0.007186167) * inp_4_0_1; + result2 += M4(-0.121257596, -0.16235761, -0.064689174, -0.051821593, -0.04864424, 0.087969534, -0.1756449, -0.12571654, 0.012008921, 0.033566337, 0.007650471, 0.051010884, 0.22904405, 0.0012919256, 0.007851234, 0.02917895) * inp_4_1_1; + result2 += M4(0.09072267, 0.020490156, 0.008377944, -0.025208322, -0.032429654, 0.06172293, -0.018755283, 0.011810052, -0.04944588, -0.09504029, 0.035250075, 0.025170475, -0.054515738, 0.011876419, -0.0044741468, 0.02859669) * inp_4_2_1; + result2 += M4(0.0082549965, 0.052110333, 0.010620348, -0.030734533, -0.07222009, -0.026855266, -0.0056354217, 0.017188957, -0.051928584, 0.0043232213, 0.016709872, -0.003846665, 0.03463802, 0.0025464997, -0.004202488, -0.0145620005) * inp_4_0_2; + result2 += M4(0.09782991, -0.081127495, -0.023697635, -0.02887728, -0.008071907, 0.007967479, 0.019351335, -0.05544894, 0.07679484, -0.03592071, -0.010992033, 0.008713708, -0.14171878, 0.026273664, 0.0040301215, -0.009691411) * inp_4_1_2; + result2 += M4(0.015741572, 0.02951323, 0.012329126, -0.012197747, 0.11860267, -0.0010880535, 0.017459186, -0.012477584, -0.019927463, 0.029959552, -0.012756799, 0.0028729404, 0.050521027, 0.029120576, 0.00780705, 0.011151294) * inp_4_2_2; + result3 += M4(0.019585919, -0.017675076, -0.00082494144, 0.00022281577, 0.004518876, 
0.0741858, -0.007993614, 0.015966507, 0.038870357, -0.0060034483, 0.050406333, -0.0021747998, -0.17242897, 0.08241093, -0.002990767, -0.01007886) * inp_4_0_0; + result3 += M4(-0.034971416, 0.020543758, 0.012265966, -0.006595169, 0.034970112, 0.05295805, 0.029638683, -0.022583855, -0.02601401, -0.12975766, 0.014604507, -0.007962972, -0.034181397, -0.0027087794, 0.026609916, -0.0015675776) * inp_4_1_0; + result3 += M4(0.009510334, 0.070280336, -0.02388081, 0.00031435036, 0.05599774, 0.01933175, 0.002184445, 0.019249488, -0.041498672, -0.04365051, 0.0063173906, 0.0034823623, 0.02605108, 0.0018707864, 0.0051907846, -0.004443477) * inp_4_2_0; + result3 += M4(-0.039673332, 0.028356653, -0.004765511, 0.003102143, 0.18238713, -0.0073861033, -0.017427104, -0.032043844, -0.053080082, -0.08592378, 0.019187478, -0.0031024364, 0.112678796, 0.025666485, -0.007565813, -0.0006711753) * inp_4_0_1; + result3 += M4(-0.2100566, 0.054332584, 0.16911295, 0.028797867, -0.22902343, 0.09438615, -0.106923684, -0.012784057, 0.1182429, 0.18395427, 0.017236775, 0.014868723, 0.12947643, -0.13174742, 0.015163319, 0.052961364) * inp_4_1_1; + result3 += M4(-0.095436074, 0.06448746, -0.022598868, -0.020078328, -0.051383484, 0.056716044, 0.038470473, 0.016933812, 0.21265252, 0.03825304, 0.014578858, 0.0066368203, 0.043466188, 0.05020769, -0.0023113098, -0.019127365) * inp_4_2_1; + result3 += M4(-0.19591577, -0.02937765, -0.007567413, 0.003241523, 0.00040428128, -0.0017792569, -0.024028005, 0.033440206, 0.049779184, 0.027317362, 0.00021749092, -0.0050912155, 0.04628823, 0.010364296, -0.003357356, 0.009913488) * inp_4_0_2; + result3 += M4(0.076550364, 0.015933773, -0.019085985, -0.016548207, -0.11369565, 0.05355817, 0.020396193, 0.011267707, -0.010191895, -0.011590965, -0.025692463, -0.04185553, -0.08545018, 0.043549392, -0.018635789, -0.033626337) * inp_4_1_2; + result3 += M4(0.0917065, 0.091621086, -0.052564632, -0.9093429, 0.0137432525, -0.07486207, 0.02412349, -1.3287994, -0.065092415, 
0.025197644, -0.02589547, -0.6003589, -0.038512293, 0.05214821, 0.019990617, -0.4080502) * inp_4_2_2; + result4 += M4(-0.0011065865, 0.004361771, 0.058067102, -0.0003729418, 0.0050898474, 0.022686366, 0.08649572, 0.031093955, 0.0024723646, -0.005907795, -0.14235686, -0.022013307, -0.023272363, 0.00183599, 0.026127363, -0.010689358) * inp_4_0_0; + result4 += M4(0.04011746, 0.040639587, -0.019481385, -0.005606484, 0.016786132, -0.011691512, -0.03276996, 0.07931959, -0.02021918, -0.013474289, 0.015815701, 0.052064817, -0.0019740178, -0.012213153, -0.08325174, -0.001975228) * inp_4_1_0; + result4 += M4(-0.011913236, -0.020632606, 0.07980256, -0.012381817, -0.032859985, -0.04055804, 0.0976651, -0.0015878766, 0.015533325, -0.021102041, -0.015316372, 0.0006883457, -0.0069804657, 0.013606629, 0.03507516, -0.006430682) * inp_4_2_0; + result4 += M4(-0.024898242, -0.02899132, -0.023410093, 0.0018563439, 0.008975198, 0.15583113, 0.019116785, 0.049385443, 0.013085802, -0.029388415, 0.054360867, -0.03041284, -0.020285629, 0.05869668, 0.09120235, -0.029572278) * inp_4_0_1; + result4 += M4(-0.029433373, -0.10438833, -0.11188211, 0.017460383, -0.16285038, 0.11949173, -0.082640246, -0.16122617, 0.02557263, -0.032468136, -0.13243191, 0.16276221, 0.012047499, 0.08136583, -0.041441474, -0.006403048) * inp_4_1_1; + result4 += M4(-0.016160902, 0.0076878215, 0.017508298, 0.0030001504, -0.02734933, 0.0636681, -0.049740307, 0.053536236, 0.044964515, -0.08641628, -0.1166198, 0.032113962, -0.008334231, 0.036778294, 0.013588499, -0.001974873) * inp_4_2_1; + result4 += M4(0.006887317, -0.14054482, 0.028575014, -0.005214252, -0.03997718, -0.12259291, -0.099819064, -0.0063396306, -0.004513895, 0.0403355, -0.056890015, -0.021483857, -0.005824905, 0.06439299, -0.024622729, 0.0014631762) * inp_4_0_2; + result4 += M4(-0.0060670865, -0.06643547, 0.0016586828, 0.017541163, -0.033914223, -0.0095484, 0.0448096, 0.0028355, 0.0041099624, 0.07487003, 0.11122535, -0.013245749, 0.0023274145, 0.14515898, 
0.0026270556, -0.026971022) * inp_4_1_2; + result4 += M4(0.026604306, 0.034865793, 0.07666645, -0.011438582, -0.017533895, -0.052912213, -0.05149498, -0.013888071, 0.0012517864, 0.0499751, 0.015479219, 0.031983975, -0.0035353177, 0.05356372, 0.010568097, -0.0031850094) * inp_4_2_2; + result5 += M4(0.14271596, -0.017759029, 0.032885257, 0.0072756833, 0.23596177, 0.073969685, 0.028536724, 0.08226236, 0.14731658, 0.014973116, -0.21056932, 0.08577863, -0.07515932, -0.031641446, 0.08578241, -0.09723262) * inp_4_0_0; + result5 += M4(-0.02457276, 0.04053715, 0.0422397, -0.059486095, 0.1035117, 0.04473667, 0.10929049, -0.003947403, -0.08261905, -0.08315906, -0.0036764569, -0.06112449, 0.14918959, 0.01950978, 0.051387057, 0.0129363425) * inp_4_1_0; + result5 += M4(-0.018800788, 0.009927671, 0.01894571, 0.01163225, 0.21287952, 0.056717362, -0.03717517, 0.0587995, -0.0045976425, -0.018402318, 0.039512213, -0.08982805, 0.07081415, 0.004064484, 0.0031761164, 0.043164354) * inp_4_2_0; + result5 += M4(-0.05464874, 0.039328545, 0.056838807, -0.05926126, 0.17684151, -0.023561789, -0.060943063, 0.046758395, -0.045146126, -0.07409688, -0.043774106, 0.11160182, 0.13076578, 0.018333199, -0.070689656, -0.012261061) * inp_4_0_1; + result5 += M4(-0.40536138, -0.072739914, -0.15534219, -0.10337857, -0.24237475, -0.53582096, -0.108108126, -0.042470045, -0.20948479, 0.15080559, 0.25295603, -0.07247551, 0.012296087, -0.051865015, -0.06819402, 0.05164876) * inp_4_1_1; + result5 += M4(-0.0034712544, -0.022865832, -0.107938655, 0.011823184, -0.031241452, -0.04384156, 0.038186125, 0.1271688, -0.048578527, -0.013269044, 0.08416805, -0.044156726, 0.010347561, -0.036402013, -0.031786133, 0.10860822) * inp_4_2_1; + result5 += M4(-0.049830165, -0.05659381, -0.009732374, -0.051384013, -0.15868908, 0.09233686, 0.13370122, -0.024779513, -0.15767068, 0.028253611, 0.08171342, -0.03374992, 0.09184247, 0.0053282995, 0.0074592573, 0.003335011) * inp_4_0_2; + result5 += M4(-0.31770813, 0.027316336, 0.01642844, 
-0.0131445695, -0.03087505, 0.022081072, -0.00059224037, -0.008582735, 0.19334872, -0.048972342, -0.055213604, -0.007374455, 0.18206303, -0.0074423095, 0.001091665, 0.08408393) * inp_4_1_2; + result5 += M4(0.14494145, 0.043378375, -0.024161316, 0.0068140607, 0.008322008, -0.021887975, 0.03614526, -0.007394633, -0.08547806, -0.00643793, -0.034237247, -0.060413282, -0.11980462, 0.035390332, 0.097667545, 0.03212041) * inp_4_2_2; + result6 += M4(-0.36189663, 0.020741109, -0.014227836, 0.010552417, -0.23210502, 0.101755366, 0.060653634, 0.13818975, -0.120628394, -0.07889201, 0.044530567, 0.17194629, -0.06381627, 0.018349336, 0.015036086, -0.06712973) * inp_4_0_0; + result6 += M4(-0.10304263, 0.016445968, 0.051030986, 0.011352426, -0.1495902, 0.0075346404, 0.041121878, 0.17279992, -0.35058084, -0.06449225, 0.050316013, -0.12074753, -0.090388566, 0.06928403, 0.05244845, -0.04504952) * inp_4_1_0; + result6 += M4(-0.064742975, -0.022371136, -0.0019048752, -0.011422433, 0.2685091, 0.11239129, -0.0012263199, -0.096080035, 0.08487421, 0.0067672306, 0.063248284, 0.10481587, 0.031244673, -0.025100319, 0.013568226, 0.052519444) * inp_4_2_0; + result6 += M4(-0.19833754, -0.11054866, 0.01805616, 0.07009402, -0.2596385, 0.103656076, 0.026423646, -0.04476002, -0.4312731, 0.0871887, -0.0054558194, 0.060997717, -0.21627232, 0.073644586, 0.028389607, -0.04079153) * inp_4_0_1; + result6 += M4(0.085182294, -0.30439737, -0.05885439, -0.115479745, 0.023302298, -0.3353974, -0.0673425, 0.08140151, -0.26428482, 0.13782765, 0.035738807, -0.117511995, 0.12126562, 0.029603243, -0.0040487326, 0.009205216) * inp_4_1_1; + result6 += M4(0.041155897, 0.043152735, 0.015883105, -0.07004022, -0.0032382738, -0.018978892, -0.075261064, -0.0042700446, -0.041074894, -0.040481932, -0.060322165, 0.09335181, -0.059867248, -0.0149408, 0.009428354, 0.07734847) * inp_4_2_1; + result6 += M4(-0.54041266, 0.03653768, 0.0076536164, 0.015833791, -0.17396416, 0.0007066151, 0.002655451, -0.091494955, 0.029475072, 
-0.028643942, -0.007456634, -0.026160534, 0.16250062, -0.010053017, -0.011650024, 0.031500697) * inp_4_0_2; + result6 += M4(0.06665518, 0.00027555425, 0.0036541973, -0.024381254, 0.12066567, 0.034838542, -0.0047756876, 0.04162213, -0.020100128, -0.001990978, -0.030474715, -0.0056014247, -0.5193268, 0.027919956, -0.0056259134, -0.047425497) * inp_4_1_2; + result6 += M4(-0.12569065, 0.025217315, -0.009073684, 0.01433599, 0.15018259, -0.036545917, 0.016683564, -0.013200186, -0.050798338, 0.031369623, -0.023354547, 0.009630601, 0.30341607, 0.121258266, 0.0074613863, 0.02719777) * inp_4_2_2; + result7 += M4(0.00057596446, 0.00820698, -0.15671416, 0.016200595, -0.037705947, -0.018765997, 0.1655083, 0.049910277, -0.004273615, -0.022224553, 0.01136582, -0.00095973356, 0.003227117, 0.07895224, 0.19962539, 0.0666221) * inp_4_0_0; + result7 += M4(-0.024428371, 0.025500804, -0.08464559, 0.0063669137, -0.029393317, -0.070365734, -0.08556919, -0.040882237, 0.032301337, -0.07898201, -0.19100904, 0.08218557, 0.0061767763, 0.032722086, 0.05010724, -0.050281312) * inp_4_1_0; + result7 += M4(-0.0108663505, -0.050716337, -0.15298451, -0.048775706, -0.0028181237, 0.039387777, -0.04269699, -0.005725893, -0.015829941, -0.0073935734, -0.11688312, 0.04211434, -0.008078509, -0.0011058762, 0.106737435, -0.026486738) * inp_4_2_0; + result7 += M4(-0.03920596, -0.006681461, -0.24516189, -0.10796381, -0.023149999, -0.022254908, -0.024199646, -0.0062088277, 0.04342773, -0.0017690136, -0.04399842, -0.012637119, -0.009597771, -0.0024834601, -0.42737588, 0.021605711) * inp_4_0_1; + result7 += M4(-0.029350376, -0.102734536, -0.52108145, -0.12297046, -0.027304547, -0.07347977, -0.36036336, -0.091495484, -0.0023731436, 0.105059125, -0.07063477, -0.004721114, 0.016149826, -0.0066922433, 0.3405859, 0.03783498) * inp_4_1_1; + result7 += M4(-0.0052855504, -0.040714275, -0.04350332, -0.030558262, -0.011317641, -0.06827948, -0.22080219, -0.056677774, -0.00026092274, 0.03296498, 0.12431698, 0.01775296, 
-0.008008691, -0.08919731, -0.2718084, 0.07866052) * inp_4_2_1; + result7 += M4(-0.007421864, 0.045899726, -0.25079954, 0.03904733, -0.04154342, -0.035786167, 0.07493005, -0.050995097, 0.026313728, -0.027238062, -0.0012218172, -0.00172147, -0.0013928516, 0.021201873, 0.13946052, 0.012338421) * inp_4_0_2; + result7 += M4(-0.009875562, -0.07234777, -0.31468564, 0.026008982, -0.005563818, 0.04609909, 0.17156258, 0.11807239, 0.012193787, 0.0075681983, 0.13915597, -0.037645176, 0.005634749, 0.0012593336, -0.06909221, 0.05869621) * inp_4_1_2; + result7 += M4(-0.00084139843, -0.006233557, 0.03237075, -0.0034765676, -0.0046846424, 0.0004515443, 0.08111396, -0.011091206, 0.009850372, 0.030282846, 0.16435917, 0.014978042, -0.014760738, 0.12110702, 0.3880304, 0.0436076) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.07483121, 0.047063787, 0.07374778, 0.31769532, 0.017322259, 0.008300764, 0.059722487, -0.0025180755, -0.094267584, 0.0141164465, -0.010330118, -0.021610612, 0.15163203, 0.053797286, -0.22308366, 0.062314536) * inp_5_0_0; + result0 += M4(-0.24144739, -0.037539218, -0.28955126, -1.1868873, -0.036552146, -0.016526535, 0.11408427, -0.50982016, 0.1300695, 0.053468116, 0.043524645, -0.11903253, -0.28910205, -0.16227607, -0.027681645, -0.62036866) * inp_5_1_0; + result0 += M4(-0.03789409, 0.020600036, 0.011660592, -0.29614636, 0.043089446, -0.034586933, -0.097780585, 0.23817936, -0.07334253, 0.0571398, 0.208584, 0.2629321, 
0.05254382, 0.09973011, -0.01220805, -0.08827702) * inp_5_2_0; + result0 += M4(-0.05097586, -0.017860867, 0.07355176, -0.16677943, 0.04545738, -0.003149086, 0.08122203, -0.10491879, -0.06999885, 0.004541706, 0.051017024, -0.15920131, 0.14594613, 0.013507741, -0.12961464, -0.042316604) * inp_5_0_1; + result0 += M4(-0.11246478, 0.03173381, -0.22669828, -0.016215464, -0.17379439, -0.07468649, -0.07726293, 0.2067122, 0.2093439, 0.05112315, -0.22271189, 0.1031352, -0.18271585, -0.039410837, -0.17504399, -0.78678143) * inp_5_1_1; + result0 += M4(-0.0321244, -0.0672973, 0.09822254, -0.046086065, 0.040323, 0.10398941, -0.02657579, -0.059235204, 0.042367738, 0.0018331892, 0.078710906, -0.22649765, 0.07910405, -0.04926818, 0.0012930505, 0.037007578) * inp_5_2_1; + result0 += M4(-0.06530553, -0.051296435, 0.349298, -0.22925952, 0.109149985, 0.08928391, -0.030218372, 0.18349427, -0.060022093, -0.0010489912, 0.018047197, 0.018946774, -0.14357865, -0.037310254, 0.11176737, -0.31042525) * inp_5_0_2; + result0 += M4(0.24375601, 0.04076074, -0.07613952, 0.57086706, -0.04037201, -0.11891336, 0.06262244, -0.38928714, 0.054227084, 0.01660341, 0.055232767, 0.04315458, -0.25590885, 0.06128791, -0.2928808, -0.5484102) * inp_5_1_2; + result0 += M4(-0.049694087, 0.08271336, 0.02442945, 0.2990378, 0.030164765, 0.024244657, 0.08696084, 0.008612266, -0.0762842, -0.105493106, -0.13255173, 0.23666973, -0.22727323, -0.15232511, 0.15621027, -0.49899757) * inp_5_2_2; + result1 += M4(0.039408907, 0.011309981, -0.08761814, 0.08737932, 0.002707166, 0.053742293, -0.7015076, -0.017557265, 0.07054905, -0.031967565, 0.30991855, 0.053515386, -0.05051318, -0.08796035, -0.2127413, -0.06747065) * inp_5_0_0; + result1 += M4(0.031378802, -0.103843145, -0.15135477, -0.114012085, 0.018722687, -0.09269623, 0.42554364, 0.046855096, 0.07807347, -0.026045365, 0.28931096, -0.07932266, 0.04734616, 0.023661686, -0.95422095, 0.055896934) * inp_5_1_0; + result1 += M4(0.00069976103, 0.008312606, -0.32054356, 0.0007041386, 
-0.0036291934, 0.009521557, -0.570368, -0.020225605, 0.0057637296, 0.12193305, 0.44359246, -0.014770922, 0.013533181, -0.0674555, -0.5718742, -0.0050457306) * inp_5_2_0; + result1 += M4(-0.02727696, 0.02091126, 0.19075912, -0.122085184, 0.020038225, -0.0011693131, 0.52832747, 0.031853452, -0.060993228, 0.0073539866, 0.024202116, 0.10486712, 0.060815107, 0.00082101946, -0.3257364, -0.5935856) * inp_5_0_1; + result1 += M4(0.0070991274, -0.118046306, -0.12676442, -0.017629202, 0.0031608117, 0.0066243596, 0.06206153, -0.0635002, 0.02966587, 0.05849763, 0.020881008, 0.12050715, -0.018091852, -0.042970482, 0.07730558, -0.11283092) * inp_5_1_1; + result1 += M4(-0.0010705901, -0.044887718, -0.2883397, 0.014177124, 0.007165047, 0.009177472, 0.035292387, 0.03229695, -0.0025869021, -0.040337905, -0.22766824, 0.015610324, 0.012554573, 0.07323866, 0.11702241, 0.024119506) * inp_5_2_1; + result1 += M4(-0.022569923, -0.023828449, 0.1488533, -0.0145759145, 0.010793525, 0.021326512, -0.6625454, 0.00085745216, -0.014903852, 0.009162843, -0.054173853, 0.018812409, -0.001955668, -0.012775812, 0.109919876, -0.03071185) * inp_5_0_2; + result1 += M4(-0.004134229, -0.010984694, 0.124786034, -0.038324945, 0.0007969303, -0.041152276, -0.004313858, 0.008114088, 0.015886864, 0.0022939704, -0.11069539, -0.10324996, -0.0030892212, 0.04267562, 0.0885597, -0.052302524) * inp_5_1_2; + result1 += M4(0.0008170753, 0.013301961, 0.1815448, -0.009439186, 0.0025459235, 0.026232528, 0.0009007796, -0.02355336, 0.002972475, -0.001600558, -0.12072551, 0.015272286, -0.004272006, -0.027098453, -0.16730817, -0.0022291455) * inp_5_2_2; + result2 += M4(0.026221612, -0.013690791, -0.0028586744, 0.0060761203, -0.020195171, -0.0972889, 0.00020876035, 0.009973064, 0.036941737, 0.0085559245, 0.016834864, -0.038576897, -0.10711522, 0.055938907, -0.003758021, -0.012083382) * inp_5_0_0; + result2 += M4(-0.019417172, -0.03460168, 0.01933901, -0.043690868, -0.0017395314, -0.03332913, -0.009036095, -0.03565724, 0.07578074, 
-0.13275795, 0.04249325, -0.049465336, 0.090170085, 0.025203452, 0.000101406884, 0.0139736) * inp_5_1_0; + result2 += M4(-0.13325179, 0.0092983665, 0.0081002405, 0.006359305, -0.01956364, 0.0106262565, -0.040832117, 0.030771626, 0.0062237135, 0.052257292, 0.06670754, -0.027994005, -0.034620192, 0.0069601703, 0.0034000545, 0.0005790582) * inp_5_2_0; + result2 += M4(0.038719837, -0.021463823, 0.02023773, 0.068525136, 0.080091126, 0.010453173, -0.013497189, 0.01132102, 0.009695962, -0.03451035, 0.0064998274, -0.05360003, 0.005831024, -0.033574637, 0.03356129, 0.019509813) * inp_5_0_1; + result2 += M4(-0.10125573, -0.03178281, 0.086591385, -0.06538841, -0.046868883, -0.38974422, 0.038706817, -0.051259045, -0.051737573, 0.15911302, -0.057974786, -0.028165305, -0.29169866, -0.07587525, 0.009294523, -0.030461896) * inp_5_1_1; + result2 += M4(0.023917248, -0.010737714, 0.013295185, 0.02375338, 0.034284353, 0.0052084625, -0.011358086, 0.00750003, 0.09136356, -0.20336387, 0.3035513, -0.12645239, 0.072611086, 0.030561982, 0.006377861, -0.033868592) * inp_5_2_1; + result2 += M4(-0.049503963, 0.055452026, 0.009027011, -0.044692382, 0.027284004, -0.19287783, -0.0628574, 0.0026560517, -0.004082762, -0.011418342, 0.005354789, 0.01666234, -0.0017665984, 0.059133336, 0.038757626, -0.010006088) * inp_5_0_2; + result2 += M4(-0.054397367, 0.05084847, 0.093563974, 0.009561407, -0.09071541, -0.026214551, -0.0068408316, 0.0026650713, 0.03041869, -0.009229575, -0.057778046, -0.049414687, 0.074949786, 0.0046772384, -0.010191719, 0.023153663) * inp_5_1_2; + result2 += M4(-0.026934631, -0.029390255, -0.019467328, 0.011385554, -0.000815343, -0.018501997, -0.004726863, -0.014090242, -0.057662483, 0.08498014, 0.082734406, -0.08189864, -0.0068748365, 0.022185318, -0.00964068, 0.0011388641) * inp_5_2_2; + result3 += M4(-0.01138743, -0.020006236, -0.02838959, -0.0027390516, -0.058288656, -0.006424417, 0.011350733, -0.00018796478, -0.0984927, 0.0073165186, 0.009947041, -0.0066732503, -0.26125643, 
0.04552679, -0.054414567, 0.009297777) * inp_5_0_0; + result3 += M4(0.0052165827, 0.066149496, -0.059447166, 0.01662117, 0.18608935, 0.03846452, -0.0023011437, 0.006444358, -0.16029942, -0.047585644, 0.022039922, 0.019156447, 0.07772752, 0.09511228, 0.0110934945, -0.0030902703) * inp_5_1_0; + result3 += M4(0.050554793, 0.0062975604, -0.010809019, -0.01587796, 0.09426445, -0.015036171, 0.021018952, 0.0034158174, -0.024776539, 0.02703288, 0.0006708393, -0.015684862, 0.06405421, -0.030658672, -0.0019640136, 0.0006359808) * inp_5_2_0; + result3 += M4(0.082843624, -0.0058466373, -0.0001927569, -0.0054505523, -0.036168188, -0.06406799, -0.014195686, 0.0041891257, 0.034694634, -0.019641217, -0.013024316, 0.032979004, 0.15279615, 0.008255314, 0.02779349, -0.0034597116) * inp_5_0_1; + result3 += M4(-0.17692919, -0.089195535, -0.05977019, 0.033673696, -0.3156338, -0.030655265, 0.0041716495, 0.003762428, 0.26595598, 0.2034683, 0.020819688, 0.12479038, -0.18631695, -0.24201138, -0.003909684, -0.0052289786) * inp_5_1_1; + result3 += M4(-0.02077353, -0.097781494, 0.01233942, 0.023903158, -0.014568144, -0.007301065, 0.022682862, -0.01391774, 0.08644398, -0.054097548, -0.117955364, 0.24956807, -0.14174971, 0.12832682, 0.043740183, -0.011534949) * inp_5_2_1; + result3 += M4(-0.042752188, -0.0053177867, 0.054738652, -0.024831854, 0.16105731, 0.04903369, -0.010821958, -0.012044306, 0.0356995, 0.013791298, -0.0075505297, -0.00804303, -0.064347796, 0.01142062, 0.030802218, 0.008763939) * inp_5_0_2; + result3 += M4(-0.16015866, 0.022330351, 0.13681799, -0.062638275, 0.1055862, 0.027915165, 0.01229335, 0.026821595, -0.13360634, -0.0104192, 0.0005295131, -0.03985375, -0.101275936, 0.11623205, 0.08874695, -0.031169536) * inp_5_1_2; + result3 += M4(-0.10026812, -0.021585241, 0.0698658, -0.26119703, -0.02041572, -0.028592126, 0.0025204902, -0.86565274, -0.038617194, -0.0017866961, -0.016586272, 0.1369089, 0.15430436, -0.09243481, -0.05501641, -1.0170106) * inp_5_2_2; + result4 += 
M4(-0.00046180302, -0.016193122, -0.04214098, 0.021198846, -0.009012628, 0.008982511, -0.10128469, 0.013775624, -0.0377402, -0.028123314, 0.0034520095, -0.017229725, -0.061591353, 0.011617439, 0.0051412303, -0.014545118) * inp_5_0_0; + result4 += M4(-0.046234526, 0.061278384, -0.0701329, -0.055992045, 0.0133969225, -0.061173655, -0.16218357, 0.013087903, -0.05969246, -0.036829423, -0.000682327, 0.20933838, 0.03487913, 0.020396423, 0.04309976, -0.045642234) * inp_5_1_0; + result4 += M4(-0.00846842, 0.011618203, -0.029997766, -0.03157264, 0.0127973305, -0.053822458, -0.045769673, -0.002580632, 0.0068292916, 0.034586877, -0.0641841, 0.0068810177, -0.0025419085, 0.007145983, 0.029469332, 0.001459382) * inp_5_2_0; + result4 += M4(0.045662917, 0.06437083, -0.015806442, 0.037452206, 0.0046498333, -0.024642916, -0.2477687, -0.026788803, -0.01928559, 0.07023465, 0.0057724235, 0.023370357, 0.053570773, 0.0042258054, 0.016674742, -0.022389535) * inp_5_0_1; + result4 += M4(0.03662519, 0.025690917, -0.046904974, -0.026372867, 0.011431667, 0.033790786, -0.17635894, -0.0023115175, -0.13661973, 0.2529538, 0.09977758, -0.108515956, -0.0014443756, 0.017618539, 0.002556921, -0.006504148) * inp_5_1_1; + result4 += M4(0.040658694, -0.001910411, 0.06833234, 0.012209252, -0.016579024, 0.08395572, -0.20233363, 0.020153467, 0.19210419, -0.05882498, -0.035512786, -0.01936435, 0.005268984, 0.009647608, -0.009203391, -0.027216494) * inp_5_2_1; + result4 += M4(0.010460851, 0.1278093, -0.025103651, 0.026261805, -0.006562681, 0.0419387, -0.1941597, 0.021188475, 0.0030412704, 0.054412894, -0.06324457, -0.020397758, -0.011186675, 0.0010607947, -0.02191576, -0.002746275) * inp_5_0_2; + result4 += M4(0.010770182, 0.11662795, -0.03307867, 0.0707133, 0.0062796585, -0.10396597, -0.0043355864, -0.011910805, -0.042159002, -0.07722447, -0.0022672373, -0.011503746, -0.022136046, -0.22918393, 0.031220835, -0.047974706) * inp_5_1_2; + result4 += M4(-0.064475425, 0.06700181, 0.00033355327, -0.03881661, 
0.010458988, 0.007195441, -0.049511086, 0.010732126, 0.09039737, -0.013024988, 0.00033459542, 0.01940788, 0.023288997, 0.0010807625, 0.042632915, -0.061170507) * inp_5_2_2; + result5 += M4(-0.34010622, -0.050208513, 0.12984185, -0.12801993, -0.059924997, 0.009232815, 0.053447627, -0.03466389, -0.13563374, -0.05613264, 0.02635468, 0.12122156, -0.44967335, -0.034657534, 0.069062315, -0.24278118) * inp_5_0_0; + result5 += M4(-0.024168227, 0.035439927, -0.21634299, 0.0015464671, 0.10643957, -0.26159284, -0.26025757, 0.051730163, 0.113262355, 0.052747175, -0.008385651, 0.04134606, 0.10007507, 0.07138188, -0.08615962, 0.06716338) * inp_5_1_0; + result5 += M4(-0.090735234, 0.002162947, 0.012358903, 0.045510314, -0.16824563, -0.114109926, 0.03124729, 0.03342145, -0.15391634, -0.021493945, 0.14154111, -0.09149245, 0.10135065, -0.01751155, 0.0073357457, 0.071516074) * inp_5_2_0; + result5 += M4(0.08391129, 0.044084772, -0.12922052, 0.096335925, -0.203127, -0.17005804, 0.012851081, -0.09809622, -0.08306311, 0.012551611, -0.012054054, 0.060885694, -0.06660338, 0.06956777, -0.054405212, -0.04080556) * inp_5_0_1; + result5 += M4(0.0553979, -0.18571101, -0.25444478, 0.061466966, -0.012718775, -0.101259165, -0.12592496, -0.03926893, 0.07621921, -0.12686317, 0.031390358, -0.005295218, -0.257335, -0.012894264, -0.2587087, -0.022324631) * inp_5_1_1; + result5 += M4(0.042152084, 0.0035049655, -0.054234825, 0.003745356, -0.16814667, -0.17852442, 0.016048001, 0.05099118, 0.056833014, 0.044886924, -0.018665008, -0.1423507, -0.0842296, 0.058836102, 0.1297667, -0.05923727) * inp_5_2_1; + result5 += M4(0.09534519, -0.059014343, -0.06742045, 0.0855816, -0.15113333, -0.09430361, 0.003787114, 0.05077557, 0.02708173, -0.008606664, 0.007463053, 0.014316801, 0.017279487, -0.042298485, -0.018940696, 0.023345977) * inp_5_0_2; + result5 += M4(0.22404572, 0.0042623365, 0.17759202, 0.062343325, 0.14542598, -0.07219359, -0.07012087, -0.032649912, 0.09314505, 0.1145661, 0.10668438, -0.03479758, 
-0.31248543, 0.0609933, 0.046848066, -0.07604761) * inp_5_1_2; + result5 += M4(-0.05552681, 0.047586277, 0.14445384, 0.04939336, -0.3417242, 0.050764516, -0.07891634, -0.01659901, -0.09508644, -0.07485686, -0.041391358, -0.056875456, 0.18324311, -0.05309739, -0.20276046, -0.0038453958) * inp_5_2_2; + result6 += M4(-0.43465915, 0.066311434, -0.02448939, -0.07710466, 0.069238074, -0.0017666236, -0.0109219495, -0.05104662, 0.08460043, 0.05343665, 0.010880282, -0.015643943, -0.45058006, 0.137677, -0.06061439, -0.08240984) * inp_5_0_0; + result6 += M4(-0.1015192, -0.07764643, -0.19970131, -0.07513604, -0.52606064, -0.16571827, -0.02529136, 0.048174836, -0.0050692116, 0.09795422, -0.003961023, 0.04816874, 0.032598272, -0.050344173, -0.018449953, -0.07303806) * inp_5_1_0; + result6 += M4(0.010268895, 0.016190592, -0.07245638, -0.099899836, 0.35320166, -0.07290188, 0.04110496, -0.055162027, -0.06049851, 0.0039485963, 0.027686737, -0.051116787, -0.0037235906, -0.029232757, 0.0018759675, 0.10575665) * inp_5_2_0; + result6 += M4(0.034075093, -0.057320252, -0.019969082, 0.03351689, -0.34619695, 0.13294634, 0.034058455, 0.01375284, -0.089123264, 0.051564164, -0.047974393, 0.012478401, -0.634654, -0.14120638, -0.02404604, 0.09954053) * inp_5_0_1; + result6 += M4(0.066299535, -0.08180153, -0.13489084, 0.13285111, 0.18003917, 0.18036184, -0.021227892, -0.057879, -0.0069515808, 0.003557019, -0.034047384, -0.022737062, -0.013421484, -0.15962498, -0.004261226, 0.055825233) * inp_5_1_1; + result6 += M4(0.10263027, -0.006790574, -0.037699178, 0.01765225, 0.029452002, 0.055822473, -0.010352509, 0.028900946, 0.032231413, 0.064724624, -0.059510604, -0.093398765, 0.033752806, 0.20656876, -0.0011954533, -0.17618215) * inp_5_2_1; + result6 += M4(0.29551166, 0.049993046, 0.015853599, -0.028993756, 0.2136953, -0.11408323, -0.015325497, 0.026346995, 0.07833931, -0.028349303, -0.010778066, -0.027874222, -0.57900894, 0.013222003, -0.005511304, 0.034613047) * inp_5_0_2; + result6 += 
M4(-0.03403526, 0.100832775, -0.018452095, 0.12351465, -0.118823156, -0.13342337, 0.0075422493, -0.024242288, 0.030941337, 0.043606926, 0.015011621, 0.041843265, 0.025949888, 0.078992724, -0.005989606, 0.038938757) * inp_5_1_2; + result6 += M4(0.063024774, 0.024168994, -0.014206519, 0.026095923, -0.13201635, 0.08593809, 0.015810627, 0.004019612, -0.010463751, -0.041695844, -0.00026350084, 0.030784179, 0.017668728, -0.22507419, -0.01906102, -0.068198696) * inp_5_2_2; + result7 += M4(-0.030755898, -0.021939723, 0.038514294, -0.012435489, -0.00035072534, 0.010223821, -0.276949, 0.026185542, 0.043994617, 0.0005854587, 0.044658076, 0.040134452, -0.013960766, 0.077154845, 0.33035004, -0.01699112) * inp_5_0_0; + result7 += M4(0.0037870558, 0.060576808, -0.11033274, -0.10536779, 0.0069959355, -0.06730829, 0.034311775, 0.0784653, 0.08492847, 0.09449308, 0.2120786, -0.0223666, 0.00026424773, 0.08239599, 0.032526847, -0.13654903) * inp_5_1_0; + result7 += M4(0.009892634, -0.03100528, 0.05408845, -0.060207017, -0.018686958, -0.03704682, -0.44232005, -0.06998197, -0.02772952, 0.11526324, 0.2579473, -0.016176077, -0.00073412806, -0.031965405, -0.022278674, 0.040883616) * inp_5_2_0; + result7 += M4(-0.03608727, 0.015700052, 0.041335873, 0.03863478, -0.0144856125, 0.06313405, 0.24218546, -0.07658271, -0.014746704, 0.05725393, 0.29396272, -0.019632459, -0.032947984, -0.07185171, -0.5096812, -0.06523113) * inp_5_0_1; + result7 += M4(-0.018811163, 0.07612921, -0.026718883, -0.005369504, -0.015152133, 0.092503846, -0.29812264, 0.021017868, 0.233852, 0.07419989, -0.05219466, -0.024814952, 0.050316833, -0.12389305, -0.59454477, 0.0035371205) * inp_5_1_1; + result7 += M4(0.01573445, 0.02081198, -0.31803352, 0.048742726, -0.010373865, 0.045333374, 0.41793144, 0.093884975, -0.0049903016, 0.00900994, -0.0120234545, -0.008116833, 0.0063830027, -0.053449664, -0.02187606, 0.029403567) * inp_5_2_1; + result7 += M4(0.04181186, 0.000555606, 0.081792146, 0.04973729, 0.008407554, -0.046391103, 
-0.3928514, 0.07345774, -0.0028344628, -0.03487235, -0.08662981, -0.0411111, 0.023571722, 0.0068826447, 0.12858525, 0.066894904) * inp_5_0_2; + result7 += M4(-0.00012077134, 0.08640638, 0.1581722, 0.09099293, 0.013253489, -0.059615664, 0.05376947, -0.052911837, -0.0055005294, -0.0047757532, -0.069641255, 0.015263207, -0.017336125, -0.031187296, -0.15659216, -0.030545805) * inp_5_1_2; + result7 += M4(-0.013796228, 0.023354108, 0.114026226, 0.07178701, 0.00032975187, -0.025668027, -0.24524234, -0.021683352, -0.01659007, -0.06278088, 0.11503196, -0.0047270297, 0.0045957407, -0.10662955, -0.505408, -0.03485205) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.012290762, -0.010053031, -0.032378945, -0.08613342, -0.098046206, 0.040757682, 0.036342233, 0.4393168, -0.046016797, -0.0047643674, 0.0370266, 0.08644782, -0.10049338, 0.0038530978, 0.10289342, -0.13248965) * inp_6_0_0; + result0 += M4(0.0803184, 0.01775443, 0.12549195, 0.34465283, -0.020942826, -0.0074712127, -0.06487096, -0.25220165, 0.05847885, 0.023682216, 0.04019802, 0.23486874, -0.013487799, 0.0042855814, -0.16916147, -0.07776904) * inp_6_1_0; + result0 += M4(-0.01399247, 0.041809272, 0.0950955, -0.22938721, 0.010836741, 0.010237072, -0.14352037, 0.1642172, 0.016975148, 0.006265733, 0.05321698, 0.10213412, 0.06258716, 0.03063673, -0.090734646, 0.1457925) * inp_6_2_0; + result0 += M4(-0.019648109, -0.032363757, 0.009823622, -0.21900116, 0.14913297, 0.07926251, 
-0.13882445, -0.02467147, -0.040639803, -2.607454e-05, 0.080853544, -0.22016479, 0.03723048, 0.05562028, -0.0099998005, -0.13743635) * inp_6_0_1; + result0 += M4(0.03763351, -0.026733967, 0.09021638, -0.09725332, -0.03686128, -0.029778557, 0.15336901, 0.020229915, 0.060311295, 0.029001787, 0.10862779, 0.072356075, -0.2007617, -0.05471788, 0.0138984565, -0.33671153) * inp_6_1_1; + result0 += M4(-0.06649737, 0.02575787, -0.086657725, -0.20614621, 0.01551639, 0.14066792, -0.020360691, -0.11477864, 0.063313946, 0.013270628, -0.044209633, 0.15595552, 0.0010065356, -0.055630334, 0.06965064, -0.223778) * inp_6_2_1; + result0 += M4(-0.031712368, -0.021703426, 0.085570835, -0.025286496, 0.08787542, 0.03360042, -0.059270322, 0.05363371, 0.011414699, -0.0061137243, 0.06451853, 0.022097034, -0.03029425, -0.012400635, -0.043233823, -0.28318608) * inp_6_0_2; + result0 += M4(0.0887435, 0.03652525, 0.007045802, 0.113466926, -0.047390904, -0.006552142, -0.088271536, 0.061387442, 0.026920004, 0.012497754, 0.2254657, 0.046307944, 0.116138816, 0.025254533, 0.028496742, 0.04026703) * inp_6_1_2; + result0 += M4(0.03639295, -0.03338543, -0.08666184, -0.087324515, -0.0041676005, 0.08516525, 0.007905901, 0.021504058, 0.0005966164, -0.0026157368, -0.011342891, 0.10182345, -0.0011176856, 0.0018130606, -0.069616534, -0.18670318) * inp_6_2_2; + result1 += M4(0.100001834, -0.006519762, 0.07589816, -0.11294678, 0.044229187, -0.024166575, 0.02982691, -0.060127553, 0.010498526, 0.032989927, 0.17482181, 0.085258104, -0.34368977, -0.046102345, -0.1365521, -0.057034872) * inp_6_0_0; + result1 += M4(0.01206724, 0.03499608, 0.16093054, 0.03987434, -0.013091575, -0.003260499, 0.075450376, -0.026234658, -0.032683376, 0.010502234, 0.08847771, 0.06372449, -0.0024679932, -0.07441292, -0.28673452, 0.052531466) * inp_6_1_0; + result1 += M4(0.010136031, 0.0957933, -0.20584726, 0.0069709127, 0.0023896818, -0.06617853, -0.21756458, -0.028527215, -0.0025085746, 0.02563822, 0.28665373, -0.010468878, 0.012637448, 
0.10443899, -0.0858207, 0.023251882) * inp_6_2_0; + result1 += M4(0.019162724, 0.03299633, 0.013900696, 0.3516158, 0.023411278, -0.044480763, 0.28763214, -0.03576606, -0.00919052, 0.036876984, 0.21241572, 0.058828715, -0.02252239, -0.004954775, -0.28044826, 0.108627886) * inp_6_0_1; + result1 += M4(-0.019738609, 0.09996027, -0.0413891, 0.08595848, -0.031432908, 0.04353436, 0.1595374, -0.114975184, 0.002785995, 0.039563313, 0.0034207527, 0.07813128, -0.015060294, 0.0969083, -0.07275742, -0.016173167) * inp_6_1_1; + result1 += M4(-0.0030980157, -0.050007373, -0.18056257, -0.008054277, -0.0015756225, -0.030089825, -0.14030725, -0.0002668069, 0.0039725634, -0.040632382, 0.031075573, 0.012893956, 0.0086110765, -0.06745182, -0.02574941, 0.00095321116) * inp_6_2_1; + result1 += M4(0.011731451, 0.0041523157, -0.124596514, -0.012349384, -0.0033603935, 0.013695187, -0.17548637, 0.014456587, 0.0097641805, 0.017610345, -0.0097866515, -0.002009524, 0.008148355, 0.012609436, 0.051821902, -0.10949161) * inp_6_0_2; + result1 += M4(-0.004787002, -0.01813831, -0.18435764, -0.056968693, 0.0019371605, -0.002547363, -0.20857944, 0.007997553, 0.0027675754, -0.024794357, 0.034495614, -0.04346862, 0.0034796915, -0.027214106, -0.059915133, 0.0292613) * inp_6_1_2; + result1 += M4(-0.0040159975, 0.009954769, -0.070228115, 0.0014976826, 0.0010554566, -0.01798106, -0.21380241, 0.0025268234, -0.00070417614, 0.015525404, 0.036712047, -0.0075945575, 0.0114459805, 0.00860251, 0.050212942, -0.026906004) * inp_6_2_2; + result2 += M4(-0.092685185, -0.039013248, -0.013217567, -0.009867702, 0.003679367, 0.019260691, -0.019046895, -0.000601842, 0.022774309, 0.055644892, -0.0049583134, -0.0034553488, -0.011735758, 0.02748048, 0.0035462806, 0.009289952) * inp_6_0_0; + result2 += M4(0.09151108, 0.05190418, -0.030876456, 0.05175798, -0.02009278, -0.02745277, -0.007867276, 0.02528181, 0.08029572, 0.013853951, 0.0077539766, -0.019678896, -0.14478916, -0.026613189, 0.05431084, -0.048460603) * inp_6_1_0; + 
result2 += M4(0.035539925, -0.004509729, 0.002448754, -0.00057535974, -0.1314407, -0.060086925, -0.020494446, -0.0050920397, 0.056524396, 0.017356997, 0.002764267, 0.015292765, 0.044016533, -0.021364672, -0.0052023907, -0.0015153401) * inp_6_2_0; + result2 += M4(0.12168915, 0.028832044, 0.046577733, -0.031671304, -0.029417643, 0.023893273, -0.008737942, 0.056590546, 0.05011546, 0.03288956, 0.011564713, 0.005065656, -0.10162401, -0.024793735, -0.06287232, 0.062156882) * inp_6_0_1; + result2 += M4(-0.066770285, -0.012950488, 0.04992858, 0.03354283, 0.057830073, 0.09960101, 0.030052505, 0.039702166, 0.11190071, 0.12188369, 0.014085785, -0.0024246175, 0.049633596, 0.0034802319, -0.1105528, -0.24383259) * inp_6_1_1; + result2 += M4(0.06832664, -0.06968258, 0.051687527, -0.02907532, -0.13083303, 0.016288249, -0.045846958, 0.0038347384, 0.02796738, 0.021050211, -0.0014437629, 0.0074234614, -0.033488605, 0.0028283196, 0.0028349007, -0.053338695) * inp_6_2_1; + result2 += M4(0.016823059, -0.016349452, 0.00019454084, -0.0031462135, 0.01131709, -0.05383347, -0.029143311, 0.012888047, 0.018022547, 0.009826473, 0.012014194, -0.0026803287, 0.012792615, -0.028527202, -0.003382069, -0.025247058) * inp_6_0_2; + result2 += M4(0.053624265, -0.022636238, -0.044413395, 0.00950327, -0.019735936, -0.028253868, 0.01283197, 0.0406327, -0.013911863, 0.008108678, 0.010259169, 0.0066404925, -0.01957056, -0.10539481, -0.022997769, -0.0026304023) * inp_6_1_2; + result2 += M4(-0.092205964, 0.04029118, -0.00829292, -0.024637619, -0.02465155, 0.021534355, -0.04077975, -0.015175284, -0.019231206, 0.038591735, 0.0017683035, -0.009013511, -0.07930131, 0.03153344, -0.03172194, -0.00024431024) * inp_6_2_2; + result3 += M4(-0.055493977, 0.007129383, 0.002141119, 0.014559398, -0.039813865, -0.016797917, 0.0023972709, 0.00041249365, -0.00981776, 0.0058928346, -0.019154385, 0.0067438628, -0.0020899016, -0.05684, -0.0030715107, -6.0925882e-05) * inp_6_0_0; + result3 += M4(-0.010217337, -0.052260514, 
0.039385643, 0.007039413, 0.01799454, -0.0577382, 0.017279949, -0.0003869266, 0.04678435, 0.049023014, -0.013259489, -0.0027402127, -0.087999485, 0.06320837, -0.06278846, 0.0037576456) * inp_6_1_0; + result3 += M4(0.037293848, 0.059133735, 0.004172794, -0.0036571762, 0.032403708, -0.047526788, 0.015680587, -0.00032716952, -8.6542605e-05, 0.03529912, 0.0022475754, 0.0030072317, -0.03253773, 0.034226146, -0.004907836, 0.011426194) * inp_6_2_0; + result3 += M4(0.055072863, -0.047109336, 0.05598112, -0.013975192, 0.023803456, 0.0053572604, -0.051438857, -0.00555347, 0.04751872, 0.023362413, 0.014907863, -0.0038425177, -0.10360313, 0.008978095, -0.015678313, -0.007341501) * inp_6_0_1; + result3 += M4(0.018583154, 0.22437426, -0.045809884, -0.0053728325, -0.17897789, -0.032594856, 0.07191401, 0.0034944064, 0.13228463, 0.020752668, -0.037657455, 0.004177733, -0.3523534, -0.17746517, -0.15133438, 0.039740514) * inp_6_1_1; + result3 += M4(0.007823297, -0.019084128, -0.029645089, 0.011458788, -0.08640555, -0.038487483, 0.029919466, 0.005061168, 0.024194121, 0.0839493, -0.032946195, -0.0014752013, -0.029473893, 0.020597594, -0.086628795, -0.016999863) * inp_6_2_1; + result3 += M4(0.06281429, 0.06692882, -0.0026090737, 0.025801765, 0.029453281, 0.021063251, -0.008726748, -0.011846802, -0.0044512697, 0.009316013, -0.004615945, 0.0013774027, -0.076157436, 0.046629824, 0.044510454, 0.00059239834) * inp_6_0_2; + result3 += M4(0.12062547, -0.050718866, -0.043070678, -0.0028223314, 0.12852141, 0.04714732, -0.022386296, 0.020857165, -0.071585186, 0.041900657, -0.0019691875, -0.018944446, 0.07852056, -0.0063666897, -0.057195943, 0.041365217) * inp_6_1_2; + result3 += M4(-0.026094297, 0.08631096, -0.0069263936, -0.22591403, -0.020006517, -0.022212753, 0.004577932, -0.3976379, -0.030017998, -0.017201388, 0.0026550689, -0.043253288, -0.008901822, 0.035541028, -0.0086641405, -1.2957926) * inp_6_2_2; + result4 += M4(0.012300569, 0.003921015, 0.011946446, -0.0025676754, -0.022009345, 
-0.027323725, 0.03221154, 0.0039387583, 0.009339417, 0.009317359, 0.12790316, 0.012074939, -0.003204824, -0.060603764, 0.0012728475, 0.051030852) * inp_6_0_0; + result4 += M4(0.0513073, -0.037477765, -0.10366891, 0.069612145, 0.012768361, -0.014747749, -0.1575883, 0.007116781, -0.007820471, -0.019741695, 0.07611309, 0.02695164, 0.0031895523, -0.027959265, -0.010869307, -0.092739366) * inp_6_1_0; + result4 += M4(0.049377494, -0.053803347, -0.024088198, 0.051801056, -0.020724384, -0.001833845, -0.04271145, -0.013222208, 0.0076294146, 0.0054026716, 0.01093465, 0.01443401, 0.02336828, -0.043393053, -0.11242944, -0.017014882) * inp_6_2_0; + result4 += M4(0.044203218, -0.048627485, 0.03566067, 0.0149888275, -0.028386788, 0.01610052, -0.0028078037, 0.06997983, 0.028005196, 0.039874807, 0.08526987, 0.021743936, -0.04861443, -0.08495866, -0.075890996, 0.01151304) * inp_6_0_1; + result4 += M4(-0.013728403, 0.0066139954, -0.06015557, 0.19792125, 0.03464891, -0.090691015, 0.12769918, 0.014904657, 0.006668767, 0.1151996, 0.12514316, -0.0063834307, -0.13717464, -0.05704096, -0.17070036, -0.06071528) * inp_6_1_1; + result4 += M4(0.04781628, -0.0036707402, 0.08735667, -0.021188159, -0.021271601, -0.044387788, -0.04678786, -0.01467483, 0.007871949, 0.0015153021, 0.06033026, 0.019386914, 0.032788943, -0.0151405465, 0.14838706, -0.055169523) * inp_6_2_1; + result4 += M4(0.0030917637, 0.04150332, -0.059072003, 0.024329018, -0.0076141804, 0.023184728, 0.04104932, 0.02043833, -0.0029006656, 0.16169244, -0.026884088, 0.002988135, 0.025676198, 7.763838e-05, -0.057638768, -0.0001432525) * inp_6_0_2; + result4 += M4(-0.016086916, -0.21834774, -0.12303665, -0.0078081964, 0.029211925, 0.03149682, -0.07726399, 0.038729727, -0.0048046177, 0.16202135, 0.09133993, -0.0064609298, 0.051216688, -0.13541323, 0.031037724, 0.032310028) * inp_6_1_2; + result4 += M4(0.030904543, 0.007312005, -0.033106234, 0.04164746, -0.03347607, 0.016248558, 0.02423278, -0.0283094, -0.011934969, 0.0584496, 0.11275283, 
0.010092434, 0.0069122305, -0.057725374, -0.10506642, 0.05114553) * inp_6_2_2; + result5 += M4(0.12327465, 0.038419377, -0.11216989, 0.023978868, -0.08152244, 0.004710024, 0.2161874, -0.033912066, 0.09562912, 0.05201862, 0.03480882, 0.077532195, -0.1214719, -0.0070755067, -0.00576491, -0.10451052) * inp_6_0_0; + result5 += M4(-0.1271294, -0.018757613, 0.06328837, 0.09443448, -0.09208765, -0.061547127, -0.017052999, -0.07314296, 0.28972462, 0.08740569, 0.037641432, 0.094780944, 0.074109964, 0.011131953, -0.046346318, 0.07219438) * inp_6_1_0; + result5 += M4(-0.049943674, -0.03984347, -0.0036058293, -0.05361642, -0.010248528, -0.009312495, -0.0481969, 0.004807876, -0.08150705, 0.00017803338, -0.013440729, -0.0148788, -0.34026754, -0.050879173, 0.0029865622, -0.07275097) * inp_6_2_0; + result5 += M4(0.34224057, -0.04396335, -0.20415224, 0.13095209, -0.03532615, 0.05827029, 0.021775814, -0.00053049, 0.18214488, 0.074128315, -0.093625456, 0.08149814, -0.05355675, -0.005840225, -0.07842599, -0.16460215) * inp_6_0_1; + result5 += M4(-0.30652338, -0.0728888, 0.122771434, 0.052094705, -0.012630002, 0.09230573, -0.09721077, -0.0094271535, 0.11488334, -0.010159144, 0.07672508, 0.1292131, -0.35355228, -0.08444311, -0.14569049, 0.11070845) * inp_6_1_1; + result5 += M4(0.17827068, 0.07690791, -0.110091045, -0.1081091, -0.01757862, -0.08965607, -0.1006825, -0.037371036, 0.016993694, 0.044062573, 0.039051022, -0.043025527, 0.04655079, 0.053222284, 0.03570332, -0.18985784) * inp_6_2_1; + result5 += M4(0.006450831, -0.04491093, -0.07097394, -0.022045014, -0.017884279, -0.048780706, -0.10489109, 0.009427876, 0.04094736, -0.038898177, -0.047679894, 0.066606395, 0.06729684, -0.090917446, -0.16663514, 0.034028154) * inp_6_0_2; + result5 += M4(-0.25590047, 0.08221804, 0.064723484, -0.07060204, 0.14776592, -0.0040918584, 0.07799097, 0.010082882, 0.07323286, 0.036311455, 0.10460265, 0.0055226083, -0.15523317, -0.0055219913, 0.21712542, 0.004518246) * inp_6_1_2; + result5 += M4(0.08408889, 
-0.067780204, -0.12176577, 0.0065457383, -0.07290015, 0.032551482, -0.0503736, 0.00068584416, -0.0075658257, 0.07159344, 0.05969502, -0.019791221, 0.28757152, -0.009607712, -0.008736326, -0.023250693) * inp_6_2_2; + result6 += M4(0.0826916, -0.0011589428, 0.04217768, 0.03508019, 0.20844382, 0.069929466, 0.0013225308, -0.15359119, 0.100197226, 0.037239406, 0.00882235, -0.05850417, -0.08140204, -0.13296746, -0.090059, -0.10555451) * inp_6_0_0; + result6 += M4(0.043170944, -0.070654795, 0.16726859, -0.042714182, -0.17019092, -0.018037906, 0.0005002727, 0.13694957, 0.08728689, 0.059884444, 0.017693968, 0.13340299, -0.00055857585, -0.06576273, -0.15978944, 0.02199702) * inp_6_1_0; + result6 += M4(-0.07912936, -0.098446734, 0.024297614, 0.010267006, 0.16866629, -0.034402836, -0.057588954, -0.006731306, -0.011143194, -0.0044363905, 0.009035161, 0.028604086, -0.029849688, -0.080510244, -0.014722543, 0.06951666) * inp_6_2_0; + result6 += M4(0.15960571, 0.05077707, 0.040001646, 0.06916319, -0.116350405, 0.08007057, 0.01731877, -0.104498945, -0.20638683, 0.03451314, 0.013891756, -0.04759701, -0.24217086, -0.057022028, -0.07895474, -0.15182598) * inp_6_0_1; + result6 += M4(0.012851796, 0.1265119, 0.14137456, 0.08199784, 0.052126616, -0.022660425, 0.066767074, 0.19143231, -0.022784606, -0.05656668, 0.07149101, 0.12093422, 0.20908651, -0.29562038, 0.01122719, -0.02989438) * inp_6_1_1; + result6 += M4(0.024302103, 0.058623184, 0.04026934, -0.06594341, 0.0040197996, -0.075270094, -0.052552696, 0.03661451, 0.020229882, 0.040011834, 0.028370712, 0.05044578, -0.06754057, -0.028959308, 0.047554366, -0.054447416) * inp_6_2_1; + result6 += M4(-0.13686283, -0.05232535, 0.01885817, -0.038568046, 0.14675242, -0.10084552, 0.008621979, -0.044769835, 0.05927116, 0.028497204, 0.012083906, -0.00489566, -0.14673924, -0.014464444, 0.011752121, 0.022125177) * inp_6_0_2; + result6 += M4(0.09373868, -0.08046232, 0.0056930813, 0.0035867547, -0.08200038, -0.12970145, 0.001867932, 0.024525903, 
0.023822464, 0.13795632, 0.020510435, 0.011507953, 0.19085273, -0.0687676, -0.021647172, -0.06443088) * inp_6_1_2; + result6 += M4(-0.101430655, -0.010518138, -0.027467076, 0.0095609035, 0.011564041, 0.0031170845, -0.009625634, 0.003805805, -0.04701001, 0.026332378, 0.013408522, 0.04035226, -0.100561626, 0.021271843, -0.038250048, -0.03853332) * inp_6_2_2; + result7 += M4(0.0032898376, -0.005865905, -0.006957761, -0.020074202, 0.005731783, 0.006253842, 0.016897107, 0.00512188, 0.00786627, 0.0074314745, 0.06670645, 0.019218192, 0.003331795, -0.03158377, -0.11539601, -0.14413469) * inp_6_0_0; + result7 += M4(-0.02312532, -0.037246346, -0.06965573, 0.05826521, -0.0070234323, -0.028701507, -0.10759601, -0.028601447, -0.003919406, 0.014756707, 0.08884789, 0.0042593763, -0.026350876, 0.11060137, 0.13215055, -0.21373007) * inp_6_1_0; + result7 += M4(0.0028861375, -0.06460452, -0.14393088, 0.042305835, 0.0144716315, -0.030690713, 0.06531305, -0.07140867, 0.0077675744, 0.024891805, 0.07084563, 0.014540746, -0.020980177, -0.01581307, -0.25996336, -0.0464056) * inp_6_2_0; + result7 += M4(0.052179918, 0.01069332, 0.25557518, 0.077363394, 0.016674379, 0.011493623, 0.1312654, 0.0048949104, -0.006951166, 0.0049097673, 0.22596136, -0.0011749576, -0.09991268, 0.004808804, -0.20045118, -0.018384261) * inp_6_0_1; + result7 += M4(0.06070373, 0.097720645, -0.076022156, 0.04256979, -0.013493103, 0.076170936, -0.04232606, 0.075218454, 0.00676294, -0.04443509, 0.13401033, 0.12200188, 0.009537357, -0.22084852, -0.41906348, 0.04412222) * inp_6_1_1; + result7 += M4(0.0054461826, 0.07257678, 0.06913896, -0.03155972, 0.004781128, -0.060989942, -0.32721478, -0.0036027739, 0.004245522, -0.04753024, -0.010141954, 0.06272829, 0.010017422, -0.011318091, 0.18608995, -0.032175362) * inp_6_2_1; + result7 += M4(0.011460923, 0.032904617, -0.13747554, -0.02152912, 0.0090295905, 0.023118716, -0.09190288, -0.0037826712, 0.01845322, 0.00029635793, 0.08082626, -0.009689829, -0.005135765, -0.0011611588, 
-0.10125263, 0.044646807) * inp_6_0_2; + result7 += M4(-0.019781616, -0.058512125, -0.15905127, -0.13311842, -0.0057250247, 0.006289206, 0.0014242958, -0.07893525, -0.009187235, 0.111200534, 0.07802423, -0.005958909, -0.03959017, -0.0966615, -0.23390996, -0.098434895) * inp_6_1_2; + result7 += M4(0.006658349, -0.02962057, -0.14098343, -0.03894199, 0.010386885, -0.02859822, -0.064082175, 0.016541123, -0.000493648, 0.06329013, 0.14639452, -0.016659537, 0.011981254, 0.02536493, -0.06166385, -0.006958652) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.019619163, 0.01921148, 0.04440256, -0.5222853, 0.046370033, 0.03338517, 0.13385774, -0.096681684, -0.008608558, 0.06058205, 0.13609034, 0.040071595, -0.043402378, 0.008793234, 0.021240113, 0.29263994) * inp_7_0_0; + result0 += M4(-0.1109213, -0.024931358, -0.0305067, -0.20737807, -0.05294311, -0.07020198, -0.16228068, -0.8278653, 0.19909897, -0.09671268, -0.16672443, 0.20059893, 0.14637361, 0.0003353352, -0.12467028, 0.01374531) * inp_7_1_0; + result0 += M4(-0.12905861, -0.0099937, -0.18979676, -0.53485763, -0.0116048325, 0.020433571, 0.04181418, -0.04725143, -0.014288277, 0.011442115, -0.010814545, -0.09773122, -0.11255902, -0.13433866, 0.13077062, -0.52286124) * inp_7_2_0; + result0 += M4(-0.18251744, -0.021963762, -0.14580035, -0.43697283, 0.12970643, 0.02733098, -0.15955159, -0.37729254, 0.053287327, 0.065358706, 0.20084082, 0.3282861, -0.2404756, 0.014787381, 0.019458184, 
-0.034958147) * inp_7_0_1; + result0 += M4(-0.32293555, -0.10247339, -0.2034304, -0.5769918, -0.4534017, -0.1818026, -0.4907527, -0.7226196, -0.09522023, 0.023163613, 0.096056566, -0.007710594, 0.094863735, -0.009735608, 0.14387085, -0.36049882) * inp_7_1_1; + result0 += M4(-0.059508022, -0.1619508, -0.38009545, -0.5047528, -0.053665306, -0.1293786, 0.041960157, -0.052680194, -0.06778961, -0.100416325, -0.15890615, 0.15459825, -0.075632125, -0.22988954, 0.12310383, -0.54904133) * inp_7_2_1; + result0 += M4(0.004761123, 0.011536497, -0.16972515, -0.29813156, 0.105865955, 0.04813545, -0.37342885, 0.01624747, 0.16064364, 0.05948557, -0.024455588, -0.014247143, 0.0281806, 0.017937804, -0.028398527, 0.06430144) * inp_7_0_2; + result0 += M4(-0.03094846, -0.023887098, -0.16835493, -0.45625633, -0.4240621, -0.23580924, -0.16891237, -0.66473275, -0.1336526, -0.019848557, 0.07236185, -0.18608706, 0.07368037, -0.0070274146, 0.0060203294, 0.13581316) * inp_7_1_2; + result0 += M4(-0.06565267, -0.092021264, 0.058388345, -0.2428771, 0.12035776, -0.17074834, -0.044587415, -0.2392213, 0.0072104903, 0.04976757, 0.08389607, -0.08572632, 0.0062024267, -0.035368856, -0.084190235, 0.020714622) * inp_7_2_2; + result1 += M4(-0.027411012, -0.0006558154, 0.36119094, -0.031570382, -0.07957487, 0.018136166, -1.0776129, 0.1047041, 0.29237336, 0.121909216, -0.3122805, 0.15541574, -0.054077875, 0.019749457, -0.17331713, -0.0044874134) * inp_7_0_0; + result1 += M4(-0.021662064, -0.0233977, 0.2910494, -0.12006933, 0.033777535, -0.23034136, -0.40222427, -0.09413501, 0.024764126, -0.026446294, -0.0628491, -0.10069309, -0.040109824, -0.0011900908, -0.15767077, 0.017133659) * inp_7_1_0; + result1 += M4(0.009743534, -0.20257235, 0.15439887, 0.0071897637, 0.010785288, -0.026097942, -0.80098593, 0.020632258, -0.0122931525, -0.08317335, 0.04137996, -0.0035129718, 0.007053192, 0.019992907, -0.22204553, -0.0139648) * inp_7_2_0; + result1 += M4(0.047682434, -0.0421963, 0.027298711, -0.19487585, -0.044362977, 
0.01504118, 0.15650836, -0.2918026, -0.0154652875, -0.012679184, 0.19739644, -0.26636449, -0.016848562, -0.016164871, -0.38752186, -0.0071176235) * inp_7_0_1; + result1 += M4(0.03764035, 0.024834264, -0.010222534, 0.012442136, 0.022134345, -0.11349213, -0.6615615, 0.0128131565, -0.00038987622, 0.0013724855, 0.11838443, 0.075134344, -0.005166681, -0.015660344, 0.1445425, -0.0278104) * inp_7_1_1; + result1 += M4(0.00088805344, 0.047852527, -0.10478063, -0.024633344, 0.00090017763, 0.07964519, -0.4611838, 0.00796534, 0.0048827343, 0.020747093, -0.1042169, -0.0042456375, 0.002950442, -0.011804218, 0.2772437, 0.00054366846) * inp_7_2_1; + result1 += M4(-0.0054696607, -0.0001439405, -0.05279678, 0.020695645, 0.015178085, 0.02855919, -0.07854449, -0.17121412, 0.020729193, -0.0029669595, 0.114148, 0.12826203, 0.005424357, 0.0011395529, 0.088982716, -0.017530778) * inp_7_0_2; + result1 += M4(-0.001802239, -0.008785034, -0.008640605, -0.013083186, 0.014738717, 0.0154219335, -0.31386074, -0.037077494, 0.0022477873, 0.007822429, 0.19449356, -0.015080717, 0.0005470594, -0.009511823, -0.04181818, -0.0017789806) * inp_7_1_2; + result1 += M4(-0.0066921646, -0.0036458238, -0.080104426, 0.007593998, 0.0027090157, 0.011818684, 0.13055573, 0.02397231, -0.010580146, -0.0040242216, 0.017887088, 0.006524338, 0.001104952, -0.011541328, -0.001593766, 0.007713354) * inp_7_2_2; + result2 += M4(-0.00181024, -0.0062821396, -0.028562747, -0.017439006, 0.06714445, -0.046118323, -0.011498005, -0.026847633, 0.084855564, 0.08468601, -0.041410256, 0.017027173, -0.062388983, -0.0061762678, 0.011183944, 0.012399395) * inp_7_0_0; + result2 += M4(-0.009214674, -0.043398388, 0.026245562, -0.02194355, -0.028220208, -0.0035614313, -0.015907183, -0.04670032, -0.010955945, -0.114033945, 0.094313145, -0.033299666, 0.03767305, 0.04831226, -0.009924143, 0.04698403) * inp_7_1_0; + result2 += M4(-0.0834085, 0.025948057, -0.02079768, -0.010464437, -0.0056597195, 0.012022448, -0.0085257795, 0.00060337054, 
-0.032568067, 0.04050433, 0.035584603, 0.014839012, 0.00086521904, 0.0036729395, -0.0052799447, -0.011319273) * inp_7_2_0; + result2 += M4(-0.116548985, -0.022739206, -0.010440332, -0.04588173, -0.36447343, -0.01833086, -0.049404077, -0.026872661, -0.007371161, -0.069598526, -0.102384, 0.14382058, 0.08921956, -0.029889785, -0.038862173, 0.02807371) * inp_7_0_1; + result2 += M4(-0.2457012, -0.057998665, -0.0018222937, -0.011622737, -0.42984796, -0.15360886, -0.08889381, -0.047691002, 0.014668313, 0.21917526, -0.07127, 0.058073115, -0.081578895, -0.019761011, 0.009938665, 0.039989498) * inp_7_1_1; + result2 += M4(-0.085061714, -0.0835048, -0.031727955, -0.011889079, 0.03850285, 0.025723798, -0.0078068813, -0.06044399, -0.029326422, -0.03445261, -0.054068994, 0.036757298, 0.031338938, 0.014910681, -0.00985985, 0.024286473) * inp_7_2_1; + result2 += M4(-0.00011266963, -0.0060369624, -0.015413404, -0.0149466125, -0.028696485, -0.060611654, -0.067734994, 0.029793596, 0.016574329, 0.051108334, 0.0035925496, -0.033243727, 0.013867411, 0.012912953, 0.0043867524, -0.0044129426) * inp_7_0_2; + result2 += M4(0.04598295, 0.006795931, 0.025450828, -0.03426622, 0.11743263, -0.036128595, -0.034959648, -0.025216965, 0.012883598, -0.07669863, -0.0070978454, 0.10277388, 0.0032985054, -0.0073466557, -0.0067402916, -0.011859282) * inp_7_1_2; + result2 += M4(0.0090787625, -0.034614343, 0.0012652007, 0.010083644, 0.010530217, -0.0024835244, -0.007734476, -0.004251591, 0.047886815, -0.0033810567, -0.039794136, 0.036148045, -0.016814964, -0.021526292, 0.011536933, -0.0017637961) * inp_7_2_2; + result3 += M4(-0.056713074, 0.017072853, 0.01924319, -0.012108567, 0.033694275, -0.00014728415, 0.0013783042, -0.0070118764, 0.10356375, 0.055793744, -0.015750544, -0.027222866, -0.05444492, 0.038992025, -0.06453667, 0.015554088) * inp_7_0_0; + result3 += M4(-0.009651923, 0.015291043, 0.0073522585, 0.0089078965, 0.049267348, 0.089883775, 0.026752485, 0.0023726642, 0.14089406, 0.04576883, -0.06899896, 
0.0033200101, 0.06524402, -0.055788726, 0.03670162, 0.00042637571) * inp_7_1_0; + result3 += M4(-0.026436668, -0.08396247, 0.034431014, -0.021391103, 0.01112021, -0.004706283, 0.0113699315, -0.0062436434, 0.055922475, -0.016387999, -0.0011654728, -0.031879783, 0.026270457, 0.05134117, 0.003604511, -0.0053165792) * inp_7_2_0; + result3 += M4(-0.0006227549, 0.0034437897, 0.06543345, 0.013124324, -0.031671446, 3.3820044e-05, -0.0032878139, 0.0024007803, -0.0738113, 0.012045466, -0.11248027, 0.008195581, 0.092917256, -0.005078936, -0.05529186, 0.011254123) * inp_7_0_1; + result3 += M4(-2.3622135e-05, -0.16733384, -0.09112911, 0.021277083, -0.51431096, -0.19434457, -0.0052565695, 0.0060003204, -0.09170261, -0.03823073, 0.16561238, 0.26313868, -0.0038034117, 0.06035131, -0.007422141, -0.00716486) * inp_7_1_1; + result3 += M4(-0.12549236, -0.088710144, 0.05694673, 0.026314596, -0.11872987, -0.065887615, 0.065937184, -0.020208606, -0.057489034, -0.06889103, 0.07919115, 0.19062647, 0.0027967654, -0.051737946, -0.030278793, -0.033337694) * inp_7_2_1; + result3 += M4(0.030196456, -0.041681297, -0.0012948094, -0.0053139296, 0.17968246, 0.03346025, -0.04726979, 0.010067239, 0.038868077, -0.00091599574, 0.0025656684, 0.00058525533, -0.036029734, -0.0030704427, -0.011090419, -0.008966043) * inp_7_0_2; + result3 += M4(0.00083388394, 0.004511208, 0.055891965, 0.019707544, 0.08286773, -0.32230675, -0.053231142, 0.030822719, 0.07264268, 0.013594093, 0.017561717, 0.24278389, 0.040262565, -0.04956609, 0.00064297114, -0.04554397) * inp_7_1_2; + result3 += M4(0.04192961, -0.025178114, 0.01933823, -1.7493954, 0.049751934, 0.038322236, 0.01182845, -1.8043197, 0.036696296, 0.027128216, 0.026126176, -0.23710631, 0.025719067, -0.011830301, 0.008182878, -0.90499324) * inp_7_2_2; + result4 += M4(-0.031255115, 0.0054043555, -0.06824895, -0.032274008, -0.004812104, 0.013143836, 0.02716034, -0.020736909, -0.06167614, 0.013290974, -0.07206355, 0.0009996302, 0.019633964, -0.004111305, 0.0493287, 
0.028125653) * inp_7_0_0; + result4 += M4(-0.008962232, -0.021928806, 0.062050704, 0.007442805, -0.020863477, 0.011718123, 0.1180728, -0.050780166, -0.065636836, 0.03868869, 0.050912462, 0.18666048, 0.008599102, 0.0010315233, -0.0567703, 0.039501596) * inp_7_1_0; + result4 += M4(-0.01653252, 0.044354137, 0.039605364, -0.029500913, -0.002489893, 0.010061884, -0.035556745, -0.03726708, -0.027737575, 0.08115309, 0.07203295, 0.016213454, -0.01235567, -0.03336109, 0.049459614, 0.007028942) * inp_7_2_0; + result4 += M4(-0.015206268, -0.04306828, 0.022190332, -0.011594926, -0.047630157, 0.025873762, -0.21886888, -0.04501348, -0.011394331, 0.01885127, 0.073564306, 0.25457445, -0.0398608, -0.020090638, -0.08341406, -0.024223484) * inp_7_0_1; + result4 += M4(-0.015126109, 0.023063717, -0.15114518, -0.07231576, -0.09044589, 0.098585464, -0.27854264, -0.035312053, 0.063175984, 0.030455407, 0.03429318, -0.17279996, 0.011018045, 0.026615465, 0.037567787, 0.031564843) * inp_7_1_1; + result4 += M4(-0.047758225, -0.06474845, -0.12291044, 0.025480649, -0.059943054, -0.002574203, 0.11728442, -0.045684963, -0.04039217, -0.13016894, -0.122523315, 0.030717134, -0.003979793, -0.011976826, -0.04206374, 0.007127837) * inp_7_2_1; + result4 += M4(-0.019392774, 0.04917114, -0.10028331, -0.0083147595, 0.021183515, -0.2515138, -0.042518016, -0.036571436, -0.011397838, -0.014067441, 0.16372688, 0.017796928, -0.007861154, -0.004499947, 0.06691656, -0.00077724527) * inp_7_0_2; + result4 += M4(0.017651718, -0.007916474, -0.06843244, -0.0055576186, -0.024696302, -0.45252326, -0.32949975, -0.040939137, -0.008924657, -0.0069884467, -0.09877526, 0.0291089, -0.002020753, 0.0056151017, -0.022990825, -0.005646286) * inp_7_1_2; + result4 += M4(-0.013344221, 0.025063537, -0.006814097, -0.004052438, 0.027173467, -0.064691305, -0.085724786, 0.0013728178, -0.06430201, 0.09891888, 0.06554988, -0.03776078, -0.0015164824, 0.00072032615, -0.03945359, -0.020309223) * inp_7_2_2; + result5 += M4(-0.29015565, 
-0.0504856, -0.086861864, -0.17976667, -0.09982806, -0.07764492, 0.07808308, -0.2716935, -0.18661919, -0.08591439, 0.26913705, -0.106487356, 0.0043998067, 0.015428668, 0.033899657, 0.09368652) * inp_7_0_0; + result5 += M4(-0.19908395, -0.022122938, -0.014650014, -0.1855974, 0.03959497, 0.09582844, -0.3052797, -0.010022708, 0.12324228, 0.058178306, -0.056906804, -0.08451868, -0.06442597, -0.010315951, 0.11165233, -0.03185339) * inp_7_1_0; + result5 += M4(-0.02280782, -0.024141643, -0.033764925, 0.06668777, 0.059855398, -0.023250736, -0.023053491, 0.057122953, 0.1670807, 0.0062083374, -0.022650175, 0.03845172, 0.083235085, 0.0062549496, -0.069462314, -0.05729075) * inp_7_2_0; + result5 += M4(-0.28318822, 0.010365026, -0.21803187, -0.16786963, -0.6574527, -0.1050853, 0.15702452, -0.5286346, 0.07007811, 0.18338402, 0.009328277, -0.057101313, -0.05055611, -0.0056140893, 0.06760786, -0.075826734) * inp_7_0_1; + result5 += M4(-0.6328875, -0.17265053, -0.32007185, -0.22473463, -0.6974956, -0.48014686, -0.35014078, -0.061697185, 0.070903875, -0.03524646, 0.046297666, -0.031512853, -0.14756496, 0.010609849, 0.07694277, 0.010614909) * inp_7_1_1; + result5 += M4(-0.77281606, 0.015591141, -0.2351573, 0.099579446, 0.02190073, 0.09145027, 0.12198186, -0.03981692, -0.04863525, -0.061372776, -0.038507737, 0.18372037, 0.22119759, -0.047318257, -0.112377256, -0.014638231) * inp_7_2_1; + result5 += M4(-0.15672669, 0.011313571, -0.0016455053, 0.011210724, -0.1784495, 0.024785213, 0.08157578, -0.1588776, 0.1746127, -0.011873531, 0.016143136, 0.0735383, -0.006958686, -0.00926741, -0.03844876, -0.011495204) * inp_7_0_2; + result5 += M4(-0.06482136, -0.024777394, -0.06982902, 0.024797598, -0.19793424, -0.17642917, -0.05805348, -0.06682204, -0.027689785, -0.016412579, -0.07270696, -0.0820727, -0.16408871, -0.0037484975, -0.0727816, 0.0182913) * inp_7_1_2; + result5 += M4(-0.18456468, -0.029399985, -0.14339076, -0.01345119, -0.08311331, -0.097834, 0.095107086, -0.013994656, -0.21792398, 
0.04363722, -0.014479818, 0.06327538, 0.22798946, 0.004692031, 0.037308734, 0.0014782102) * inp_7_2_2; + result6 += M4(-0.15523385, 0.04333674, 0.011562106, 0.012884233, -0.7735287, 0.061978884, -0.06362111, -0.04721958, -0.0036680687, 0.11972103, 0.024035923, -0.18345363, -0.26641202, 0.08780031, -0.05821278, -0.01588677) * inp_7_0_0; + result6 += M4(-0.2121926, 0.040110726, 0.022474691, -0.22844389, 0.25405735, 0.01813648, -0.043270804, -0.17447673, 0.10381929, 0.02651742, -0.17135035, 0.02156415, 0.23577787, -0.07796876, -0.0015734138, 0.004324461) * inp_7_1_0; + result6 += M4(0.00079009496, 0.03650711, 0.026441671, -0.22793932, 0.00020839366, 0.07355802, -0.007732349, -0.09052142, 0.008262666, 0.024755577, -0.024505679, -0.039957236, -0.12719211, -0.017149376, -0.0006477875, 0.031975172) * inp_7_2_0; + result6 += M4(-0.2876099, -0.046882026, -0.005891971, 0.022989621, -0.11886945, 0.08643837, 0.0009815173, -0.006898907, 0.15978125, -0.076028, -0.017567702, 0.031061567, 0.0414117, -0.04043728, 0.03147516, -0.092740506) * inp_7_0_1; + result6 += M4(-0.2903089, -0.09079359, 0.07738682, -0.20626391, -0.13970353, -0.40331012, -0.10651353, -0.38800967, -0.21632771, 0.07790675, 0.18777615, 0.06797554, -0.015900627, 0.06686788, -0.004905191, -0.03612247) * inp_7_1_1; + result6 += M4(0.028590072, 0.03684793, 0.034718122, -0.07928443, 0.050980933, 0.036022484, -0.018831767, -0.360042, 0.12971504, -0.01267701, -0.014985852, 0.03258125, 0.015352274, -0.00063632405, -0.007916378, -0.055729836) * inp_7_2_1; + result6 += M4(-0.24037708, 0.06596814, 0.007908019, 4.636603e-05, -0.36411625, -0.06614084, -0.024928998, 0.022652453, 0.03707578, -0.01185145, -0.02202634, -0.012771711, -0.21605279, -0.014994912, 0.018112198, -0.017821215) * inp_7_0_2; + result6 += M4(-0.20019771, 0.016194914, -0.003984423, 0.053569168, -0.147519, -0.18751924, 0.047211252, -0.10476945, -0.21504165, 0.040334094, 0.024131812, -0.06282376, 0.2811309, 0.007064146, 0.004561811, 0.009942218) * inp_7_1_2; + 
result6 += M4(0.104779065, -0.02237995, 0.013157996, 0.022467796, 0.10577438, -0.041026324, 0.022738328, 0.005887924, 0.03713206, 0.0018778833, 0.01106954, 0.031748325, -0.14795572, 0.013881824, -0.006266062, 0.020826342) * inp_7_2_2; + result7 += M4(-0.017048126, -0.0014680336, 0.22264837, -0.017220203, -0.014482394, 0.039665192, -0.03148343, 0.039337862, -0.010021396, -0.0068325154, -0.076945424, 0.058321618, 0.006317953, 0.0588891, 0.24903962, -0.045815527) * inp_7_0_0; + result7 += M4(-0.011735046, 0.05164914, 0.09057689, -0.07567338, -0.013797732, 0.010123468, -0.14601725, -0.19793466, 0.010152798, 0.00010848839, -0.02723998, 0.034682594, -0.011363744, -0.01866832, -0.10351618, 0.038840428) * inp_7_1_0; + result7 += M4(0.007575896, 0.0342021, 0.019826306, -0.0063154707, -0.00014761885, 0.05654821, 0.094419114, 0.039745655, 0.018475056, 0.0267896, -0.042218987, 0.04887323, 0.021885084, -0.05690418, -0.2152488, 0.011102724) * inp_7_2_0; + result7 += M4(-0.047039494, 0.01717817, -0.007354877, 0.03097899, -0.12532277, 0.037751406, -0.5457681, -0.0066836495, -0.13203242, 0.044490185, -0.18292123, -0.12071842, -0.024309013, -0.090786345, -0.556854, -0.020559551) * inp_7_0_1; + result7 += M4(-0.0756311, -0.051617034, 0.19010684, -0.020291973, 0.034922715, -0.25529796, -0.49442846, -0.23392962, -0.093332306, 0.04667098, 0.14093527, 0.08133245, -0.022771783, 0.030318974, 0.14622752, 0.022611557) * inp_7_1_1; + result7 += M4(-0.023410842, 0.017515162, -0.15425678, 0.020815322, -0.004528309, -0.15812004, -0.7177418, -0.14774992, 0.000594787, -0.09640183, 0.03258781, 0.035561755, 0.010859937, 0.085842706, 0.26981428, 0.019011827) * inp_7_2_1; + result7 += M4(-0.0061331196, 0.006772549, 0.042385384, -0.008290503, -0.03741007, 0.0108373575, -0.23881952, -0.00053264864, 0.045162518, -0.039310794, 0.0022733111, 0.024849279, 0.0033925618, 0.0026793743, 0.07024454, 0.022384964) * inp_7_0_2; + result7 += M4(-0.008750399, 0.07044772, 0.08826913, -0.060729593, 0.002564674, 
-0.11470527, -0.25962645, 0.08533938, -0.0011103342, 0.09526253, 0.1411946, -0.025586285, 0.017720187, 0.007987387, -0.0671929, 0.009660629) * inp_7_1_2; + result7 += M4(-0.014092657, 0.026131075, -0.036399465, -0.034446795, 0.0011673111, -0.011000087, -0.048490893, 0.022428023, -0.010023926, 0.029476997, -0.06079816, 0.010130016, 0.010098581, -0.002678652, -0.07556091, 0.023580361) * inp_7_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), max(result0, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 0), max(result1, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 0), max(result2, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 0), max(result3, V4(0.0))); + imageStore(out_image, output_base + ivec2(0, 1), max(result4, V4(0.0))); + imageStore(out_image, output_base + ivec2(1, 1), max(result5, V4(0.0))); + imageStore(out_image, output_base + ivec2(2, 1), max(result6, V4(0.0))); + imageStore(out_image, output_base + ivec2(3, 1), max(result7, V4(0.0))); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-5) +//!COMPUTE 48 32 12 16 +//!HOOK LUMA +//!BIND conv2d_4 +//!SAVE conv2d_5 +//!WIDTH LUMA.w 4.0 * +//!HEIGHT LUMA.h 2.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + 
const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_4_mul * texelFetch(conv2d_4_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.00012870376, 0.0015073317, 0.00012290025, -0.031450726); + V4 result1 = V4(0.00075700425, -0.00059576443, 0.00043123835, -0.0010607191); + V4 result2 = V4(-0.0012186025, -0.009817943, -0.0022624114, 2.8278655e-05); + V4 result3 = V4(0.00072065956, -0.019619042, -0.000720247, 1.1483696e-06); + V4 result4 = V4(0.0005072502, -4.716536e-06, -0.00013273496, -0.00014584724); + V4 result5 = V4(5.4984226e-05, -0.00016543601, 0.00083523017, 0.0003139287); + V4 result6 = V4(0.0010905131, 0.00019316915, 0.027474692, 0.008348107); + V4 result7 = V4(-0.00035387027, -0.026230067, -0.0020538918, 0.0008813218); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 
2][local_xy.x + 2]; + result0 += M4(-0.02825234, 0.050472528, 0.07249266, -0.036686793, -0.008236348, -0.18814753, 0.0048127305, -0.07187667, 0.027375551, 0.0667412, -0.10769006, 0.06668862, -0.04494983, -0.04809392, -0.045809206, -0.038274225) * inp_0_0_0; + result0 += M4(-0.077258155, 0.11137563, -0.02073778, 0.032660037, -0.09308027, -0.02373658, 0.056329884, -0.022265574, -0.016948516, 0.01601987, -0.14742132, 0.06404055, -0.09884169, 0.21626514, -0.20251444, 0.1685334) * inp_0_1_0; + result0 += M4(-0.005836629, -0.041911867, 0.073245466, 0.042423088, -0.006572438, 0.006312453, -0.02910437, -0.035644136, 0.02247486, 0.14070247, 0.06569763, -0.073711194, -0.05906052, 0.08308226, -0.028851544, 0.06398263) * inp_0_2_0; + result0 += M4(-0.04628439, -0.034108642, 0.18604904, 0.018233646, -0.09133256, 0.019611178, 0.011687959, -0.13484737, 0.008817253, -0.14870496, 0.06186094, 0.032866117, 0.005636625, 0.0058991183, 0.06262461, 0.08848391) * inp_0_0_1; + result0 += M4(0.04486707, -0.11528956, 0.027320707, 0.06917625, -0.19171804, 0.069432884, -0.19025773, 0.31622523, 0.0075120684, 0.07121924, -0.019727655, -0.19732587, -0.17011653, 0.019549588, 0.113864094, -0.08387234) * inp_0_1_1; + result0 += M4(0.0051095663, 0.08537196, -0.03169933, 0.0323098, -0.060529582, 0.028143872, -0.052649263, 0.05718779, -0.007441134, -0.029519817, -0.051336925, 0.02123168, -0.063979246, 0.021595892, -0.033775996, 0.07181485) * inp_0_2_1; + result0 += M4(0.062568076, 0.06364635, -0.039970372, -0.006447095, 0.12519073, 0.15771787, -0.0755865, -0.017414108, 0.051324718, -0.09161432, -0.07952098, 0.081326246, -0.05753695, 0.093014814, 0.027538912, 0.002404669) * inp_0_0_2; + result0 += M4(-0.00744137, 0.029176349, 0.10101269, -0.02758753, -0.067584105, 0.059226632, -0.037246663, -0.050222486, 0.075733736, -0.12921144, 0.074807994, -0.016728248, 0.05908262, -0.12593502, 0.041971054, -0.08174431) * inp_0_1_2; + result0 += M4(0.04943014, -0.016725883, -0.026984025, 0.050061073, -0.0018541286, 
0.057701662, 0.0018217978, 0.016825218, 0.13714133, -0.08471379, 0.27746886, -0.09209236, 0.044548824, -0.08745845, 0.08161209, 0.07771556) * inp_0_2_2; + result1 += M4(-0.05639158, 0.043210156, 0.061975732, 0.07048967, -0.13271971, -0.042835556, 0.086439915, -0.04577353, 0.16696368, 0.0081004985, -0.045513887, 0.014561117, 0.10838701, -0.04196252, 0.027172176, 0.020009534) * inp_0_0_0; + result1 += M4(0.102852546, -0.050327368, -0.039611086, -0.07678378, -0.14159124, -0.021460293, -0.0006992745, -0.051264238, 0.07857924, 0.044895526, -0.00033525276, 0.05508037, 0.27432808, 0.109197654, -0.05758411, -0.02754107) * inp_0_1_0; + result1 += M4(-0.09417695, -0.0151595315, -0.11193397, 0.04734054, -0.03474961, -0.020111436, 0.013753403, -0.10246779, 0.30541953, -0.002184839, 0.009467595, 0.02313922, -0.03428219, -0.013101571, -0.06601038, 0.068125926) * inp_0_2_0; + result1 += M4(-0.007718083, 0.022167645, -0.0372561, 0.017117832, -0.012538294, -0.122178264, -0.07919307, -0.0067774463, 0.06950172, 0.03165948, 0.069577605, -0.082424365, -0.043734632, 0.028616741, 0.02039027, 0.033831313) * inp_0_0_1; + result1 += M4(-0.024777768, 0.1559108, 0.13268489, 0.042481832, -0.17424461, -0.19196983, 0.33128786, 0.03052741, -0.07871133, -0.07639098, 0.07132073, 0.117071435, -0.085539624, 0.10192558, 0.032388866, -0.026032284) * inp_0_1_1; + result1 += M4(0.21044138, -0.03833567, -0.03887902, -0.015440096, -0.10548603, 0.009248851, 0.065964304, 0.056060005, 0.0033368012, 0.10262367, -0.16890131, 0.05223364, -0.021466231, 0.02432301, 0.07711907, 0.13907103) * inp_0_2_1; + result1 += M4(0.0006207559, 0.07628767, -0.024122464, -0.050615545, -0.15404795, 0.09933703, 0.023408007, -0.051729627, -0.008578353, -0.09102145, -0.004976676, 0.23550455, -0.061921887, -0.001108465, 0.038435172, -0.103362925) * inp_0_0_2; + result1 += M4(-0.103490844, -0.010899284, -0.020487739, 0.05803918, -0.09646101, 0.1026901, 0.06520469, -0.011193636, 0.09393872, 0.07114487, -0.020959882, -0.040198267, 
-0.2105737, -0.09829211, 0.14387673, 0.014833609) * inp_0_1_2; + result1 += M4(-0.003354044, 0.072334334, 0.16028221, -0.06162113, 0.04883901, 0.07213884, 0.02099781, -0.04124112, 0.14201511, -0.012724468, -0.2590456, 0.008002337, 0.037929222, 0.0412799, 0.055922583, -0.07824662) * inp_0_2_2; + result2 += M4(-0.013893638, 0.12770304, -0.14468402, 0.12212885, -0.020140463, 0.05470519, 0.003691885, -0.021420196, -0.06374135, -0.17111105, 0.0757188, -0.078780405, 0.13151102, 0.05572287, -0.030792726, 0.21981834) * inp_0_0_0; + result2 += M4(0.13976511, 0.065783836, 0.09327418, 0.13874762, -0.04414663, 0.005955995, 0.024778062, -0.073018044, -0.020960657, -0.08148191, -0.00080282555, -0.04114416, -0.14436159, 0.16456963, -0.12388528, 0.3568732) * inp_0_1_0; + result2 += M4(0.094088145, -0.077089556, 0.071451984, 0.10671292, 0.042371325, 0.05656689, 0.018475946, -0.09828818, -0.1001703, -0.03996161, -0.0044480283, -0.065334186, 0.17525658, -0.025878647, -0.0036411502, 0.21724771) * inp_0_2_0; + result2 += M4(0.0342944, 0.052221116, -0.01949957, 0.012354358, 0.023869658, 0.073546335, 0.0877285, -0.36431846, -0.02626674, -0.14184852, -0.046883654, -0.069614366, 0.063146956, 0.07258322, -0.049165007, 0.04512682) * inp_0_0_1; + result2 += M4(-0.0074588475, 0.14777818, -0.19874443, 0.49568745, -0.18574569, -0.15987149, -0.0764119, -0.04251646, -0.07334413, -0.38405332, 0.041632935, -0.71641743, -0.0010440225, 0.11473736, -0.046578478, 0.34829178) * inp_0_1_1; + result2 += M4(-0.006457416, -0.0041369465, -0.043947276, 0.031897474, -0.099781565, -0.04458274, 0.014765808, -0.091072455, -0.046024874, -0.00047156744, 0.059614684, -0.091088615, -0.024731526, -0.066219084, -0.0019194081, 0.032505997) * inp_0_2_1; + result2 += M4(-0.029251635, 0.056005977, -0.029172702, 0.1263884, -0.078013, 0.06456419, 0.009464262, -0.116298, 0.11641417, -0.11715053, 0.06715912, -0.11711052, -0.041919075, 0.030600216, 0.02707128, 0.043036945) * inp_0_0_2; + result2 += M4(0.054973725, 0.043513294, 
0.027817035, 0.17361102, -0.05212478, -0.012061641, -0.04480146, -0.10949433, 0.054276537, 0.0677188, 0.026028277, -0.055351324, 0.33972925, -0.022167863, 0.26053816, 0.36052957) * inp_0_1_2; + result2 += M4(-0.0025867675, -0.033859693, 0.015821788, 0.184386, 0.009979756, 0.05862266, 0.008590679, -0.08470479, 0.12410391, 0.0056512062, 0.09959105, -0.038819876, 0.036758754, 0.020678207, 0.078427844, 0.19521163) * inp_0_2_2; + result3 += M4(0.07516922, 0.06817264, -0.033351846, 0.0570181, 0.023872118, -0.033119217, 0.022747792, -0.08716068, -0.1660593, -0.033284668, 0.09960433, -0.009144942, -0.009021771, 0.05191709, -0.10111086, -0.0065188347) * inp_0_0_0; + result3 += M4(0.063911155, -0.0017871537, -0.02683682, 0.031202864, 0.006626746, 0.005269876, 0.111577794, -0.07194623, -0.17961705, -0.025490053, 0.022233343, 0.010028363, 0.094795115, 0.01180024, -0.15879083, 0.12058574) * inp_0_1_0; + result3 += M4(-0.029188888, -0.0048613464, 0.10167411, -0.01733035, 0.13426104, 0.009995426, 0.0055278814, 0.03686712, -0.04044068, 0.0061511467, -0.06844516, 0.03943122, -0.05564705, -0.014750789, -0.067794405, -0.038422555) * inp_0_2_0; + result3 += M4(0.06392588, -0.035220683, -0.0046561114, -0.100309364, 0.1663134, 0.026404293, 0.124145925, -0.101793036, 0.058158122, -0.05311191, -0.078840815, -0.057253875, -0.10874026, 0.020562524, 0.04176369, -0.004982596) * inp_0_0_1; + result3 += M4(-0.055022147, -0.0015293906, 0.059985295, 0.17386433, 0.36176702, 0.07660777, -0.10384644, 0.23624507, -0.09634397, -0.029623128, 0.16258933, -0.094327964, -0.03725318, -0.032710075, 0.04545482, 0.027676413) * inp_0_1_1; + result3 += M4(0.061432358, -0.00852737, -0.16414368, 0.08852885, -0.004861569, 0.017101906, 0.050031036, -0.034904525, 0.07999701, 0.03031258, -0.03243259, -0.10931116, -0.10524792, -0.01605804, -0.00012235781, 0.0018634867) * inp_0_2_1; + result3 += M4(-0.058765683, 0.057311747, -0.09250278, 0.081500016, -0.01575219, -0.05795951, -0.04103856, 0.15493245, -0.13997552, 
-0.04234876, 0.07340369, -0.08439723, -0.08907591, 0.028325306, 0.038971752, -0.081953414) * inp_0_0_2; + result3 += M4(-0.016148396, -0.020256687, -0.028956844, -0.09699045, -0.044698145, -0.039668884, 0.0030640669, -0.0034066683, -0.14536853, 0.1079129, 0.046979304, -0.09782481, 0.016039869, 0.0069218553, 0.15003178, -0.284929) * inp_0_1_2; + result3 += M4(-0.10598578, -0.07503008, 0.11086802, -0.07511329, 0.081773564, 0.03757604, 0.01578927, 0.037892543, 0.01584319, 0.040191278, 0.02156386, -0.07563746, -0.119566426, -0.09166396, 0.060088415, -0.08760523) * inp_0_2_2; + result4 += M4(0.04311774, -0.0046575717, -0.0051927385, -0.034860145, -0.06816423, -0.047233056, 0.18247157, -0.06609274, 0.021896608, 0.09089035, -0.123854846, 0.059438813, -0.05742909, 0.16950338, -0.11582585, 0.0008909285) * inp_0_0_0; + result4 += M4(-0.22790666, 0.07339618, 0.09134936, 0.059751753, 0.10918637, -0.045729667, 0.03663686, -0.021690749, 0.15934144, -0.009276431, -0.19865279, 0.036363818, -0.16918212, -0.09963749, 0.0038125063, 0.36579713) * inp_0_1_0; + result4 += M4(-0.026364783, 0.04632776, 0.027796665, -0.059985835, -0.013555931, -0.087625116, -0.010512694, -0.042849503, 0.08772071, -0.056421503, -0.119292095, 0.14031912, -0.12183756, 0.13002402, 0.023274511, 0.023750989) * inp_0_2_0; + result4 += M4(0.093281195, 0.030127542, 0.05493629, 0.0069935485, 0.017689057, 0.023545517, 0.0811366, -0.024590306, -0.1099985, -0.03095163, -0.04294214, -0.09061835, -0.15771258, -0.082931705, 0.10125581, 0.09825419) * inp_0_0_1; + result4 += M4(0.44734138, -0.012180531, -0.09398181, -0.12005716, -0.2573845, 0.02849841, -0.11323677, -0.046026174, -0.22775516, -0.044774346, 0.038132742, 0.16683002, 0.32398078, -0.0869028, 0.041380864, 0.0139446845) * inp_0_1_1; + result4 += M4(0.053037174, -0.07678338, -0.041450456, 0.1608069, -0.019744877, 0.043494817, -0.044084672, 0.031270593, -0.15156747, -0.032741968, -0.007922767, 0.11055923, 0.053437173, -0.071062565, -0.086776584, 0.00960438) * 
inp_0_2_1; + result4 += M4(-0.038308837, -0.015956461, 0.020849645, 0.006402085, -0.009829708, -0.13160974, -0.03548144, 0.03434407, -0.11005906, 0.002573916, 0.13882823, 0.1392691, 0.016676854, -0.109087124, 0.0059470297, -0.08239393) * inp_0_0_2; + result4 += M4(-0.22784173, -0.017135287, -0.04383778, 0.13761617, 0.18187153, -0.11236875, 0.04377618, 0.0152914245, 0.12914966, 0.15687427, 0.15625125, -0.13189301, -0.25085914, 0.15259787, -0.0960026, -0.17363165) * inp_0_1_2; + result4 += M4(-0.01424878, 0.05864589, 0.05924567, -0.06697133, 0.03875816, 0.05776546, 0.008167824, -0.032441102, 0.2037382, 0.06615059, 0.01856782, 0.010310884, -0.06482916, -0.00028947697, 0.10627089, 0.030034268) * inp_0_2_2; + result5 += M4(-0.054193586, -0.025675284, 0.020265425, -0.039972305, 0.058642, 0.14323056, -0.15123907, -0.011585096, 0.16256645, -0.109824136, -0.017497974, -0.030626312, 0.05950098, -0.04655934, -0.035838444, -0.05222391) * inp_0_0_0; + result5 += M4(0.007755075, 0.05598752, -0.062134672, -0.032818593, 0.034227464, -0.19499488, -0.092409186, 0.060386922, 0.04882066, 0.09228972, -0.039126195, -0.054442573, -0.18941747, -0.07295861, 0.006411945, 0.029024774) * inp_0_1_0; + result5 += M4(-0.0033692757, -0.060536902, 0.026629914, -0.010602164, 0.05112915, 0.0024714912, -0.0032793514, 0.036075253, -0.06559311, 0.033517826, 0.106712244, 0.04076608, 0.045067567, -0.046970017, 0.078757666, 0.04772219) * inp_0_2_0; + result5 += M4(-0.038939316, -0.0031435292, 0.092506595, -0.033944752, -0.011017319, -0.057914056, -0.054770526, -0.034871124, -0.032249764, 0.014579273, 0.02030576, -0.015907379, 0.04547219, -0.040377278, -0.015825823, 0.07438816) * inp_0_0_1; + result5 += M4(0.006511647, -0.08793797, 0.15017115, 0.113985285, 0.009456968, 0.17288046, 0.18473615, 0.0019506487, -0.15352003, 0.0992849, 0.059564263, 0.050233517, -0.0027133052, 0.0049805525, 0.020023389, 0.15264674) * inp_0_1_1; + result5 += M4(0.05542958, 0.029432071, -0.118135475, 0.015489625, -0.031143768, 
0.04751464, -0.0027562892, -0.014852989, -0.017441804, 0.106149465, 0.1426039, -0.11510644, 0.051034622, 0.034320943, -0.1416798, -0.15111887) * inp_0_2_1; + result5 += M4(-0.005349655, 0.03661216, -0.039780386, -0.07300103, -0.019425578, 0.021303825, -0.008560789, 0.020043299, -0.0035151679, 0.053267673, -0.051687483, 0.055022325, -0.052634656, 0.11189838, -0.08216567, -0.029388128) * inp_0_0_2; + result5 += M4(-0.020968616, -0.10576353, -0.1924763, 0.019439435, 0.15866095, -0.17673945, 0.066261984, 0.07573692, 0.0041221776, -0.08053473, -0.043083128, -0.02708184, 0.34828785, -0.06895619, -0.03632807, -0.2802769) * inp_0_1_2; + result5 += M4(-0.06797596, 0.0013385571, 0.101501465, 0.021737084, 0.0067512398, -0.0328096, -0.030926298, -0.020768786, 0.11983645, -0.10120104, -0.10023374, 0.021199556, -0.07132269, -0.025049286, 0.014568736, 0.071718924) * inp_0_2_2; + result6 += M4(0.042367354, -0.07320226, -0.05030392, -0.03097155, -0.06848109, 0.07833887, -0.018301975, 0.0063609933, 0.04086807, 0.18728144, -0.00229801, 0.11316445, 0.15861443, 0.05616942, -0.027801897, -0.17561917) * inp_0_0_0; + result6 += M4(0.053958494, 0.03252485, -0.049048904, 0.00091042725, -0.02634856, -0.012551877, 0.09447732, 0.024077548, -0.068866804, -0.033668082, 0.00077665824, 0.05336429, 0.085203566, -0.02360444, -0.19250433, 0.2850974) * inp_0_1_0; + result6 += M4(-0.0050973175, 0.009135809, 0.048632257, -0.064880505, 0.07115352, 0.017063122, -0.018218817, 0.021659104, 0.0027115762, -0.017571406, 0.034211423, -0.008411775, 0.008927597, 0.03835467, 0.013826214, -0.07440152) * inp_0_2_0; + result6 += M4(-0.16174015, 0.046346013, 0.02666784, -0.13165195, 0.043951016, 0.124979325, 0.06786961, 0.06975871, -0.01585343, -0.043367013, -0.0069699087, 0.02535214, 0.045468464, 0.0018834862, -0.0039589703, -0.12086647) * inp_0_0_1; + result6 += M4(0.029521056, 0.12073672, -0.13906795, -0.1916976, -0.09924715, 0.19344607, 0.15368523, 0.24795122, -0.105374984, -0.15754443, 0.09340845, 0.0049955756, 
0.040059544, -0.00063394714, -0.1272499, -0.20504254) * inp_0_1_1; + result6 += M4(-0.09621672, 0.10360652, 0.05688453, -0.035986796, 0.020708011, -0.0028650032, 0.00011697742, 0.09977053, 0.0765529, -0.0788715, -0.04016248, 0.0611968, 0.055754177, 0.1229572, 0.084490284, 0.048277725) * inp_0_2_1; + result6 += M4(0.059959315, 0.00081622397, -0.09666786, 0.112278335, 0.036391973, -0.090539075, -0.044649478, 0.2225124, -0.025937365, -0.08318799, 0.11224739, -0.054097395, 0.059892207, 0.034853503, -0.05376071, 0.11600284) * inp_0_0_2; + result6 += M4(-0.012622818, -0.04029047, -0.041889485, -0.024164613, 0.06310475, -0.055094402, 0.067537926, 0.12939483, 0.12622632, -0.05457477, 0.06611501, -0.061707594, -0.017733011, 0.052899245, 0.042511255, -0.22232406) * inp_0_1_2; + result6 += M4(0.034716494, -0.11793546, 0.00036974082, 0.12034868, -0.01762745, -0.008249939, -0.062113576, 0.03492903, 0.0060695615, -0.07799395, 0.024927368, -0.2599195, 0.0010177202, -0.14419743, 0.011077671, 0.13116336) * inp_0_2_2; + result7 += M4(0.014553309, -0.0074470704, -0.16007134, -0.011405571, 0.030450094, -0.016226279, -0.13293181, -0.036833964, -0.1443664, 0.019579496, 0.118396215, -0.029384352, 0.0723277, 0.024669567, -0.101058155, 0.14942437) * inp_0_0_0; + result7 += M4(0.062210217, -0.021347476, -0.055580672, -0.05098232, -0.044253673, 0.015302768, 0.045021404, 0.11655919, -0.13224517, -0.06626581, 0.07285238, -0.08862336, 0.08787706, -0.12862337, -0.24408647, 0.21015218) * inp_0_1_0; + result7 += M4(0.02202156, 0.016423222, -0.0037286142, -0.011764392, -0.01310396, -0.008725548, -0.056195028, 0.010151796, 0.060830273, 0.058722235, -0.018515628, -0.004795146, 0.116256446, -0.03741499, -0.074066624, 0.04036169) * inp_0_2_0; + result7 += M4(-0.12240728, 0.030141866, 0.04576457, -0.012376768, -0.0330473, -0.017791318, 0.1571436, -0.043853898, -0.052927777, -0.014838781, 0.028267186, -0.12342817, -0.026195332, 0.0023472672, -0.04253277, -0.085550174) * inp_0_0_1; + result7 += 
M4(-0.2009318, -0.24020092, -0.40976435, -0.07342096, -0.3716147, 0.055616535, -0.09254849, 0.02399065, -0.012020133, 0.36927363, 0.59333795, 0.012748146, -0.14578514, -0.21347679, -0.32844797, -0.16754282) * inp_0_1_1; + result7 += M4(-0.0428318, -0.053459473, 0.028684434, -0.018248675, 0.00033567534, 0.060592398, -0.06582607, 0.018829256, 0.10419849, 0.03929341, 0.016769698, -0.014192978, 0.009670519, -0.07603321, -0.012554139, 0.051337834) * inp_0_2_1; + result7 += M4(0.042495504, -0.015798202, 0.0017990791, 0.017757915, 0.18598627, -0.06026403, -0.030309746, 0.112242505, -0.048391312, 0.047471784, 0.03632953, -0.024070622, 0.06873554, -0.01998156, 0.013355226, -0.024860214) * inp_0_0_2; + result7 += M4(0.0752057, -0.09200111, -0.106187314, 0.07621654, 0.010918868, 0.013357794, 0.0018193696, 0.02028038, -0.008123338, 0.09716468, 0.16878699, -0.053751923, 0.13322113, -0.027538763, -0.12694189, 0.11730963) * inp_0_1_2; + result7 += M4(-0.10361507, -0.068965495, -0.09642515, -0.0178064, 0.03582002, -0.009865948, -0.058565333, -0.034498867, 0.15128967, 0.082633, 0.1311318, -0.08883258, -0.06233397, -0.08476452, -0.106587805, 0.08905519) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.017418709, 0.03047621, -0.035894383, 0.029675178, -0.03798603, 0.083898894, -0.04655431, -0.006518156, 0.07839567, 0.0013389732, -0.023377389, -0.003429948, 0.009832289, -0.026624167, 0.012446694, 0.02524536) * inp_1_0_0; + result0 += 
M4(0.012563411, 0.03702292, -0.02875691, 0.032124132, 0.018167298, 0.018686306, -0.01379084, 0.045010097, -0.027397394, -0.06972298, 0.004102388, -0.046583287, -0.002449551, -0.058618017, 0.037217397, 0.06787799) * inp_1_1_0; + result0 += M4(0.028429842, -0.05467132, 0.025242021, 0.027141431, 0.019252473, -0.08065549, 0.09257724, 0.04900382, -0.013361784, 0.10677996, 0.10340843, -0.014217745, -0.054509588, 0.19412856, -0.16946264, 0.0723509) * inp_1_2_0; + result0 += M4(0.009138425, -0.006058701, 0.029574737, 0.08232435, 0.06400533, 0.037013065, 0.016174924, -0.008731072, 0.053147938, 0.02713442, 0.0134491995, 0.08542876, -0.03746861, 0.08111109, 0.05664614, -0.048998605) * inp_1_0_1; + result0 += M4(-0.02925496, 0.049888182, -0.030060813, 0.035322275, -0.0773797, -0.14322223, 0.1078786, -0.08756277, -0.026952974, 0.045466185, -0.019971544, -0.07595785, 0.32762298, 0.014192252, 0.349071, 0.17363691) * inp_1_1_1; + result0 += M4(0.083915, 0.100862205, 0.07701517, 0.027563948, 0.013311844, -0.00016412573, -0.027913488, -0.021475151, -0.017322414, 0.008609259, -0.044093776, 0.044156257, 0.086259566, -0.15022193, 0.0107320165, -0.069588274) * inp_1_2_1; + result0 += M4(0.039998673, -0.03382362, 0.04524961, 0.025787964, -0.10883636, 0.061441638, -0.53263533, 0.023401683, 0.36825883, 0.14872833, -0.34267634, 0.107345, -0.12917432, 0.018690834, -0.11513532, -0.030515788) * inp_1_0_2; + result0 += M4(-0.00828448, -0.0038745373, 0.023804154, -0.058837716, -0.3741643, -0.0052964333, -0.88595945, 0.24521157, -0.21722834, -0.013767049, 0.101908654, 0.2135949, -0.18464348, -0.111717455, -0.11288168, -0.11193086) * inp_1_1_2; + result0 += M4(0.065031424, 0.036405917, -0.20791979, -0.07621366, -0.020438274, 0.01369907, -0.021650977, 0.08698215, -0.055356365, 0.14324428, 0.18080603, 0.14535113, -0.05851366, -0.053593762, -0.09069061, 0.009242277) * inp_1_2_2; + result1 += M4(-0.027254121, -0.034437984, -0.004247502, 0.009127255, 0.05101741, 0.025027085, -0.079198875, 0.009514928, 
-0.017698936, -0.0074822307, -0.07649974, 0.040912405, -0.037677895, 0.07438578, 0.06545263, -0.07207911) * inp_1_0_0; + result1 += M4(-0.010202402, 0.007117349, -0.062361635, -0.03728422, 0.05150864, 0.037142407, 0.12592474, -0.039169103, 0.032473765, 0.013044754, 0.14421019, -0.10579016, 0.31002274, -0.04012663, 0.21835472, 0.028253479) * inp_1_1_0; + result1 += M4(0.0137379, -0.089400865, -0.017349815, 0.018399145, -0.030090353, -0.09054616, -0.02951489, -0.019568171, 0.11513796, -0.011408798, 0.023999803, 0.04628498, -0.33841875, -0.5108933, -0.09424127, -0.108504064) * inp_1_2_0; + result1 += M4(0.028551575, 0.012780736, -0.047223996, -0.02969291, -0.35930815, -0.013179916, -0.21856937, 0.0048393128, 0.100381486, 0.046919473, -0.024066515, 0.09674702, 0.04530783, 0.10557541, 0.043592915, -0.13429579) * inp_1_0_1; + result1 += M4(0.28134185, -0.058985457, 0.03692803, -0.08276008, 0.37679648, 0.36340785, 0.14437196, 0.111308895, 0.12185249, 0.065915205, 0.03668009, -0.07789429, 0.1793655, 0.35379803, -0.09055568, -0.05690878) * inp_1_1_1; + result1 += M4(-0.15130775, 0.13480394, -0.09216019, 0.04585281, -0.09969302, -0.24532558, 0.019521289, -0.14670423, -0.08655364, -0.058140524, -0.05669363, 0.06634686, 0.019699907, -0.2932691, -0.1847335, 0.13557985) * inp_1_2_1; + result1 += M4(0.01912094, 0.0039936244, -0.008487629, 0.03292135, -0.1333557, -0.01869552, -0.17619574, -0.17558426, -0.23783557, 0.03481586, -0.14363688, 0.09256015, 0.0031344262, -0.13423806, 0.07353918, 0.08341448) * inp_1_0_2; + result1 += M4(-0.11895379, -0.26720572, 0.017094158, -0.00051445625, -0.23143825, 0.27810067, -0.3132735, -0.0872267, 0.105652176, 0.09114439, 0.11441366, -0.12430906, 0.32491785, -0.075133525, 0.031382542, -0.08362819) * inp_1_1_2; + result1 += M4(0.06069166, -0.012380882, 0.053487338, 0.14757203, -0.0035123285, 0.14036289, -0.6101021, -0.030852132, 0.06909205, -0.06527503, -0.035564177, 0.058050063, -0.09365824, -0.06887864, 0.14134659, -0.049946763) * inp_1_2_2; + 
result2 += M4(0.060764197, -0.044476423, 0.006212088, 0.004834526, -0.033490956, -0.024018971, -0.019870147, 0.020748984, -0.104704544, -0.010575584, 0.02419713, 0.018909888, -0.014168303, 0.006435106, -0.019482184, -0.097632654) * inp_1_0_0; + result2 += M4(0.09645522, 0.06339595, -0.008657519, -0.029634126, 0.027884953, -0.03705686, 0.036230784, -0.06363273, -0.06456915, 0.035239473, -0.00907562, -0.06692202, 0.16278431, -0.090533294, -0.046527106, -0.043334037) * inp_1_1_0; + result2 += M4(0.030307516, 0.03852743, 0.02691295, 0.005781487, -0.012388547, -0.004266756, 0.021897772, 0.019205237, -0.19809248, -0.06270081, 0.024294604, 0.017338542, -0.04198413, 0.020905977, -0.053037666, 0.03417977) * inp_1_2_0; + result2 += M4(-0.02183366, 0.003552609, -0.025223436, 0.07945964, -0.044301387, 0.026234947, -0.13667427, -0.115775794, -0.09878849, -0.029482584, 0.036059596, 0.032298874, -0.069991216, 0.0048591127, 0.007684848, -0.061667748) * inp_1_0_1; + result2 += M4(0.03458296, -0.16721064, 0.19953558, 0.007891199, -0.07995672, 0.0049745836, -0.025245689, -0.09587196, -0.20514953, -0.15887311, -0.048276924, -0.026260328, -0.0007540655, 0.2853079, 0.10725677, 0.067231655) * inp_1_1_1; + result2 += M4(-0.043415755, -0.03609343, -0.15651539, 0.029634878, 0.015398887, 0.106489025, 0.16573432, 0.08572708, -0.057816554, 0.11592395, -0.061352186, 0.045980256, 0.027626013, 0.1205891, -0.12826093, 0.17988913) * inp_1_2_1; + result2 += M4(-0.07613995, 0.03188516, 0.050434474, 0.07684799, -0.048884198, -0.05990355, -0.15424035, -0.12519434, -0.13924104, -0.043877065, -0.024292545, 0.12428708, 0.049553752, -0.052151076, -0.08552776, -0.08521151) * inp_1_0_2; + result2 += M4(0.06283567, -0.09408841, 0.17939365, 0.027883235, -0.0572143, -0.12717895, -0.23556021, -0.3437946, -0.28594282, 0.21834908, 0.0075811013, 0.11526571, -0.06848633, 0.07531049, 0.10427754, 0.17251001) * inp_1_1_2; + result2 += M4(-0.00060835853, -0.1573507, -0.053589314, 0.1054587, -0.16309783, 0.17876866, 
-0.31901908, -0.3161011, -0.10772736, 0.060162168, 0.06941775, 0.029499564, 0.033513017, -0.10560592, 0.022555176, 0.062695414) * inp_1_2_2; + result3 += M4(-0.015335679, 0.07446124, -0.025621187, 0.017600443, 0.0027819437, -0.006842744, 0.0061612506, -0.13766107, -0.060149062, -0.037893794, 0.03802441, -0.067901194, 0.09187975, 0.008092903, -0.00014844636, 0.08863902) * inp_1_0_0; + result3 += M4(0.09968198, 0.050697595, -0.024685169, 0.03493401, -0.08088221, 0.07504558, -0.052292805, 0.13931729, 0.065187216, -0.061902452, -0.08251134, 0.04479079, 0.07394274, -0.118048705, 0.22057092, -0.23120454) * inp_1_1_0; + result3 += M4(0.03313147, 0.04955954, -0.012374923, 0.04282824, 0.06583755, -0.017040761, 0.11975665, 0.03809186, -0.16409242, -0.014598374, 0.099037714, -0.0043711704, -0.076318435, 0.087188765, 0.09313884, 0.09535661) * inp_1_2_0; + result3 += M4(-0.11161148, -0.057124633, 0.043214656, -0.110703886, -0.06603701, 0.042456217, -0.017486071, 0.027518172, -0.24374628, 0.01991404, -0.059355177, -0.02570105, 0.07711955, 0.015240446, -0.06977584, 0.12751685) * inp_1_0_1; + result3 += M4(0.054609764, -0.21227507, -0.011209875, -0.0383821, 0.06450621, 0.089725964, -0.018912842, 0.022530952, -0.05859137, -0.06519225, 0.11518891, -0.17043544, 0.30075353, 0.14126804, -0.20937167, -0.30027533) * inp_1_1_1; + result3 += M4(-0.14063236, 0.08310379, 0.14488798, -0.09376922, 0.03684436, 0.064583085, -0.0061855465, -0.0017473684, -0.2859202, 0.003856779, -0.04442142, 0.026713409, 0.40383524, -0.25232488, 0.07941386, 0.3922703) * inp_1_2_1; + result3 += M4(0.03794146, 0.06680176, 0.02033688, 0.030781304, -0.4612068, -0.10146264, -0.18086125, 0.3228064, -0.02779584, 0.05158886, -0.17849232, -0.047727022, -0.028723454, -0.0060423072, 0.1464432, 0.15395641) * inp_1_0_2; + result3 += M4(-0.018780684, -0.03252803, 0.2263186, -0.13682126, -0.47732577, -0.2497758, 0.0961493, 0.01326684, -0.07228836, -0.009488362, 0.18675251, -0.094570085, 0.17758664, 0.06300553, 0.07841854, 
-0.16636424) * inp_1_1_2; + result3 += M4(0.041384522, 0.14973554, -0.13226996, 0.034936458, -0.5047917, 0.054755438, 0.12391931, 0.1596265, -0.40879637, 0.059420936, 0.06657247, 0.028592296, 0.2358234, 0.033842545, 0.06944371, -0.16912213) * inp_1_2_2; + result4 += M4(0.05311598, 0.019826028, 0.011086883, -0.021887308, 0.059144896, -0.009230842, 0.054118145, 0.103895284, 0.10083564, -0.010336906, -0.07319659, -0.048320077, -0.05682911, -0.1619715, -0.05072684, -0.012430253) * inp_1_0_0; + result4 += M4(-0.071258165, -0.07206449, 0.007877828, 0.04877597, -0.03045355, 0.047173545, -0.11567965, 0.028120818, -0.022546913, 0.027650485, 0.034297872, -0.013740084, 0.18390064, 0.0110989, 0.117114075, 0.20891143) * inp_1_1_0; + result4 += M4(-0.045401983, 0.013605427, 0.016331915, -0.024901144, -0.033758435, -0.031822678, -0.016521053, -0.10487585, 0.04210012, -0.10214398, -0.018865421, -0.029367005, -0.025667086, 0.41487533, 0.032567278, -0.22080663) * inp_1_2_0; + result4 += M4(0.0037877297, 0.021871453, 0.011498469, 0.006139841, -0.021233842, 0.056552038, -0.13259467, -0.18828025, -0.026284527, -0.041182987, 0.10565905, -0.07781128, -0.07258588, -0.09024599, -0.14303032, 0.06265986) * inp_1_0_1; + result4 += M4(-0.20828693, 0.0803589, -0.07921446, -0.042546384, -0.054562993, -0.30823, 0.01087237, 0.28675285, 0.30932355, -0.10021583, -0.115128726, -0.04681989, -0.4963274, 0.12091105, -0.3624494, 0.26615098) * inp_1_1_1; + result4 += M4(-0.07072683, -0.1668421, -0.031643827, -0.16955912, 0.15100871, 0.17900783, 0.13331188, -0.024202855, 0.062017065, 0.034024704, 0.047093786, 0.082588755, -0.1429204, -0.23887563, 0.28322488, 0.011296719) * inp_1_2_1; + result4 += M4(-0.043304637, 0.050246876, 0.043262403, -0.08105104, 0.11705984, -0.3195758, 0.36736345, -0.30946398, 0.058647998, 0.032681633, -0.14707363, 0.04745867, 0.11118461, -0.054096732, 0.05881837, 0.103959955) * inp_1_0_2; + result4 += M4(0.4009369, -0.15147172, -0.020487187, 0.12404583, -0.3079209, -0.067801125, 
0.8490191, -0.8472001, -0.06286357, -0.052003402, -0.05798621, 0.055178683, -0.060744245, 0.013418172, -0.12043419, 0.08806088) * inp_1_1_2; + result4 += M4(-0.03778331, 0.10257682, -0.07735904, 0.062345475, 0.29189754, -0.26781094, 0.12107478, -0.19960314, 0.041006602, -0.05646107, 0.002505815, -0.112233184, 0.055230446, -0.039380968, 0.21954706, -0.02870625) * inp_1_2_2; + result5 += M4(0.016291095, -0.011221429, 0.015665311, -0.053139552, 0.026286267, 0.023039427, 0.023016712, -0.061707195, -0.052618805, -0.015601597, -0.02011242, -0.050300457, -0.053843774, -0.20685083, 0.027301963, 0.10998949) * inp_1_0_0; + result5 += M4(0.03837473, 0.05254415, -0.00080854684, -0.040619116, -0.0020735469, -0.13120306, 0.05770567, 0.06391536, 0.028435186, 0.0027125527, -0.015089462, 0.07767398, 0.12986776, -0.4159729, 0.08245571, 0.11465695) * inp_1_1_0; + result5 += M4(0.04034278, -0.008207551, 0.03838088, 0.056135938, -0.032676563, 0.031642266, -0.045962267, 0.059938844, -0.042130135, -0.04537576, 0.028058194, -0.016807662, 0.16456495, -0.6113196, -0.42725474, -0.16307503) * inp_1_2_0; + result5 += M4(0.017811567, 0.056559052, -0.014353315, 0.0133377705, -0.03318095, 0.092453144, 0.05246356, -0.08190049, -0.06832507, -0.00080604915, -0.0076090493, 0.14349502, 0.012797353, -0.2697733, -0.12046655, -0.057533484) * inp_1_0_1; + result5 += M4(0.15638834, 0.048883244, -0.051702894, 0.06488677, -0.03852504, 0.038575765, 0.23324871, 0.09877689, -0.075095855, -0.04830458, -0.24212718, -0.014865598, -0.17191437, -0.77365506, 0.008027985, 0.22996089) * inp_1_1_1; + result5 += M4(-0.017335247, 0.14751019, 0.06585923, -0.17641634, -0.06569785, -0.26129907, -0.22370629, -0.13147283, -0.03262299, -0.013248584, 0.04594725, -0.13160022, -0.008222502, -1.0356127, -0.36193693, -0.44051754) * inp_1_2_1; + result5 += M4(-0.05584289, 0.029131265, 0.034898836, 0.038284853, 0.012738034, -0.1209926, -0.07185093, -0.18905109, 0.054480888, 0.13217686, -0.073891, -0.13050117, 0.06685193, -0.1597491, 
0.09448252, -0.005437527) * inp_1_0_2; + result5 += M4(-0.0196811, -0.19598103, -0.07783923, -0.063255794, -0.052678622, -1.137565, -0.225611, -0.11549385, -0.08625303, -0.12001293, -0.06118455, 0.21607293, -0.18815157, -0.35172546, -0.0025106634, 0.002445428) * inp_1_1_2; + result5 += M4(0.13319601, -0.07210835, -0.13232388, 0.02761432, -0.18799822, -1.2781672, 0.050042987, -0.13998912, -0.106975965, -0.108207084, 0.08443993, 0.032595377, -0.01976393, -0.6081106, -0.11164538, 0.03883463) * inp_1_2_2; + result6 += M4(0.033074886, 0.01456681, -0.004679765, -0.08192022, -0.067768045, -0.055300165, -0.00333654, 0.041301347, -0.046085943, -0.03765881, 0.029648192, 0.05373143, 0.0051887627, 0.0589174, 0.015505131, 0.06869475) * inp_1_0_0; + result6 += M4(0.025754485, -0.037234567, -0.07378072, -0.099404216, 0.09122528, 0.17751941, 0.026758412, -0.039209135, 0.021081837, -0.0034884172, 0.01572646, 0.09727677, -0.036099352, 0.018142808, 0.014511881, 0.0604167) * inp_1_1_0; + result6 += M4(-0.011542189, 0.07421957, -0.009463231, -0.096331015, -0.051909856, -0.11668948, -0.025338132, -0.007597182, -0.039281595, -0.028591033, 0.008283274, 0.056748785, -0.12518261, 0.15266642, 0.024410337, -0.026743965) * inp_1_2_0; + result6 += M4(-0.15609896, -0.043293085, -0.010197192, -0.16263603, -0.13696565, 0.07399372, 0.031591773, -0.12916496, -0.03667822, -0.0747791, -0.08600092, 0.34519646, 0.09757736, -0.051031727, -0.041945048, 0.08449455) * inp_1_0_1; + result6 += M4(0.21484835, -0.13184159, 0.06463381, -0.18359545, 0.19409572, -0.059853785, -0.046886705, -0.15263551, 0.09478074, 0.06894887, -0.15709934, 0.3627044, 0.32462704, 0.22076513, -0.17329441, 0.26266629) * inp_1_1_1; + result6 += M4(0.020649584, -0.1902899, 0.30580583, -0.19065888, -0.08899363, -0.0066667954, 0.025861258, -0.22826087, 0.036973532, 0.054434314, -0.10382239, 0.27179778, 0.21625055, -0.13530569, -0.072385296, -0.065657705) * inp_1_2_1; + result6 += M4(0.016347792, 0.03480103, -0.048113488, 0.06259222, 
-0.4316581, 0.091990374, -0.02009009, 0.017726596, 0.0064451783, -0.04213947, -0.06700353, 0.047655486, -0.0014482669, 0.027389871, 0.0051922794, -0.08153045) * inp_1_0_2; + result6 += M4(-0.066500425, -0.07152405, -0.045412377, 0.12576097, -0.2961856, -0.1929178, 0.31079096, -0.013092226, -0.2451591, -0.039968736, -0.09930225, 0.08451656, 0.03885513, 0.0419801, 0.023305446, 0.02964816) * inp_1_1_2; + result6 += M4(0.03337743, -0.03295367, 0.07746758, 0.0657193, 0.25236058, -0.16876762, -0.1067636, 0.03514839, 0.015139447, 0.018583262, -0.07496198, 0.15334865, -0.03983048, 0.0834044, -0.027389742, -0.2050976) * inp_1_2_2; + result7 += M4(0.033491794, 0.033431564, -0.032191694, -0.03791176, -0.10448618, -0.0027218966, -0.048336614, -0.020620013, 0.0008278457, -0.005999135, -0.025837826, 0.06519663, 0.05074621, -0.018540831, 0.0029468199, 0.074196905) * inp_1_0_0; + result7 += M4(0.062896974, -0.009443187, 0.020553943, -0.120330945, 0.12485581, -0.070784785, 0.04606034, 0.014535254, -0.068321794, -0.048461266, 0.10030074, 0.03287768, -0.117403835, -0.0026079826, 0.12015297, 0.33320388) * inp_1_1_0; + result7 += M4(-0.02412423, 0.0027698653, -0.0034215215, 0.0048054494, -0.015451561, -0.038356625, 0.042229865, -0.003276745, 0.011244953, 0.02155011, -0.09089103, -0.017926773, -0.18452801, -0.0009074408, -0.027913399, -0.118693486) * inp_1_2_0; + result7 += M4(-0.044045206, -0.026545795, 0.0625399, 0.036388937, 0.023242345, 0.042980168, -0.051898457, -0.038802974, -0.05418674, 0.054400906, -0.008519099, 0.030409131, 0.06289983, -0.03152753, -0.054193035, -0.04534729) * inp_1_0_1; + result7 += M4(0.035021484, -0.1928886, 0.20334782, -0.1292003, 0.189458, 0.24525474, -0.16314523, 0.11621057, -0.04987817, 0.20187682, -0.24974394, 0.02364756, -0.44616988, 0.022775814, 0.099305615, -0.18563195) * inp_1_1_1; + result7 += M4(0.06319084, -0.06909548, 0.21568686, -0.09182502, -0.18536936, -0.026132217, -0.037597112, -0.13205439, -0.009697983, -0.033270434, 0.0004985, 0.08547708, 
-0.17955612, -0.109026566, 0.1683259, 0.032643046) * inp_1_2_1; + result7 += M4(-0.050920185, 0.014293551, 0.052467205, -0.013185744, 0.6167788, 0.00095461216, -0.17809248, 0.2858305, -0.004065777, 0.003838619, -0.03848994, 0.18019846, 0.08137998, 0.024889063, -0.039636772, 0.044028163) * inp_1_0_2; + result7 += M4(-0.20140332, -0.060450733, -0.00053162617, 0.060781363, 0.9409405, 0.07785594, 0.26325184, 0.06354481, -0.14579262, -0.08059214, 0.13374886, -0.11254252, 0.08748199, 0.021145327, 0.064878404, -0.06348521) * inp_1_1_2; + result7 += M4(0.0680433, 0.11711085, 0.33918294, 0.0029023325, 0.55087554, 0.119711325, 0.14793326, -0.06605746, 0.20209055, 0.006866348, -0.051688045, 0.010190858, -0.029470397, 0.013574893, 0.1306819, 0.10193515) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.07494, -0.05077266, -0.026659595, 0.030619424, -0.0038135254, 0.05391335, 0.1570492, 0.08343182, 0.015458231, -0.0057014613, -0.042156916, -0.036272705, 0.014460308, -0.030670522, 0.018927738, -0.027828531) * inp_2_0_0; + result0 += M4(0.15514928, 0.006001489, -0.09822864, 0.0346804, 0.08639671, 0.08669355, 0.065377995, 0.016002357, -0.084707804, -0.08958183, -0.029676473, -0.05378617, 0.003623887, -0.056604553, 0.0067594675, 0.022004629) * inp_2_1_0; + result0 += M4(-0.09237165, -0.1711586, -0.1387132, 0.015620278, 0.03760303, -0.109505035, -0.00024950327, -0.08786268, 0.06631906, 0.07354312, -0.02684669, -0.085153036, -0.029682446, 
0.007307099, -0.05943568, 0.09192438) * inp_2_2_0; + result0 += M4(-0.051590115, -0.09793452, 0.13194951, -0.056596216, -0.18033156, -0.027467335, 0.20966366, 0.0018317275, -0.054502442, 0.04424457, -0.013086082, -0.077963166, 0.02515949, -0.031817596, 0.013543345, -0.0015129097) * inp_2_0_1; + result0 += M4(0.10139761, 0.39920083, 0.30134752, 0.17718132, 0.03846701, -0.06416088, -0.23580274, -0.07190605, -0.0031325787, -0.109290145, -0.051111437, -0.06360225, -0.045040537, -0.051740255, 0.07409316, 0.11579864) * inp_2_1_1; + result0 += M4(0.044332467, 0.0133779235, 0.12232053, -0.13510416, -0.08397025, 0.04206557, 0.0117594255, 0.0050962176, 0.0054156976, 0.05086221, 0.058712497, -0.05262061, -0.021198815, -0.036517896, -0.004759374, 0.06316373) * inp_2_2_1; + result0 += M4(0.055690076, 0.0017181535, 0.11878236, 0.03162121, -0.10013495, 0.035604306, 0.057296947, -0.07491181, 0.023251142, 0.04911363, 0.038059786, 0.015719399, 0.0046298997, -0.014167606, -0.024076566, -0.01338639) * inp_2_0_2; + result0 += M4(0.0058332984, -0.067495145, 0.11614125, -0.108366795, -0.0034360816, -0.017702324, 0.07662247, 0.01511283, -0.08448825, -0.00885264, -0.013982804, 0.022915812, 0.034426693, 0.04153597, -0.048677947, -0.0032110345) * inp_2_1_2; + result0 += M4(0.054809652, -0.0846411, 0.20322223, -0.15459712, 0.15113762, 0.038187418, -0.19329266, 0.048639983, 0.010586334, 0.05149305, 0.06670847, 0.034048304, -0.080881335, -0.026839003, -0.13555643, -0.005457974) * inp_2_2_2; + result1 += M4(0.17945331, -0.023931164, 0.027202131, 0.08880175, 0.04402973, 0.06695098, 0.08354948, -0.19006556, 0.026199497, -0.009296187, 0.0017142799, -0.08222427, -0.047533553, 0.08608704, 0.054214083, 0.052421566) * inp_2_0_0; + result1 += M4(0.09861517, -0.04518242, -0.102684125, -0.043397196, 0.05195172, 0.0066635907, -0.05621173, -0.05790526, -0.06728771, -0.07670168, 0.13762155, 0.06563987, 0.04788187, -0.003676454, -0.028143033, -0.028035967) * inp_2_1_0; + result1 += M4(0.05009104, 0.09247924, 
-0.18710847, 0.110595345, 0.040749308, 0.2177276, 0.13237047, 0.07979705, 0.11248281, -0.054301694, 0.13807157, -0.03904279, -0.08975319, -0.008645623, -0.12852934, 0.0369289) * inp_2_2_0; + result1 += M4(0.024393665, -0.008234926, 0.088239424, 0.07658029, 0.09357282, 0.12142016, 0.1830739, 0.02855118, -0.103374995, 0.05672652, -0.01929009, -0.08387968, 0.08673028, 0.13491224, -0.0062334486, 0.0981836) * inp_2_0_1; + result1 += M4(-0.21178693, 0.121799774, 0.110035494, -0.16204852, -0.27262422, -0.45329106, 0.07763265, 0.16171797, -0.0042413822, 0.18485485, 0.025555402, 0.008333991, 0.12641914, -0.060500026, -0.08808921, 0.020874847) * inp_2_1_1; + result1 += M4(0.10924835, 0.19907112, 0.049274243, 0.048267387, -0.14942577, -0.08877669, 0.076406814, -0.0057600373, -0.0975423, 0.18761975, -0.0658328, -0.0686535, -0.0024109816, 0.0068818084, -0.013526458, 0.048224322) * inp_2_2_1; + result1 += M4(0.06213526, -0.055960607, 0.06532137, 0.23777834, 0.16414092, 0.12011937, -0.08434864, -0.038254157, -0.119830206, -0.0276754, 0.034424048, 0.064848155, 0.024560139, 0.0823504, -0.0019978674, -0.06813539) * inp_2_0_2; + result1 += M4(-0.052649997, -0.06047692, 0.09607663, -0.020205185, 0.000105328494, -0.04821212, -0.06589419, 0.064222395, 0.0137073435, 0.063751325, 0.011678911, 0.16447645, -0.14408441, -0.046732858, 0.11591468, -0.12921704) * inp_2_1_2; + result1 += M4(-0.029070064, 0.019770756, -0.054608867, -0.0013570767, 0.01393227, 0.15071338, 0.106768034, -0.1397014, 0.086960815, -0.054786198, -0.07481496, 0.041338097, -0.12111123, 0.02133726, 0.07077017, -0.09974869) * inp_2_2_2; + result2 += M4(-0.06523624, -0.011637894, 0.013202765, 0.028338807, 0.036488313, -0.047921047, 0.10811481, -0.0680509, -0.03791697, 0.007575854, -0.071897626, -0.024764491, -0.08431334, 0.08933683, -0.05908894, -0.026652684) * inp_2_0_0; + result2 += M4(0.113793075, 0.14882053, -0.08299222, 0.15829425, 0.016099678, 0.052491635, -0.05269082, -0.14886315, -0.0727342, 0.06401357, 0.045290276, 
-0.1656238, 0.050183937, 0.012482351, 0.07713139, 0.09076516) * inp_2_1_0; + result2 += M4(0.12187568, 0.03305523, 0.008213214, 0.104071446, -0.03357946, -0.013462112, 0.1129802, -0.08046473, 0.04575342, 0.038853917, -0.013957368, -0.11232587, 0.015577268, -0.0051343907, -0.019716062, 0.06611522) * inp_2_2_0; + result2 += M4(-0.03968841, -0.15322322, 0.055316787, -0.005211975, -0.04737429, 0.021851042, 0.004827195, -0.060772017, 0.062346663, -0.08750688, -0.1653267, -0.22385976, -0.13247189, 0.05052236, -0.099613376, 0.11546412) * inp_2_0_1; + result2 += M4(-0.22240499, -0.27284405, 0.30428737, -0.39086345, 0.14287558, 0.03783774, -0.321136, 0.49711552, 0.19291952, -0.19244896, -0.1262286, -0.7186221, 0.021420028, 0.16798481, -0.001190083, 0.603055) * inp_2_1_1; + result2 += M4(0.04444056, -0.049011413, 0.09896402, -0.16583309, -0.1071772, -0.052570816, 0.026494984, 0.028089805, 0.07932182, 0.0862509, -0.011307004, -0.034114096, -0.07756723, -0.057702307, -0.017363068, 0.056191634) * inp_2_2_1; + result2 += M4(0.041961048, 0.004297009, -0.0545132, 0.044127725, -0.10441683, 0.11742233, -0.04116199, 0.15055777, 0.11402831, 0.0011245033, -0.033392046, -0.12580137, -0.07758799, 0.044290204, 0.027751498, 0.10705669) * inp_2_0_2; + result2 += M4(0.06467788, 0.086151935, 0.07726434, 0.09277324, -0.04042926, -0.004939324, 0.06698208, -0.0022127065, 0.0053815665, 0.0046978123, -0.11127949, -0.09446042, 0.048278403, 0.017751362, 0.012433524, 0.048401892) * inp_2_1_2; + result2 += M4(0.06402855, -0.050090324, -0.004710745, 0.08049927, -0.069437996, 0.03885143, 0.085725866, 0.022214757, 0.04614415, 0.01786597, 0.069098175, -0.036424533, -0.024743352, -0.02808395, -0.09000762, -0.003649834) * inp_2_2_2; + result3 += M4(-0.045640748, -0.0063400236, -0.0013699245, 0.030135032, 0.037648123, 0.001330038, 0.048967063, 0.021150252, 0.007981003, -0.048084144, 0.04252307, -0.0145246005, -0.06772604, 0.036997158, -0.004073418, 0.049042378) * inp_2_0_0; + result3 += M4(0.031741023, 
0.0010430248, -0.112246305, -0.024879638, 0.067149535, 0.046017114, -0.0011107507, 0.020667493, 0.033573058, -0.034145474, -0.047484566, 0.14315285, 0.01293433, 0.008634882, -0.010181065, -0.030354196) * inp_2_1_0; + result3 += M4(0.19533974, -0.05397993, -0.20672618, -0.016877312, -0.0047949064, -0.027004106, -0.07124846, -0.18177177, -0.05796344, 0.03238938, -0.032951236, 0.047307037, -0.009142184, 0.0076127644, 0.029982325, 0.018763395) * inp_2_2_0; + result3 += M4(-0.012870685, -0.018568646, 0.10898687, 0.011072115, 0.022851322, -0.008432655, -0.108623154, 0.09017585, -0.076823056, 0.0005175829, -0.18020837, -0.060901105, -0.14940912, -0.0318334, 0.031519167, -0.074741654) * inp_2_0_1; + result3 += M4(-0.034363076, 0.015508316, 0.031822786, -0.21294376, 0.11306669, 0.013865108, -0.22649102, 0.14027794, -0.33663842, 0.032454435, 0.017281126, -0.015645262, 0.075483166, -0.026638439, 0.15642151, 0.025092613) * inp_2_1_1; + result3 += M4(-0.07745874, -0.014501854, -0.14062268, -0.07390119, -0.08448971, -0.0033370005, -0.066395864, 0.043039158, -0.15300897, -0.0065638325, 0.080482855, -0.035446554, 0.026744055, 0.028667608, -0.022409528, -0.019115414) * inp_2_2_1; + result3 += M4(-0.02511079, 0.041671794, 0.17295955, -0.071983226, 0.07804442, -0.015229377, 0.067681365, -0.011101983, 0.015711699, -0.014400514, 0.005392753, 0.001381756, 0.07462556, -0.00034293171, -0.047388285, 0.05993132) * inp_2_0_2; + result3 += M4(0.036151588, 0.02973521, 0.044248186, -0.11452938, 0.11488021, 0.007013514, -0.09613799, 0.12363617, -0.034297317, -0.0061639533, 0.12067807, 0.017623423, -0.06019171, -0.0772687, -0.092259265, -0.015990047) * inp_2_1_2; + result3 += M4(0.01212578, 0.010690265, -0.049116254, -0.10172036, -0.03062488, -0.019137895, 0.058667358, 0.073232345, 0.027817994, 0.06959846, -0.026369462, 0.018732924, -0.00670127, 0.011567502, 0.014396295, -0.003478614) * inp_2_2_2; + result4 += M4(-0.016565857, 0.063714094, 0.021283757, -0.10010239, -0.28761837, -0.029374009, 
-0.021100385, 0.08887346, -0.023292013, -0.02542198, 0.013775324, 0.17113547, -0.01357601, -0.008095763, 0.033696268, -0.021619827) * inp_2_0_0; + result4 += M4(-0.16397667, -0.06556849, -0.057644397, -0.030522967, 0.0986292, 0.019353693, 0.039616942, 0.050109237, 0.14428373, 0.05934183, -0.058447093, -0.03190684, -0.038962226, -0.050925408, 0.046515387, 0.019207321) * inp_2_1_0; + result4 += M4(0.09507322, 0.11934473, 0.02446529, 0.18916437, 0.09081171, -0.052057076, -0.03183994, 0.04618198, -0.06393724, 0.011453732, -0.0018015533, -0.09516997, 0.021399254, -0.020272523, -0.016122052, -0.008919146) * inp_2_2_0; + result4 += M4(0.030786015, 0.073883876, 0.028877417, -0.02799471, -0.2175274, -0.063089125, -0.09729074, -0.07417067, -0.078861006, 0.08268576, -0.10159341, -0.10323134, -0.084693715, 0.055255234, 0.00018154246, -0.024651531) * inp_2_0_1; + result4 += M4(0.12690236, 0.13265236, -0.52678114, -0.1622023, -0.111389056, -0.22853708, 0.2827274, 0.10031751, 0.0019659442, -0.0644262, 0.08141505, 0.12996665, 0.14963876, -0.050334495, -0.054661326, -0.10075027) * inp_2_1_1; + result4 += M4(0.16956973, -0.12632602, -0.1185003, 0.16216503, -0.07984294, 0.040402763, -0.011387946, 0.087027736, -0.05799177, -0.07410546, 0.117217034, -0.005742952, 0.052801684, -0.008091848, -0.041884046, 0.051865872) * inp_2_2_1; + result4 += M4(0.02390533, -0.061731048, 0.07325091, 0.11913895, -0.1702638, 0.026547112, -0.17446364, -0.010696006, 0.073367536, 0.02286371, -0.00652968, -0.065270185, -0.05636013, 0.043165658, -0.10097027, -0.10408143) * inp_2_0_2; + result4 += M4(-0.091289975, -0.011250953, -0.11032173, 0.10090456, -0.038040686, 0.08335754, 0.04166047, 0.0976977, -0.03980907, -0.044055067, -0.006025022, 0.012358866, 0.06741738, -0.027368607, 0.054619547, 0.069308214) * inp_2_1_2; + result4 += M4(0.14418882, 0.11888136, 0.059486203, 0.20024854, 0.09193799, 0.26633242, 0.06048822, 0.047990832, 0.015340219, 0.04504112, 0.066571854, -0.028241217, -0.013371457, 0.011218797, 
-0.004674537, 0.023134133) * inp_2_2_2; + result5 += M4(0.11911977, 0.18507795, -0.09412964, 0.062479537, 0.12875988, -0.2322169, 0.061461903, 0.029537681, 0.046109173, -0.011815525, -0.021828849, -0.050121646, -0.100107506, 0.025856985, 0.0055207876, 0.051024478) * inp_2_0_0; + result5 += M4(0.034037363, 0.21084681, -0.067724235, -0.0569512, -0.016327107, -0.21827069, 0.14513928, 0.15991366, 0.03875252, 0.0049411166, -0.12864988, 0.12917945, -0.0020353121, 0.011334821, 0.014256529, -0.07229825) * inp_2_1_0; + result5 += M4(-0.18729857, 0.3316997, -0.031916264, 0.29055, 0.06373419, -0.13255799, 0.095508285, -0.21461032, 0.056666374, 0.009753959, 0.05922951, 0.060121857, -0.006256435, 0.0016009604, -0.01812742, 0.011361355) * inp_2_2_0; + result5 += M4(-0.06420593, 0.23263887, 0.14168186, 0.02681991, -0.016227413, -0.48766264, 0.038944304, -0.09862829, -0.0688283, -0.04345934, -0.05915392, 0.04637451, 0.020248426, -0.0061673345, 0.038848415, 0.05389427) * inp_2_0_1; + result5 += M4(0.25341606, 0.4970163, 0.47734335, -0.14620154, 0.0515255, -0.6986546, -0.3227576, 0.108818404, -0.08365794, -0.0033023611, -0.0146560185, -0.0858513, -0.049081232, -0.019801008, 0.02899775, -0.08498034) * inp_2_1_1; + result5 += M4(0.18798043, 0.36286557, 0.13465525, -0.015814202, 0.21601401, -0.21095707, 0.060783837, -0.121664055, -0.16187255, -0.011786768, 0.04611115, -0.06684308, 0.028182462, -0.00198046, -0.018785324, 0.022524353) * inp_2_2_1; + result5 += M4(-0.082779355, 0.24071859, 0.012786101, 0.1073771, 0.041381676, -0.261746, 0.010940857, -0.015798206, 0.025085129, 0.035429824, -0.014375972, 0.054150008, 0.01492869, -0.04183125, 0.03447971, -0.05097506) * inp_2_0_2; + result5 += M4(-0.022266975, 0.43461025, -0.09900948, 0.06827321, 0.0064982283, -0.38604292, -0.07445078, 0.10005422, 0.03834597, 0.061704703, 0.04538771, -0.0039772815, -0.068917714, -0.024470262, -0.10286511, -0.012490338) * inp_2_1_2; + result5 += M4(0.13350421, 0.27473417, -0.14574355, 0.10282295, -0.04357392, 
-0.21660705, 0.0912675, -0.034716353, -0.018700225, -0.0933954, -0.0029876998, -0.025813917, 0.0057641435, -0.014384098, 0.039757356, 0.05858671) * inp_2_2_2; + result6 += M4(0.11544621, 0.009331294, -0.03409185, 0.041576765, 0.037711807, 0.15027703, 0.04431929, 0.018683648, -0.08355787, 0.05569185, -0.024628434, 0.025105964, -0.04255377, 0.08643012, -0.034276597, -0.017503174) * inp_2_0_0; + result6 += M4(-0.0402898, -0.21648401, 0.04964956, 0.0062383604, -0.025755888, -0.13278158, 0.029112928, 0.04210357, 0.09784074, -0.044734973, 0.034939762, 0.07313087, -0.004805195, -0.04084926, -0.0073794792, -0.06263254) * inp_2_1_0; + result6 += M4(0.07156469, 0.19937184, -0.027408663, 0.0023804537, 0.018871117, 0.02836203, 0.014850682, 0.016555728, -0.0221832, 0.05842921, -0.035973646, -0.098671794, 0.023996044, 0.032854408, 0.003671901, 0.059674773) * inp_2_2_0; + result6 += M4(-0.024599303, 0.105640784, -0.012556766, -0.051186815, -0.056619275, -0.016585678, 0.016571127, -0.0223009, 0.19242522, 0.00073244213, -0.012116432, 0.10983492, -0.15146567, 0.07593534, 0.022069179, -0.0485135) * inp_2_0_1; + result6 += M4(-0.17923881, -0.23225825, -0.1490507, 0.2403646, -0.094644114, 0.115030564, -0.14342141, -0.17417115, -0.08787826, 0.068846464, 0.42370248, -0.12356875, 0.021677576, 0.032778624, -0.1455038, 0.037231497) * inp_2_1_1; + result6 += M4(0.09711059, -0.077384725, 0.035789892, 0.062623575, -0.020504052, 0.10286945, 0.03887469, 0.060432076, 0.08667588, 0.045888357, -0.007155188, -0.029380346, 0.0083949845, 0.006929334, -0.0105934935, 0.025226818) * inp_2_2_1; + result6 += M4(0.05681853, -0.07506403, 0.016364262, -0.10113417, 0.053965632, -0.05894171, -0.02646065, 0.082565285, 0.01755858, 0.081124455, 0.044373915, -0.021322627, -0.034455776, -0.02359104, -0.03970145, 0.024455955) * inp_2_0_2; + result6 += M4(0.19519812, 0.023326106, -0.06358114, 0.008290809, 0.025569428, 0.0022160492, -0.0064826235, 0.08153404, -0.08499347, -0.103305966, 0.010947972, 0.03593276, 
0.020753162, -0.0304176, 0.024631582, -0.0026721978) * inp_2_1_2; + result6 += M4(0.02968033, -0.008037597, 0.052780546, -0.16858529, 0.051812414, -0.13959612, -0.036582913, 0.027260361, -0.0017292037, 0.11300737, -0.011207886, -0.062157914, 0.06867121, 0.008292356, 0.02019452, -0.037092496) * inp_2_2_2; + result7 += M4(-0.070383064, -0.0018941662, 0.009261709, -0.029387435, 0.10982881, -0.0215069, 0.14872892, -0.10411507, -0.12109936, 0.018784482, -0.030478498, -0.08023815, 0.045679238, -0.029418876, -0.05215912, 0.031001695) * inp_2_0_0; + result7 += M4(-0.20609969, -0.06899776, 0.05168208, -0.021695405, -0.009522104, -0.052976973, 0.24030434, 0.06792218, -0.00074572675, -0.047091883, -0.11523507, 0.018632252, 0.0067120716, 0.008613463, -0.0072611556, 0.073870935) * inp_2_1_0; + result7 += M4(-0.0457607, -0.053107716, -0.024241656, 0.036762826, 0.113340124, 0.017231401, -0.06802681, 0.014421814, -0.0910611, 0.07579218, 0.03143931, 0.037379533, -0.010990686, -0.057808623, 0.016745748, 0.028558975) * inp_2_2_0; + result7 += M4(-0.027509524, -0.0015665191, 0.06562259, -0.08430343, -0.10179392, -0.083278656, 0.19010025, -0.12468562, -0.07462006, -0.013929306, -0.08613025, 0.03476423, 0.026493594, -0.02164569, 0.014731891, -0.032355193) * inp_2_0_1; + result7 += M4(-0.17326574, -0.09417346, 0.66998553, 0.009321544, 0.110744074, -0.04699417, 0.2671957, 0.03553626, 0.13114145, 0.4145705, -0.02063642, -0.12568437, -0.14781725, -0.20608905, -0.004326043, -0.035743393) * inp_2_1_1; + result7 += M4(0.07758693, 0.07410466, 0.077924885, 0.09827127, -0.034718454, -0.018233534, -0.20749852, 0.007610238, 0.08349607, 0.044641357, 0.03459079, 0.019390328, 0.026910774, 0.009283013, -0.068095274, 0.011733051) * inp_2_2_1; + result7 += M4(-0.014742071, -0.01684026, -0.039557576, -0.047406368, 0.015931614, -0.0060423487, -0.004189069, -0.023810044, 0.024215858, -0.016749816, -0.087993205, 0.03560463, -0.035238065, -0.013115836, 0.008730331, 0.028258363) * inp_2_0_2; + result7 += 
M4(-0.2859722, -0.03239873, -0.08711113, -0.0931549, 0.10253455, -0.011481367, -0.008811635, 0.14545655, 0.0035784945, 0.04070705, -0.012110465, 0.0019575353, 0.012843455, -0.010998855, -0.049620643, 0.02182134) * inp_2_1_2; + result7 += M4(-0.066526406, 0.024334285, 0.20216238, -0.03000161, 0.034289896, -0.04164767, -0.0610855, -0.12462786, -0.008006271, 0.020628722, 0.002383473, -0.040480513, -0.02649028, -0.0092646, -0.027685355, -0.03872741) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.09254954, -0.066149786, 0.1739582, 0.06795746, -0.20359185, -0.034307085, -0.15570211, -0.1587109, -0.039456386, 0.025139311, -0.024828294, 0.05037912, -0.55165523, -0.20256926, 1.7069019, 0.5593169) * inp_3_0_0; + result0 += M4(0.0778977, 0.18100552, 0.053122494, 0.060407706, -0.019591585, -0.027646327, -0.14089061, -0.054712098, 0.0038405368, -0.13766822, 0.044245742, -0.028563345, 0.05199818, 0.107912496, 0.21219051, 0.08904266) * inp_3_1_0; + result0 += M4(-0.040725835, -0.23843147, -0.07467649, 0.117472924, 0.062686585, -0.16958015, 0.0029354997, 0.0890783, -0.019574124, -0.01068517, -0.025981672, 0.02934722, 0.051200394, -0.044291902, -0.14113191, -0.00036737416) * inp_3_2_0; + result0 += M4(-0.23490798, -0.005662241, 0.039114837, 0.08678573, 0.089571774, 0.1137239, -0.117055096, -0.14043239, 0.025339626, -0.026701225, 0.028766695, -0.0046202834, 0.024093471, 0.18948402, 0.14255321, 0.22870497) * inp_3_0_1; + result0 += 
M4(0.04485922, 0.07076504, -0.07595488, 0.026019868, -0.087104715, 0.10135535, 0.40971664, 0.18662886, 0.09416117, 0.05331952, 0.018915465, -0.117340825, -0.1370123, -0.051770423, -0.32962924, 0.22879691) * inp_3_1_1; + result0 += M4(-0.055766147, 0.029093638, -0.022541687, -0.06013454, -0.016317332, 0.105744675, 0.03759028, -0.014056315, -0.03707877, -0.0073944605, -0.010918169, 0.032258492, -0.0029612882, -0.08540761, 0.07273114, 0.12243875) * inp_3_2_1; + result0 += M4(-0.1346676, 0.009190142, 0.009574206, -0.04557382, 0.052939687, 0.018892609, -0.10016458, 0.025161734, -0.09715171, -0.049740102, 0.028791618, 0.009169212, -0.057750694, -0.06637252, -0.025068432, 0.014734563) * inp_3_0_2; + result0 += M4(0.0006416769, 0.12873103, -0.06071439, 0.061351776, 0.08935858, -0.05549713, 0.07841675, -0.08964339, 0.07989987, 0.07285906, -0.020769075, 0.00069853663, 0.16606203, -0.09512037, 0.09189646, 0.09517537) * inp_3_1_2; + result0 += M4(0.01390574, -0.12350316, -0.05518436, -0.10814563, 0.030669253, -0.015254703, -0.09967872, -0.04459087, 0.019996883, 0.012870364, 0.046347335, 0.0169645, -0.064181015, 0.14752543, 0.038340397, 0.039887283) * inp_3_2_2; + result1 += M4(0.19128737, 0.055152938, 0.23503314, -0.031887658, -0.28537583, -0.14741041, -0.123044476, 0.2239382, -0.013849556, -0.025396885, 0.010835838, 0.048768003, 0.6936537, 0.5322787, 0.8627159, 2.0183182) * inp_3_0_0; + result1 += M4(-0.16392177, -0.084342286, -0.06368037, -0.054682285, -0.066886775, -0.017082512, 0.0017936974, 0.19639695, -0.08483735, 0.04340435, -0.041357446, -0.018277828, 0.30569118, -0.14916512, 0.26740617, -0.041636698) * inp_3_1_0; + result1 += M4(-0.18544926, 0.09894158, -0.08929115, 0.0891195, -0.08961769, 0.0037911495, -0.07230035, 0.015044842, -0.01178813, -0.01307943, 0.0023355505, -0.001084589, 0.01972752, 0.19321127, 0.05652662, 0.06697108) * inp_3_2_0; + result1 += M4(0.040632583, 0.052436706, 0.102042764, 0.1196807, -0.22357212, -0.0731257, -0.1231492, 0.015851084, -0.03811146, 
0.13468641, -0.037803803, 0.11746919, 0.24887115, 0.16866142, 0.029094731, -0.023084702) * inp_3_0_1; + result1 += M4(-0.16234949, -0.028136345, 0.07751747, -0.086364046, 0.3496027, -0.08361247, -0.099706836, -0.11052168, 0.050157838, -0.10870487, 0.15819858, -0.07486724, -0.25571546, 0.3763421, -0.031816337, 0.15863006) * inp_3_1_1; + result1 += M4(0.024654157, 0.03522474, 0.005597233, -0.10712482, -0.025258765, 0.041888993, 0.028555676, 0.009286705, -0.03700915, -0.034389768, -0.015460933, -0.06318085, -0.0745419, -0.4322204, 0.0055549787, -0.13247797) * inp_3_2_1; + result1 += M4(0.096734256, 0.12772109, 0.028968565, -0.08951548, -0.10943124, -0.0005613298, -0.0125749, 0.013759284, 0.011261038, 0.03467039, -0.045689914, -0.035989054, -0.09738886, -0.1069808, 0.24025622, -0.04359225) * inp_3_0_2; + result1 += M4(-0.09231692, -0.033435293, -0.030702181, 0.19699563, 0.019167103, -0.005587681, -0.04937635, 0.0006784209, -0.0029995125, 0.049607303, -0.030162135, 0.10340216, 0.007716518, -0.24057621, -0.16935349, -0.017029148) * inp_3_1_2; + result1 += M4(-0.051612962, 0.04662405, 0.08940832, -0.118905425, 0.027985938, 0.16636798, 0.05474558, -0.08056813, 0.020965522, 0.003118475, 0.014856406, -0.009867242, 0.039896052, 0.27668273, -0.07101276, 0.077010944) * inp_3_2_2; + result2 += M4(0.053076826, 0.021010296, 0.13123292, -0.012441169, 0.043306947, 0.13743393, -0.047766387, 0.12708248, -0.11768613, 0.055098455, -0.023150088, -0.014197193, -0.1542718, -0.12106738, -1.8194804, -0.91348547) * inp_3_0_0; + result2 += M4(0.10943635, 0.111729674, -0.13823912, -0.035315786, 0.016806452, 0.06422305, -0.039294496, -0.0010438039, 0.05339203, -0.013665516, 0.16269884, 0.073019795, -0.08262138, -0.093185745, 0.06152265, -0.053120397) * inp_3_1_0; + result2 += M4(0.11270539, 0.14025952, -0.08041442, 0.10229776, 0.108046815, 0.06260132, -0.059683353, 0.0724034, 0.007681874, -0.0049832347, -0.0064788763, 0.016769966, -0.038609058, -0.101070486, -0.04632763, 0.08992907) * inp_3_2_0; 
+ result2 += M4(-0.14573388, 0.048150554, 0.0073312516, 0.0820863, 0.005311342, -0.07133988, 0.07941047, -0.06518964, -0.0540065, 0.030663036, -0.015387687, 0.0024963527, 0.33523628, -0.21032298, -0.006126366, -0.0019119852) * inp_3_0_1; + result2 += M4(-0.05506345, 0.008375741, -0.06898237, 0.49355978, 0.046426956, 0.13173291, 0.34143007, 0.16885425, 0.047667753, -0.010823554, -0.049582757, -0.10253868, 0.043109186, 0.049872104, 0.10323304, -0.06117262) * inp_3_1_1; + result2 += M4(-0.12682886, -0.024398634, -0.02463526, -0.0053581437, -0.031698346, -0.09654456, 0.0134545015, 0.06747738, -0.042354576, 0.0699279, 0.06142366, 0.034909867, 0.082730986, 0.05110429, -0.04656455, 0.03800416) * inp_3_2_1; + result2 += M4(-0.17848222, 0.07386075, -0.034484997, 0.14056027, -0.016019175, -0.046031028, -0.10376105, -0.02280207, 0.024345232, 0.017198803, 0.029092256, -0.092551954, 0.12745397, 0.03982811, 0.01168676, 0.018948171) * inp_3_0_2; + result2 += M4(-0.07862329, -0.03741237, 0.08126433, 0.049272113, 0.11524571, -0.02037916, -0.030216433, -0.037595138, 0.011805941, 0.020535095, 0.036056828, 0.0073523335, -0.08362264, -0.07560603, -0.078490816, -0.021978863) * inp_3_1_2; + result2 += M4(-0.0767799, -0.015410508, -0.22519824, 0.016836038, 0.004659908, 0.015881686, 0.029287374, 0.0181264, 0.0015891637, 0.024870405, -0.04659198, 0.05982338, -0.045209248, 0.03279409, 0.054918773, -0.029691832) * inp_3_2_2; + result3 += M4(0.14641838, -0.032368448, -0.051798083, 0.100165516, -0.11626831, 0.04413833, -0.2144082, 0.073160104, -0.01514462, 0.019728959, -0.014288481, 0.048049152, -0.5357604, -0.56084126, -0.42700014, 0.258973) * inp_3_0_0; + result3 += M4(0.067878395, -0.023797305, 0.082887724, 0.09493578, 0.09728951, -0.007154798, 0.030006688, -0.13688226, 0.080369964, -0.071570344, 0.03663499, -0.04523607, 0.23509674, 0.08656335, -0.12761234, 0.10627437) * inp_3_1_0; + result3 += M4(0.047612563, -0.05812853, -0.10656436, -0.042110536, -0.06782397, 0.0029847494, -0.0073221833, 
-0.06700891, 0.01259655, -0.0040371697, -0.019085785, -0.034876842, -0.086568266, -0.025362449, -0.062371697, -0.055860434) * inp_3_2_0; + result3 += M4(0.0020961028, 0.033408057, 0.14776878, 0.069254436, -0.023974894, -0.044630118, -0.16477525, 0.16033758, 0.12493758, -0.060614284, -0.0020546261, -0.028748177, -0.027826814, 0.19305335, -0.23739079, 0.17232148) * inp_3_0_1; + result3 += M4(0.30260783, 0.09715787, -0.06745273, -0.2249556, 0.07854466, 0.050709903, 0.13968366, -0.06283924, -0.057586525, -0.036045283, 0.0789627, 0.09579551, 0.0323496, 0.3649893, 0.321902, -0.33644336) * inp_3_1_1; + result3 += M4(0.0085015865, -0.046508003, 0.05737567, 0.06742753, 0.08303187, 0.024977706, 0.060929872, 0.006051357, -0.099968664, -0.00418814, 0.026276669, 0.027530096, 0.060614645, 0.1000981, -0.046085663, 0.076093376) * inp_3_2_1; + result3 += M4(-0.02233, 0.049072236, 0.12531404, -0.036096096, -0.09118223, 0.012510844, -0.07377069, 0.030965295, -0.009523234, -0.024311135, -0.002075602, -0.00860735, -0.027546367, 0.013555321, 0.06914449, -0.11078691) * inp_3_0_2; + result3 += M4(0.010217063, -0.040137805, 0.124532096, -0.001681538, -0.1334867, 0.005404225, -0.044753317, -0.107077144, 0.026245933, 0.03505359, -0.03107834, 0.047365762, -0.102796964, 0.06819123, -0.17713459, 0.16009302) * inp_3_1_2; + result3 += M4(-0.053064767, -0.00038910803, -0.044331346, -0.13896687, 0.011218555, -0.05347108, -0.024523782, -0.0022578419, -0.06383166, -0.027157433, 0.0059858304, -0.045790028, 0.0887413, -0.025947573, 0.09377036, -0.041215293) * inp_3_2_2; + result4 += M4(-0.18604346, 0.008878314, 0.013272913, 0.05539693, 0.2421564, 0.14090005, 0.25091538, -0.18182102, 0.007409157, -0.03323785, 0.0043234024, 0.042201746, 0.007849639, 0.1932206, 0.9280076, 2.2401915) * inp_3_0_0; + result4 += M4(0.012913329, -0.09914007, -0.12366385, -0.09848158, -0.20237258, 0.18532643, -0.02462933, -0.059980325, -0.054811925, 0.12306637, 0.042322475, 0.002346973, -0.019184176, -0.13235821, -0.005153328, 
0.11585647) * inp_3_1_0; + result4 += M4(0.10732047, 0.13869062, 0.089536235, 0.17246234, -0.20513247, 0.05316355, 0.1093314, -0.028356964, -0.020178609, 0.012088683, 0.035843994, 0.004279176, -0.059449118, 0.092298515, -0.017105749, 0.16946927) * inp_3_2_0; + result4 += M4(0.019160364, -0.047085688, 0.05366002, -0.028276762, 0.13703205, 0.00044831116, 0.06620764, -0.061500076, -0.12533294, -0.08671866, -0.019014668, 0.0497677, 0.101091735, -0.009254054, 0.1609112, 0.13902497) * inp_3_0_1; + result4 += M4(-0.058230035, 0.06264195, -0.26525855, -0.18248996, 0.2286463, 0.050672255, -0.42757395, 0.10478752, 0.20547761, -0.08584586, -0.03877289, -0.0738539, 0.007945127, -0.14242807, -0.31559646, -0.16626942) * inp_3_1_1; + result4 += M4(0.108471274, -0.06305002, 0.10488395, 0.12886141, 0.15483312, -0.10420125, -0.05469925, 0.049627285, 0.019065088, -0.09111849, 0.08850026, 0.032642707, -0.016728697, 0.14083497, 0.16343744, -0.017275989) * inp_3_2_1; + result4 += M4(-0.08110123, -0.037437815, 0.0036670845, -0.012389813, 0.003391518, -0.037371535, 0.09392287, 0.0056252186, -0.0013106877, 0.015934331, -0.047441415, -0.048825603, 0.01574346, -0.038988292, -0.13774225, 0.11974879) * inp_3_0_2; + result4 += M4(0.09821519, -0.07367004, -0.1671587, -0.13175157, 0.096806094, -0.00028934368, 0.1011974, 0.094689324, 0.058885638, 0.10860918, 0.046144772, 0.041934837, -0.05322929, 0.24820651, 0.30623418, 0.042317044) * inp_3_1_2; + result4 += M4(0.10749678, 0.041979447, 0.06428992, 0.1921631, 0.09005325, 0.003081052, 0.04427278, 0.035038162, 0.041481927, 0.003136483, 0.04282672, 0.008163647, 0.06676903, -0.17057979, -0.11313607, -0.09240135) * inp_3_2_2; + result5 += M4(0.06516661, 0.049326673, 0.03936918, 0.09226112, -0.10024755, 0.33362073, -0.10652033, -0.11264627, -0.07969274, -0.008018975, -0.052655227, 0.052439395, -0.12593323, 1.0872221, -1.2651701, 0.41566744) * inp_3_0_0; + result5 += M4(-0.045513228, -0.11950231, 0.1209804, 0.007877305, 0.10092648, 0.41289014, 
-0.08005187, -0.02832368, -0.006118914, 0.0949782, -0.04972284, -0.005229561, 0.024182199, -0.17841667, -0.08029278, -0.12619787) * inp_3_1_0; + result5 += M4(0.005838728, 0.16057518, -0.07368895, -0.069933906, 0.069940045, 0.093065664, -0.044347297, -0.030703027, 0.021843225, 0.035086885, 0.049631763, 0.06536256, -0.019788878, 0.11170757, -0.075200684, -0.18261178) * inp_3_2_0; + result5 += M4(0.099156775, 0.1164972, 0.006294541, -0.007732477, -0.09588161, 0.5086522, 0.13685015, -0.048572093, -0.017175527, 0.08466932, 0.064308986, 0.051214278, 0.13900544, -0.077204086, 0.07186291, -0.38778207) * inp_3_0_1; + result5 += M4(0.069707386, -0.09682797, -0.02300618, 0.079261556, -0.04800534, 0.72563374, 0.56960875, -0.0053159664, -0.06180492, -0.019749833, 0.091729395, 0.024558257, -0.060489092, 0.12238774, -0.47927248, 0.16019621) * inp_3_1_1; + result5 += M4(0.12997632, 0.015662136, -0.016555179, -0.1428028, -0.013378371, 0.16322523, -0.14021045, 0.08571332, -0.013558627, -0.08813459, 0.020676363, -0.09266872, -0.03147197, -0.024789676, 0.37013018, 0.2309393) * inp_3_2_1; + result5 += M4(-0.008761019, 0.07565732, -0.041142333, -0.046059586, -0.0512882, 0.18809535, 0.055352326, 0.015549614, 0.021744449, -0.061326817, -0.07602716, 0.040978383, -0.018101398, 0.028591217, -0.22137551, 0.08695099) * inp_3_0_2; + result5 += M4(0.0037994229, -0.06116121, -0.01840275, 0.025639147, 0.005005405, 0.0133597255, 0.016156316, 0.039870672, -0.0052740895, 0.061846644, -0.023088494, -0.12499887, -0.009223509, 0.023290524, 0.4783956, -0.077085905) * inp_3_1_2; + result5 += M4(-0.05114464, 0.03225734, -0.19172737, 0.10554599, -0.08714355, 0.06544918, -0.10703989, 0.06852276, -0.0016587988, -0.06694731, -0.006738505, 0.019996623, 0.025497781, -0.038344294, -0.23213674, -0.061307177) * inp_3_2_2; + result6 += M4(0.13491632, 0.013287625, 0.010947559, 0.11294138, -0.2521337, -0.27708814, 0.025833378, -0.07539904, -0.079497874, 0.020652197, -0.0030113307, 0.081777684, -0.71779454, 
-1.0798353, 0.09159261, 1.1087446) * inp_3_0_0; + result6 += M4(-0.18355171, -0.059375823, 0.04745586, 0.08226284, -0.12366443, 0.0715416, 0.12640767, -0.044321008, 0.05003234, -0.0201903, -0.06918658, 0.03307183, 0.019908654, 0.036179923, -0.008145942, 0.06775953) * inp_3_1_0; + result6 += M4(-0.0069526485, 0.088293165, -0.055144385, 0.15134218, -0.029758744, 0.046259724, 0.0020197325, -0.015014638, -0.075561896, -0.06340864, -0.03838801, -0.016902346, 0.021184303, 0.041330207, -0.014269733, -0.010986305) * inp_3_2_0; + result6 += M4(0.02769141, -0.036027133, -0.09697365, 0.19294448, -0.104395695, -0.034130737, -0.017838359, -0.10523258, -0.033646084, -0.05008058, 0.058587097, -0.058627483, -0.12708743, 0.22058709, -0.13582976, -0.10437317) * inp_3_0_1; + result6 += M4(0.044173777, 0.003539219, -0.47622097, 0.21824974, -0.097344674, 0.15406853, -0.017604077, 0.07182323, 0.020947617, 0.0055851056, 0.13544694, 0.056049135, -0.10321335, -0.21882974, -0.21870779, -0.1875005) * inp_3_1_1; + result6 += M4(0.14868195, -0.13731037, -0.019478442, 0.14187837, -0.057697177, 0.0426955, 0.06403023, 0.049729705, 0.036131207, 0.092073284, -0.047384284, -0.0338119, 0.18167923, 0.04958258, -0.10772855, 0.1121622) * inp_3_2_1; + result6 += M4(-0.045274038, 0.05365618, -0.107324526, 0.009048631, 0.026047962, 0.035374407, -0.010143593, -0.014340872, -0.07006902, 0.06860889, 0.05853425, -0.016819451, 0.17378499, -0.04515828, 0.018258387, 0.04951162) * inp_3_0_2; + result6 += M4(-0.055789858, -0.064339414, 0.017740736, -0.09462704, 0.090619236, -0.05269287, -0.009235976, 0.07033417, 0.06366415, -0.01664569, -0.06249674, -0.032444846, 0.1146286, 0.14271268, 0.014363114, 0.117870755) * inp_3_1_2; + result6 += M4(0.1616541, -0.062147476, -0.032977153, 0.0128625855, 0.02471507, -0.027155781, 0.050833214, 0.016909096, -0.013055126, -0.033375476, -0.016312419, -0.015191727, -0.21759532, -0.0804212, 0.02692404, -0.05099601) * inp_3_2_2; + result7 += M4(0.07253019, -0.035087388, 0.27128088, 
-0.03760534, -0.019292584, 0.055270355, -0.3426022, -0.06291199, 0.0055902447, 0.037557192, -0.024743894, -0.06223259, -2.2094288, 0.7352681, 1.0247802, 0.5603988) * inp_3_0_0; + result7 += M4(-0.17581846, -0.059658587, 0.17984822, -0.012240912, 0.12979916, 0.012898234, 0.04246356, 0.10924559, 0.047663286, 0.0038158314, -0.032040454, 0.049285993, -0.08010564, 0.22021946, 0.06039017, 0.100572005) * inp_3_1_0; + result7 += M4(-0.07905704, -0.13207316, 0.21944374, 0.049595814, -0.03912118, -0.009428204, 0.09662877, 0.06516343, -0.012615874, -0.0044159796, 0.015594373, 0.013535676, 0.056949936, 0.025803722, 0.043376565, -0.069427185) * inp_3_2_0; + result7 += M4(-0.033698197, -0.041484922, 0.20404889, 0.11029001, 0.22240984, -0.01572225, 0.041402988, -0.25517362, 0.11649469, 0.036517363, 0.028109394, 0.04130212, 0.19879432, 0.095047496, 0.102015294, 0.0016358423) * inp_3_0_1; + result7 += M4(0.19827962, -0.3081135, 0.8182635, -0.22652653, -0.19666982, -0.124621764, -0.6781147, -0.15648992, 0.01506426, 0.11177583, 0.025570663, -0.12096893, 0.15911113, 0.23864155, 0.13247603, -0.16035493) * inp_3_1_1; + result7 += M4(-0.10558998, -0.02980992, 0.15882432, 0.0019322269, -0.06324401, -0.048613906, 0.015462609, 0.07562245, -0.021553399, -0.019179452, 0.022707755, 0.09539535, -0.19717512, -0.021566661, -0.011566524, 0.07240889) * inp_3_2_1; + result7 += M4(-0.048857134, -0.027450722, 0.10871015, 0.0019058244, 0.049510036, -0.0012002293, 0.039690964, 0.079511516, -0.03686668, 0.03693529, -0.018528095, -0.042508278, -0.15140209, 0.032931436, 0.0093162395, -0.10327692) * inp_3_0_2; + result7 += M4(0.00697436, -0.011908997, 0.06820096, -0.06854557, 0.001986642, 0.011411552, 0.036190733, -0.09655649, -0.0071991254, -0.051006213, -0.013090976, 0.08769902, 0.021229148, 0.0742959, -2.0504905e-05, 0.062029213) * inp_3_1_2; + result7 += M4(0.007090045, -0.0070065823, 0.11449389, 0.07807651, -0.07478062, -0.023938473, 0.022315353, -0.045174368, -0.042782467, -0.02238688, 0.0042066914, 
0.015457104, 0.10100788, -0.008693574, -0.02461605, 0.04527384) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.018434178, 0.049622823, 0.045119155, 0.0686234, 0.09278603, 0.08046084, -0.06695683, 0.044385765, 0.18890129, -0.014261866, -0.35378423, -0.06832126, 0.06488233, 0.061326277, 0.09549295, -0.056605693) * inp_4_0_0; + result0 += M4(0.03714057, 0.1337333, -0.10858598, -0.012010617, -0.060295638, -0.017592406, 0.039158024, -0.098632865, 0.27407366, -0.1349277, -0.012114661, 0.01871834, -0.08044955, -0.07059173, 0.078279085, -0.07203967) * inp_4_1_0; + result0 += M4(0.04509951, -0.12278074, -0.07231194, 0.0037228048, 0.044370316, 0.090483174, -0.009344479, 0.091253005, -0.06309723, 0.10966169, -0.056312956, -0.096307725, 0.010796262, 0.034634, 0.1348862, -0.01972543) * inp_4_2_0; + result0 += M4(-0.081053145, -0.06532021, 0.09809866, 0.044601522, 0.13763277, -0.08552932, -0.15657562, 0.053482037, 0.16387677, -0.1410583, -0.2270476, 0.13426694, 0.106407784, 0.027178498, -0.11867445, 0.044845153) * inp_4_0_1; + result0 += M4(0.060871486, 0.0021344237, 0.1658735, -0.114303015, 0.1591105, 0.16272436, -0.01857942, 0.244124, 0.17436458, -0.1557731, -0.22981559, 0.023261234, -0.053027753, -0.18484634, -0.021018593, -0.006894698) * inp_4_1_1; + result0 += M4(-0.009375401, 0.00030057272, -0.08269328, -0.022907406, -0.03878681, 0.07121693, 0.15280358, 0.045629557, -0.10699056, 0.06041798, 0.025238888, 0.010851332, -0.086865835, 
0.03652955, 0.041686144, 0.060537767) * inp_4_2_1; + result0 += M4(-0.034835447, -0.024449775, 0.027274339, -0.004055066, -0.0055374852, -0.041705847, -0.058467496, 0.059967574, -0.067419745, -0.0935834, 0.03851681, 0.03076904, 0.0018041183, 0.05128854, 0.04868137, -0.059649237) * inp_4_0_2; + result0 += M4(-0.011844451, 0.019527428, 0.092081256, 0.0119643975, 0.1439611, -0.040145777, 0.11782478, 0.078432254, 0.014858249, 0.10277704, 0.10988425, 0.011467616, -0.010296926, 0.024298495, -0.20349382, -0.014190192) * inp_4_1_2; + result0 += M4(-0.021277873, -0.03756509, 0.0032884767, -0.024915954, 0.010813404, -0.0219491, -0.017127234, 0.07110966, -0.1083587, 0.13468519, 0.1351632, -0.054484107, -0.0069663334, 0.091877535, -0.13531296, 0.075308226) * inp_4_2_2; + result1 += M4(0.0610115, -0.02273868, 0.04560859, -0.07687807, 0.04103056, -0.07795798, -0.25112656, 0.024214633, -0.2187769, -0.20823261, -0.19474646, 0.19302827, -0.26424056, 0.11389006, -0.0274255, -0.0725048) * inp_4_0_0; + result1 += M4(-0.0014471603, -0.07749651, -0.05952297, -0.09146577, -0.12898096, -0.105988845, 0.07865901, 0.13015041, 0.09963753, -0.21074708, 0.06630236, 0.1870499, -0.058432143, 0.10289578, 0.09176906, 0.040785745) * inp_4_1_0; + result1 += M4(-0.050375693, -0.014718397, -0.04169001, 0.0052091144, 0.040490344, 0.13914068, 0.008042684, 0.17082475, 0.26016313, 0.018019961, 0.10943186, -0.055861503, -0.10225494, -0.005320025, 0.053263158, -0.041483168) * inp_4_2_0; + result1 += M4(-0.03420034, 0.039020065, 0.09437944, 0.035928633, -0.042656083, -0.08782311, -0.05664052, 0.03520092, -0.23366763, -0.1806389, -0.06514801, -0.07275233, 0.24369173, 0.043885928, 0.08140762, -0.027742673) * inp_4_0_1; + result1 += M4(0.0022973446, -0.019952578, 0.0945412, -0.075643264, -0.23445289, -0.04902638, -0.09409043, -0.1667218, -0.065547734, 0.016795011, -0.25618654, -0.055034813, 0.107082136, -0.023970228, -0.18197188, -0.1218246) * inp_4_1_1; + result1 += M4(-0.08382957, -0.0650694, 0.16925132, 
-0.04728398, 0.16378321, -0.15582384, -0.030366777, 0.12973088, 0.046362326, -0.06079414, 0.012548547, 0.026187118, 0.05576104, -0.05434601, -0.024864724, 0.058853254) * inp_4_2_1; + result1 += M4(0.10022295, 0.004421547, 0.009971374, 0.12618566, -0.0049330336, -0.07045002, 0.011583406, 0.0629819, 0.049423072, -0.043928783, 0.06683946, 0.020398756, -0.07111294, 0.12003535, 0.032135516, 0.029525215) * inp_4_0_2; + result1 += M4(0.16514307, -0.0629729, -0.025985986, 0.088060685, 0.008755114, -0.01807267, -0.003603859, -0.07859633, 0.12799482, 0.12027188, -0.12523472, -0.07914866, -0.047883302, 0.083567575, 0.07612459, -0.06498157) * inp_4_1_2; + result1 += M4(0.014587679, 0.025975078, -0.023844406, 0.07266172, 0.030730773, -0.059010223, 0.0119765, -0.026253965, 0.060647152, -0.029742435, -0.10303611, 0.09357952, 0.06766835, -0.10831871, 0.060497526, 0.012177835) * inp_4_2_2; + result2 += M4(-0.03446868, -0.060548592, 0.10558807, -0.073967904, -0.13120948, -0.036105353, 0.14949946, -0.013240074, 0.009351651, 0.034679778, 0.09658641, -0.14404735, -0.054775383, 0.06665587, -0.13649763, -0.090180725) * inp_4_0_0; + result2 += M4(-0.037736107, 0.033166397, -0.05246419, -0.024150483, -0.37036112, 0.027842285, 0.005863366, 0.031067898, 0.24898225, 0.18034619, -0.036727227, 0.2829593, -0.05117404, -0.07217195, 0.1895423, -0.14922643) * inp_4_1_0; + result2 += M4(-0.00022802675, 0.114544645, -0.0478971, 0.009582359, -0.18778664, 0.05062191, -0.12996319, 0.019864406, 0.09791515, 0.0059960284, 0.06578524, -0.11565061, -0.0044170176, -0.049069386, -0.01089871, -0.026803013) * inp_4_2_0; + result2 += M4(-0.1630325, -0.019274717, 0.102715194, -0.06266306, -0.11939047, -0.09086195, 0.13064456, -0.04103642, -0.026192604, -0.098094426, 0.28843316, 0.04643258, 0.05764377, 0.1645332, -0.1066325, 0.027453672) * inp_4_0_1; + result2 += M4(-0.15646996, -0.05737524, -0.06495739, -0.2436266, 0.016241936, 0.22055726, -0.04702455, 0.054669898, -0.16554731, -0.14014643, -0.18260549, 
-0.4382236, 0.19622582, 0.2099904, 0.040627792, 0.33798146) * inp_4_1_1; + result2 += M4(-0.12972789, 0.036690447, 0.03563221, -0.11205777, -0.13757062, 0.1118755, 0.011807173, -0.024725547, -0.023682637, -0.044875827, -0.11033335, 0.019562397, 0.02695545, -0.07396304, 0.086546585, 0.1167479) * inp_4_2_1; + result2 += M4(-0.07776693, -0.014254054, 0.0083162375, -0.00011761158, -0.08352166, -0.029421536, 0.02956944, 0.04509516, 0.010130092, 0.010642397, 0.048064332, -0.032456495, 0.012238894, 0.033714734, -0.0627502, 0.068565905) * inp_4_0_2; + result2 += M4(-0.12752682, 0.05669475, 0.11533233, -0.014176609, -0.10711373, 0.040893964, 0.05097542, -0.047303755, 0.107173756, -0.029574752, 0.02941216, 0.06525206, 0.057560835, -0.05397231, -0.11404987, 0.049302872) * inp_4_1_2; + result2 += M4(-0.064304516, -0.012414167, -0.11217402, -0.034763623, -0.14995582, 0.021495942, -0.007750655, 0.06351411, -0.020929057, 0.066652685, 0.0020182119, -0.11971596, 0.0016005685, 0.02795948, -0.0034769445, 0.00050685403) * inp_4_2_2; + result3 += M4(-0.034716997, -0.03702819, 0.011007491, 0.023010522, -0.21597584, 0.038147923, -0.00028414608, 0.037685756, 0.14614478, 0.14669707, 0.04802629, 0.11869839, 0.047092315, 0.054500878, 0.08883988, 0.0068886233) * inp_4_0_0; + result3 += M4(0.019602379, -0.0076160673, -0.053038448, -0.1294774, -0.06995248, -0.13780744, -0.04560367, -0.23195697, -0.10224064, -0.16967458, 0.11878501, 0.09578384, 0.09040383, 0.004529428, 0.06521579, -0.11174711) * inp_4_1_0; + result3 += M4(0.08485607, -0.022306591, -0.04516496, 0.017989682, -0.25434545, 0.007873913, 0.00015326319, -0.057066794, 0.037034567, -0.03178823, -0.18807301, -0.047330715, -0.12754859, 0.021273494, 0.07869164, -0.060736064) * inp_4_2_0; + result3 += M4(0.07483347, 0.045313224, 0.044391785, 0.031464998, -0.20976709, -0.051958606, -0.2170123, 0.19609435, -0.12272257, -0.14924563, -0.14202367, 0.028403468, 0.08444738, -0.009276711, -0.038434017, 0.1457306) * inp_4_0_1; + result3 += 
M4(-0.059973225, 0.02114767, -0.166233, -0.038052354, -0.32477218, 0.04363941, -0.032549564, -0.45016137, 0.055933047, 0.091788195, 0.07523639, 0.08410525, 0.11169555, -0.12444475, -0.05903696, -0.017554369) * inp_4_1_1; + result3 += M4(-0.04888954, -0.045461625, -0.040438406, -0.058472995, -0.07204198, -0.02853134, 0.048691347, 0.100535, 0.12957992, 0.07286983, -0.03497769, 0.08115685, 0.094174296, -0.008092268, -0.009086599, 0.112588085) * inp_4_2_1; + result3 += M4(-0.034509074, 0.009949028, 0.09974681, 0.007861836, -0.08303333, 0.030117465, 0.0682694, -0.03921216, -0.050615277, 0.018833155, 0.033861805, -0.027039213, 0.015122877, 0.030595342, -0.10777885, 0.095237285) * inp_4_0_2; + result3 += M4(0.03020026, -0.019718714, 0.060266856, 0.026768334, -0.053524353, -0.0036353362, -0.13326775, -0.027043948, -0.046914343, 0.049261674, -0.048095863, 0.06766426, 0.031893432, 0.0021852825, 0.00758896, 0.036725715) * inp_4_1_2; + result3 += M4(-0.06533603, 0.026572054, -0.018748164, 0.028237859, -0.097261354, 0.04389326, 0.0051924465, -0.07541145, 0.13301587, -0.02755958, 0.07221165, 0.0030547224, 0.06929011, -0.008908245, 0.025401644, 0.018396823) * inp_4_2_2; + result4 += M4(-0.04746825, 0.018951492, -0.0023264785, 0.07708572, 0.071010634, -0.03870001, -0.098659255, -0.10928319, 0.41780227, 0.01004282, -0.3981096, -0.505563, 0.098589525, -0.082734, -0.05396039, 0.02458752) * inp_4_0_0; + result4 += M4(0.052301582, 0.022968914, -0.06512741, -0.07361948, 0.27427474, 0.124717645, -0.06809003, -0.21796443, -0.29390582, 0.10135709, -0.025931353, -0.075833134, 0.021782123, -0.14518449, -0.02299544, 0.059578747) * inp_4_1_0; + result4 += M4(0.03213144, -0.03191139, -0.022576269, 0.05140163, -0.010867397, -0.018188905, 0.0074826954, -0.09148727, -0.09956559, -0.075166255, 0.046014354, 0.057339873, -0.014400544, -0.11268159, -0.008193156, -0.19215326) * inp_4_2_0; + result4 += M4(-0.06548154, -0.0060879444, 0.13310304, -0.008900656, 0.10680574, -0.038170066, 0.023868673, 
-0.19597545, 0.43738434, -0.14221796, -0.1742126, -0.04567815, -0.12347329, -0.08659759, -0.045464035, 0.03501314) * inp_4_0_1; + result4 += M4(0.009866717, -0.077169314, -0.114872776, 0.16988996, -0.057457026, 0.13311575, -0.0154428035, 0.018910473, -0.40247977, 0.326605, 0.40360212, -0.1536875, 0.048325084, 0.030349404, 0.28883633, 0.075642556) * inp_4_1_1; + result4 += M4(0.0006517612, 0.09461864, 0.0030880533, 0.061842687, -0.049034238, -0.12142291, -0.029907785, 0.003936318, 0.06435368, -0.17745653, 0.051564936, -0.081423275, -0.0038237646, -0.024854116, -0.016261674, -0.03406591) * inp_4_2_1; + result4 += M4(0.018387225, 0.062112585, 0.020659685, 0.03698026, -0.09931037, 0.02214087, 0.056241244, 0.11414437, -0.003061674, 0.02710368, 0.022636442, 0.25284192, -0.03436895, 0.11740832, -0.10811029, -0.015811529) * inp_4_0_2; + result4 += M4(0.0023214058, 0.082734086, -0.01567952, -0.0053047435, 0.062006377, 0.09231221, 0.032367308, -0.077805296, -0.030735722, 0.1505505, 0.10781633, -0.0116145285, -0.018235087, -0.012697741, -0.044910852, -0.06456537) * inp_4_1_2; + result4 += M4(0.008740162, 0.0055449195, -0.034479134, 0.09049583, 0.0053041857, 0.023528691, 0.030659825, 0.09536835, -0.12118474, -0.2391898, -0.009616882, -0.09285932, -0.22743967, 0.0258707, -0.061709628, -0.11265819) * inp_4_2_2; + result5 += M4(0.044028442, -0.04122583, 0.000550269, -0.021337532, -0.047214676, -0.1254332, 0.04745686, 0.0654274, -0.039284576, -0.23807748, 0.03728136, 0.20354709, -0.18091227, -0.043641847, 0.09648567, 0.011014285) * inp_4_0_0; + result5 += M4(0.12751298, -0.11774408, -0.011337492, 0.04147657, -0.030175004, 0.12267266, 0.0535281, 0.14082205, 0.08182579, -0.2573211, 0.15075792, 0.119687304, -0.008568953, -0.058781512, 0.12618496, 0.05222454) * inp_4_1_0; + result5 += M4(0.010520021, 0.14922525, -0.032744717, -0.010077619, 0.009180709, -0.07438485, -0.052246366, -0.28231016, 0.0033419975, -0.045650773, 0.23145644, 0.2771692, 0.058881775, 0.014836622, -0.009228067, 
-0.014879177) * inp_4_2_0; + result5 += M4(-0.09163705, -0.032821804, 0.013047141, 0.00010888746, -0.03259542, 0.047401156, 0.017905368, 0.08525486, 0.034333818, -0.1518838, -0.018526737, 0.111433186, 0.09728939, 0.1241472, -0.14238016, 0.13744897) * inp_4_0_1; + result5 += M4(-0.05943246, -0.09804257, -0.008240451, -0.01755478, -0.068136975, 0.03467399, 0.12868759, 0.0039837593, -0.078394555, -0.15439646, -0.072307155, 0.07028796, -0.094547324, -0.1229079, -0.32740903, 0.12146443) * inp_4_1_1; + result5 += M4(0.029553166, 0.18490258, -0.15058453, 0.08573451, 0.13650814, -0.0021613757, 0.08007432, -0.24977444, 0.0013390144, -0.34215355, -0.1117145, 0.10487715, -0.065968744, 0.0084841065, -0.0762411, 0.0798778) * inp_4_2_1; + result5 += M4(-0.017019898, 0.071032345, 0.009983099, 0.041452013, 0.025056604, 0.06516199, 0.027387524, 0.051893633, -0.023136629, 0.0074394695, 0.026207631, 0.01269897, 0.03611796, -0.10436766, 0.052628435, -0.040155966) * inp_4_0_2; + result5 += M4(0.054065004, 0.03911701, 0.1252176, -0.03445495, -0.03175568, -0.02995443, 0.04310057, -0.07631389, 0.10841199, -0.11166485, 0.19049378, 0.059140924, 0.030335514, 0.015095092, 0.007760321, 0.012673984) * inp_4_1_2; + result5 += M4(0.003389234, -0.021356242, 0.03467426, -0.012892039, -0.018554578, 0.022117883, -0.012314982, 0.003262032, 0.00051392533, 0.010092326, 0.06643337, -0.19911139, -0.03234521, 0.016684286, 0.16629112, -0.1323044) * inp_4_2_2; + result6 += M4(0.029847521, 0.011216209, 0.0014352007, 0.11196707, -0.061164424, 0.07866497, -0.045990318, 0.0031174389, 0.0762465, 0.024557918, -0.03897307, -0.128871, -0.100214586, 0.14044705, -0.030326163, -0.081816845) * inp_4_0_0; + result6 += M4(-0.0038015107, 0.025718777, -0.0070730755, 0.062903754, -0.17329313, -0.15011217, -0.0020997932, 0.32775643, -0.33540583, -0.10884601, -0.19569129, -0.024619697, 0.018821053, 0.0017868977, -0.003502404, -0.060582034) * inp_4_1_0; + result6 += M4(0.032696694, -0.060505856, -0.07638751, 0.07938569, 
-0.04352733, 0.030930337, 0.006419562, 0.20290491, -0.06621932, -0.010134403, 0.0045209723, -0.08216622, 0.010799845, -0.037544258, 0.032261, -0.0068984954) * inp_4_2_0; + result6 += M4(-0.020585008, -0.06686739, -0.02674714, 0.10312991, -0.04545703, -0.0023649305, 0.017600637, 0.28133342, -0.18896975, 0.21077135, 0.16459316, 0.24882057, 0.193736, 0.013784664, -0.05083905, 0.039294366) * inp_4_0_1; + result6 += M4(0.13655709, 0.0012507935, -0.12576059, 0.09325019, -0.030075591, -0.02547244, -0.2405418, 0.20916913, 0.017380645, -0.11935161, 0.0437509, -0.062131178, -0.006475726, 0.09514894, 0.07395075, -0.09047324) * inp_4_1_1; + result6 += M4(-0.019377453, -0.056720573, -0.01657622, 0.09865785, -0.16182153, 0.06522214, -0.120011814, 0.44340995, 0.08786272, 0.084312685, 0.029555505, -0.03303406, -0.03767044, 0.048726927, 0.03899395, -0.012219651) * inp_4_2_1; + result6 += M4(-0.05132402, 0.06540667, -0.01990738, -0.04480762, -0.053835515, -0.027045632, -0.03389145, -0.061064117, -0.0644717, -0.08743921, -0.020172076, -0.10008905, 0.090438485, -0.034950245, -0.04865866, 0.02537885) * inp_4_0_2; + result6 += M4(-0.02029574, 0.112929955, 0.022982717, 0.052838452, 0.0074106054, -0.036684096, -0.020033512, 0.14651367, -0.0851901, 0.06323298, 0.005073495, 0.08078632, -0.034822278, -0.030153848, -0.030336197, 0.02080248) * inp_4_1_2; + result6 += M4(0.043356642, -0.028215291, -0.0037377938, -0.017337887, -0.040176068, 0.010816982, -0.06331674, -0.005939463, -0.06420132, 0.080353424, 0.019384855, 0.039185375, -0.049747366, 0.034336146, -0.026170624, 0.06940328) * inp_4_2_2; + result7 += M4(0.03314132, -0.023960821, 0.18514064, -0.014295202, 0.13087258, -0.068065755, -0.132479, -0.14629236, 0.013114965, -0.13433266, -0.1473613, 0.3425137, 0.00014111558, 0.013769697, -0.07184184, 0.00016587533) * inp_4_0_0; + result7 += M4(-0.084272854, 0.0012606982, 0.06889056, -0.027467422, -0.07352514, -0.022028591, 0.22194062, 0.08726106, -0.33280593, -0.15533029, 0.31119695, 0.4080963, 
0.17609134, 0.05854581, -0.10106332, 0.066547655) * inp_4_1_0; + result7 += M4(0.045763247, -0.07639024, 0.017230418, -0.0055212197, 0.20488957, -0.023779752, 0.06305569, -0.09244782, -0.05728563, 0.050004475, -0.017564166, 0.11946289, -0.0070229634, 0.030936288, -0.049530633, 0.045574144) * inp_4_2_0; + result7 += M4(-0.04914086, -0.015898246, 0.07324575, -0.025076395, 0.15567815, 0.056686267, 0.05144686, 0.074478626, -0.039093338, 0.17859635, 0.1160447, 0.031838417, 0.21319076, -0.04266761, -0.06598638, 0.1650486) * inp_4_0_1; + result7 += M4(-0.14048345, 0.063251905, 0.6841372, 0.112974994, 0.25103608, -0.011431417, 0.18817756, -0.18409503, 0.019608924, 0.18151504, 0.0781094, 0.22911899, 0.069921345, -0.24604486, -0.6971403, -0.0646484) * inp_4_1_1; + result7 += M4(0.021362348, -0.015138301, 0.027565897, -0.01207035, 0.09410969, -0.044307675, -0.054592002, -0.039536398, -0.016862912, 0.01962149, 0.078963764, -0.004337365, -0.03610102, -0.013718087, -0.06805554, 0.022252895) * inp_4_2_1; + result7 += M4(-0.014945598, -0.010895095, 0.057883468, 0.0007298279, 0.008888342, 0.0021205172, 0.01675877, -0.05691879, -0.1411696, -0.0032234627, 0.03448331, -0.051604025, -0.064241216, -0.034602355, 0.015839413, 0.018036243) * inp_4_0_2; + result7 += M4(-0.039344657, 0.007022265, 0.051661976, -0.06379265, 0.0479425, 0.012853767, -0.012935568, -0.034843996, 0.035373203, 0.039304648, -0.06211866, -0.106624626, 0.01128225, 0.0011852856, -0.02734015, 0.04097814) * inp_4_1_2; + result7 += M4(0.03621156, 0.029693043, 0.053518586, 0.050195668, 0.042105448, -0.017427806, -0.008055143, -0.025947731, 0.051211126, -0.021013567, -0.069184914, 0.046099614, 0.020608708, -0.035153307, -0.13925175, -0.027382685) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 
inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.123371445, 0.045630742, -0.037511744, 0.032656584, -0.059497476, 0.030335374, -0.14396754, -0.10950625, 0.09135156, -0.038335335, 0.0019568456, -0.1259568, -0.011304159, -0.027700229, 0.012851001, 0.077376164) * inp_5_0_0; + result0 += M4(0.024210714, -0.015638096, -0.025297, -0.016720101, 0.057668798, -0.13882223, 0.1713362, 0.040192943, -0.114138186, 0.07518621, 0.029857866, 0.02885903, 0.12833597, 0.0132782785, -0.07948901, -0.009803399) * inp_5_1_0; + result0 += M4(0.121996425, 0.006053676, 0.10021924, -0.027526055, 0.06576328, -0.11237358, 0.024446266, 0.11030945, 0.0120935645, -0.0749186, 0.09698864, 0.02708685, 0.030926049, -0.06414696, -0.07180976, 0.043693516) * inp_5_2_0; + result0 += M4(-0.015859181, 0.008474882, -0.0019583204, 0.025104256, 0.11622288, -0.065398544, 0.15351884, -0.029175289, -0.09635269, -0.008340101, 0.01007894, 0.0035908774, 0.025967816, 0.037081588, -0.14414304, 0.073466465) * inp_5_0_1; + result0 += M4(0.08065021, -0.05153395, -0.002465147, -0.013492567, -0.032598022, 0.45930138, 0.46663892, 0.103900634, -0.04901923, -0.090013206, -0.21006538, 0.20859501, -0.048301794, -0.014095961, 0.15357316, 0.0076438906) * inp_5_1_1; + result0 += M4(0.02426149, 0.0021374687, 0.077495165, -0.1258318, 0.044345193, 0.00021493588, 0.01685415, -0.0368571, 0.04374505, -0.1766028, -0.033100635, 0.040366873, 0.1395594, 0.027098102, 0.10932677, -0.06817938) * inp_5_2_1; + result0 += M4(0.009196407, -0.097988635, -0.050098717, -0.016872253, 0.090022065, -0.013037989, -0.0026730855, 0.024800278, -0.04894446, 0.05530746, 0.014768546, -0.09061225, -0.057070952, -0.07252438, -0.00062122854, 0.08389794) * inp_5_0_2; + result0 += M4(-0.101596296, 
-0.055642474, 0.04570439, 0.04361038, -0.14486907, 0.042797673, -0.12054768, -0.063305065, -0.019254709, 0.05217635, 0.02427707, 0.006368446, 0.14061597, -0.12326447, -0.0018781321, -0.04270873) * inp_5_1_2; + result0 += M4(0.10663404, -0.047926433, 0.044095367, -0.07026069, 0.0375175, -0.0886996, 0.044326045, -0.12775558, 0.061518982, 0.0476789, -0.025395926, 0.023615137, 0.09428052, -0.1103412, -0.009147347, -0.03133798) * inp_5_2_2; + result1 += M4(0.053163227, 0.030115737, -0.030637942, -0.025837002, -0.060941413, -0.10949551, -0.120862715, 0.1208325, -0.11690091, -0.06556051, 0.15571932, 0.007036722, 0.058079485, -0.042374987, -0.0488747, 0.0754995) * inp_5_0_0; + result1 += M4(0.03261784, 0.10626132, -0.089328535, 7.441058e-05, 0.073384576, 0.09726181, -0.07114991, -0.013974848, -0.024584785, -0.1362107, -0.14133859, -0.0019457873, 0.021470407, -0.112652674, -0.119304426, 0.099386595) * inp_5_1_0; + result1 += M4(0.24204189, -0.05820033, 0.0008264339, 0.015788814, -0.033113368, -0.014696672, -0.25541672, -0.002837327, -0.06241953, 0.010933759, -0.118518025, 0.03815822, 0.076786935, -0.029461388, -0.16738333, 0.12254171) * inp_5_2_0; + result1 += M4(-0.026658932, -0.02901586, -0.057913918, 0.023599925, 0.04478488, -0.12633042, -0.07728049, -0.022446077, -0.057294432, -0.1906596, 0.0768135, 0.023322254, 0.08313433, 0.048030186, -0.19937456, -0.16442332) * inp_5_0_1; + result1 += M4(-0.015783641, -0.0110256625, -0.13498132, -0.08360165, -0.020236097, 0.21834463, 0.3778501, -0.10348178, -0.14184757, -0.0024434915, 0.37857127, -0.09526714, 0.09978618, 0.10055827, 0.049948208, -0.09012774) * inp_5_1_1; + result1 += M4(-0.0007249339, 0.07442243, -0.046553437, 0.10058906, 0.084018774, 0.0331409, -0.022992447, -0.02720312, 0.055283006, -0.10140711, -0.008944542, -0.07686773, -0.0139478985, -0.035766657, 0.18112116, -0.295391) * inp_5_2_1; + result1 += M4(-0.03283177, -0.0788876, 0.078147784, 0.12382458, -0.028681792, -0.09797458, 0.09658886, 0.038334813, 0.05970046, 
0.1042089, -0.028044544, -0.11702576, 0.04946432, -0.045566108, -0.03265196, 0.20265669) * inp_5_0_2; + result1 += M4(0.07615815, 0.053773694, -0.13425004, -0.10289403, -0.21141896, -0.027510718, 0.117724255, 0.029067636, 0.007772063, 0.05305857, -0.060303167, 0.1656609, 0.18891121, -0.18553078, -0.18784903, -0.04514619) * inp_5_1_2; + result1 += M4(-0.0058164196, -0.035942618, -0.047059286, 0.02922557, -0.040747892, 0.05588013, -0.07001004, -0.0033716587, 0.13195422, 0.18360968, 0.18187922, -0.041588735, 0.015648779, -0.015338238, 0.057859555, 0.22880732) * inp_5_2_2; + result2 += M4(-0.05089461, -0.06880747, 0.03439235, -0.10452725, -0.03418723, 0.018158589, 0.026373662, 0.01823083, 0.06179376, 0.12291096, -0.12697552, 0.07553995, 0.16819894, -0.06165895, 0.07061971, 0.08076528) * inp_5_0_0; + result2 += M4(-0.2184368, -0.03054354, 0.08202403, -0.19400576, -0.05452536, -0.011952951, -0.06794899, 0.122203216, 0.11779741, -0.05228771, 0.09199356, 0.0019564293, 0.1524904, -0.105936274, -0.010267851, 0.09411399) * inp_5_1_0; + result2 += M4(-0.1024979, 0.08116158, -0.007344123, -0.11812001, 0.040182192, 0.01606026, -0.14471118, 0.120311014, 0.10089437, -0.08400024, 0.057646155, 0.11378756, 0.110301286, -0.040258244, 0.021496408, 0.14241529) * inp_5_2_0; + result2 += M4(-0.007884671, -0.10740747, -0.01754323, -0.07541031, 0.12543997, -0.013833602, 0.048891734, 0.10121733, 0.14231123, 0.07870058, 0.06179573, 0.011016393, 0.05418917, -0.26155347, 0.13007818, 0.06546662) * inp_5_0_1; + result2 += M4(-0.035987936, -0.3930357, 0.10958193, -0.5489481, -0.19053532, 0.14033037, 0.43592274, -0.0050594276, 0.025040733, 0.17388758, -0.16107048, 0.7136927, 0.03924278, 0.04421966, 0.014932358, 0.28228682) * inp_5_1_1; + result2 += M4(0.004908621, -0.02024404, 0.060426462, -0.04234812, 0.058657315, -0.03692989, 0.04931202, -0.013500887, 0.002397611, -0.032400943, -0.024726039, 0.057190824, 0.08490632, 0.08427807, -0.3459622, 0.26250184) * inp_5_2_1; + result2 += M4(0.042929225, 
-0.022448707, -0.014097773, -0.09849196, 0.07650107, -0.07192543, -0.045918714, -0.09044093, -0.02750359, 0.10363463, 0.04108734, 0.14084217, 0.086739935, -0.07766882, 0.015197384, 0.086779095) * inp_5_0_2; + result2 += M4(-0.042680692, -0.0435413, -0.02081592, 0.0018394949, -0.11688039, -0.04280503, -0.073257394, -0.06731929, -0.009505822, -0.015929494, -0.06085459, -0.03652785, 0.002387642, -0.100591265, 0.24633902, 0.17450476) * inp_5_1_2; + result2 += M4(0.024364658, 0.03397147, -0.10271644, -0.10208315, -0.011779326, -0.041756544, -0.14783241, 0.038288563, 0.04646152, 0.0361934, 0.17079784, 0.025240134, 0.17275141, -0.06670544, 0.08916464, 0.14281836) * inp_5_2_2; + result3 += M4(-0.0016433772, -0.06395496, 0.044392545, -0.02376804, 0.0032578832, -0.004468666, -0.00853987, -0.08344243, -0.014666987, 0.03971033, -0.04307232, 0.10009123, -0.09495937, 0.05841456, -0.10372049, -0.012789258) * inp_5_0_0; + result3 += M4(-0.1754774, 0.023429831, 0.09371815, -0.015694408, -0.11963432, 0.04584396, 0.055807028, 0.09387724, 0.09942793, 0.008641019, 0.056752395, -0.048205625, -0.16672355, -0.008905546, -0.11106117, -0.001228154) * inp_5_1_0; + result3 += M4(-0.03829054, 0.03206877, -0.03506619, -0.007803222, 0.028911086, -0.021094246, 0.17150551, 0.1928845, -0.051899012, -0.022683851, 0.071469896, -0.009633936, -0.28371215, 0.012550104, -0.04978784, 0.14056697) * inp_5_2_0; + result3 += M4(-0.05456526, -0.0139581235, -0.14226688, 0.0024905521, 0.07598446, 0.0160824, 0.13566287, -0.097559534, 0.08470994, 0.020044724, -0.006391273, 0.03913785, -0.23592253, -0.049078852, 0.075952955, -0.18626446) * inp_5_0_1; + result3 += M4(-0.16849951, -0.030507093, -0.033838596, -0.22402312, -0.29775357, -0.022204434, 0.1599498, -0.33909023, -0.093581155, 0.015534969, 0.0009931519, 0.07484235, -0.19403413, 0.06681865, -0.09450792, 0.013082458) * inp_5_1_1; + result3 += M4(-0.008722489, 0.0006128054, 0.015211376, -0.033959948, -0.013445738, -0.006673427, 0.16608049, -0.16438295, 
-0.10635901, -0.026287759, -0.14944382, -0.06114431, -0.5572859, -0.13040613, 0.01806043, -0.13726111) * inp_5_2_1; + result3 += M4(0.025324216, -0.019472148, 0.12226383, 0.004561716, -0.045955773, -3.4736728e-05, 0.10386858, -0.035570566, 0.08200984, 0.013000245, -0.11241669, 0.122758955, -0.23983026, 0.021620678, -0.0069623124, -0.0866692) * inp_5_0_2; + result3 += M4(-0.063442014, 0.003991682, -0.08261214, -0.043879263, -0.047612466, 0.0064072665, -0.06443755, -0.05235255, 0.057116516, -0.042289082, 0.039665133, 0.012920242, -0.27223322, 0.020552354, 0.15560661, -0.115243696) * inp_5_1_2; + result3 += M4(0.0128492, 0.07751773, -0.020738611, -0.044284575, -0.14505552, 0.0004539792, -0.122859575, -0.08029323, -0.101424895, -0.020329434, 0.04193369, 0.03867216, -0.3186856, -0.04017953, -0.011931473, -0.00901795) * inp_5_2_2; + result4 += M4(-0.081978485, 0.008731177, -0.009671315, 0.11881761, 0.14737126, 0.026059391, 0.1453127, -0.22145276, 0.027277047, 0.012819726, -0.010473002, -0.058562577, -0.029624926, 0.017595857, 0.023331981, -0.070908226) * inp_5_0_0; + result4 += M4(0.09150548, 0.07674018, -0.012784578, -0.07985558, -0.12920624, -0.07422218, 0.08923461, 0.10953051, -0.2087261, 0.10440889, 0.06466868, -0.039136652, 0.049965568, 0.11478386, -0.25069302, 0.07872079) * inp_5_1_0; + result4 += M4(0.049709897, -0.07648281, -0.0453251, -0.052878913, -0.015357472, 0.033534553, 0.013065147, -0.029262222, -0.038605936, 0.029413693, -0.009752422, -0.0522763, 0.13201569, 0.22309795, -0.10203328, 0.07843707) * inp_5_2_0; + result4 += M4(-0.00943669, -0.02357647, -0.010168464, -0.011966337, -0.12490295, 0.24515004, 0.17846109, 0.07853887, 0.1004703, 0.011486755, 0.08667265, -0.00040034638, 0.102375336, -0.045829143, -0.07046418, 0.045852184) * inp_5_0_1; + result4 += M4(-0.4339243, -0.04240526, 0.08855913, 0.019752966, 0.19020529, 0.08014186, -0.5915188, 0.24088357, 0.19341277, 0.0058906153, 0.0487018, -0.12089922, 0.12674676, 0.095529735, 0.14496239, -0.15163405) * 
inp_5_1_1; + result4 += M4(-0.13066274, -0.020357536, 0.030672433, 0.03308246, 0.13391852, 0.18372144, -0.009818675, -0.054323558, 0.0026363488, -0.047271162, -0.055748943, 0.07969257, 0.085714854, -0.025382305, 0.03431107, -0.1627272) * inp_5_2_1; + result4 += M4(0.003020665, -0.10396593, 0.011902204, 0.07312435, 0.093765184, -0.1325592, 0.22710894, 0.018937884, -0.13183898, 0.031228388, -0.07443412, -0.038861208, -0.07230957, 0.07616656, 0.086517304, 0.08261749) * inp_5_0_2; + result4 += M4(0.116928734, 0.10872434, 0.005216119, -0.08336637, -0.08692142, -0.24494134, -0.07662935, -0.15244098, -0.024772238, -0.08173158, -0.17380379, 0.07253603, -0.09260726, -0.100188315, 0.20209496, 0.11850252) * inp_5_1_2; + result4 += M4(-0.014173898, 0.050055653, 0.021336745, 0.028097194, 0.10676832, -0.14054227, -0.032997448, 0.09759295, 0.1968065, 0.119522, 0.0064996337, -0.08544998, -0.06480004, 0.06684704, 0.17936917, -0.0064673736) * inp_5_2_2; + result5 += M4(0.08665207, -0.014733728, -0.03439795, 0.014946461, 0.12191395, 0.34902343, -0.15557007, -0.06618843, -0.038352728, -0.015582131, 0.008399964, 0.019552283, 0.006831162, 0.0484393, 0.041982424, 0.04917752) * inp_5_0_0; + result5 += M4(0.061198276, 0.1254916, -0.0866367, -0.039402395, -0.14817049, 0.5130939, -0.19919015, -0.17593104, 0.022492269, 0.053934958, -0.08103255, -0.006178789, -0.08096894, -0.13555562, 0.06531979, 0.031465143) * inp_5_1_0; + result5 += M4(-0.0017537047, -0.0058338325, -0.022249585, -0.040268507, -0.15536328, 0.33079246, -0.20307569, -0.040409602, -0.081662245, -0.0057570254, -0.02416426, -0.0034949684, -0.12064619, 0.053589292, -0.048280526, -0.060501892) * inp_5_2_0; + result5 += M4(-0.023151474, 0.025483055, 0.03302465, -0.053557098, 0.01878202, 0.48855963, 0.14157878, -0.052844502, 0.04966715, 0.08792078, 0.12310278, 0.06091125, 0.069299795, -0.11052675, -0.057348035, -0.039336666) * inp_5_0_1; + result5 += M4(-0.012678735, -0.20442308, 0.039045762, -0.051613014, 0.07281968, 1.0343851, 
0.4127859, -0.048605893, -0.0015168578, -0.07037902, 0.12139327, 0.043819714, 0.045538, -0.18176125, 0.022056846, 0.0005423375) * inp_5_1_1; + result5 += M4(0.04133189, 0.0012175002, -0.05802783, -0.086031586, -0.057386238, 0.44495016, -0.032954965, 0.037303012, 0.16479154, 0.05773966, 0.01573409, 0.018100003, 0.06942059, -0.22936065, -0.01792656, 0.09765454) * inp_5_2_1; + result5 += M4(-0.05759195, 0.048286095, -0.01451397, 0.07753058, -0.06851057, 0.25636473, -0.04180832, 0.01919419, 0.05657882, -0.051161885, -0.005812322, -0.076693, -0.023606462, -0.01839714, 0.03828975, 0.06775395) * inp_5_0_2; + result5 += M4(-0.035349704, 0.024843054, 0.09386931, 0.099540524, -0.09546079, 0.46071944, -0.044423927, -0.06338417, -0.027697293, -0.047288228, -0.07253479, 0.097908825, -0.09055675, 0.14732157, 0.03998545, 0.10484554) * inp_5_1_2; + result5 += M4(0.030144554, 0.09282306, -0.106014095, -0.043188702, -0.06866675, 0.24503854, -0.33104092, 0.060447738, -0.07752346, -0.14617719, 0.027633805, -0.059127916, -0.2133411, 0.11343608, 0.108426996, -0.078282446) * inp_5_2_2; + result6 += M4(0.017146543, 0.07195347, 0.020474782, 0.10021011, 0.07946469, -0.048385706, 0.035112847, -0.006273241, -0.022339504, 0.10111638, -0.046621624, -0.16082487, 0.042175107, -0.103130214, 0.028282315, -0.0988534) * inp_5_0_0; + result6 += M4(0.0352779, -0.042162426, 0.071050584, 0.05833724, 0.11845236, 0.1251091, 0.024088811, -0.08335935, -0.12863266, 0.11600836, 0.03180283, -0.08279313, -0.06791756, -0.18051551, -0.040628698, -0.105102845) * inp_5_1_0; + result6 += M4(-0.067785904, -0.06739106, -0.017867617, -0.017591527, 0.047302313, -0.030611094, -0.027617399, 0.028833665, 0.04271483, -0.0016429841, 0.018974971, -0.050833248, 0.020180678, -0.0019380851, 0.014650357, -0.10082412) * inp_5_2_0; + result6 += M4(0.009767641, -0.009299312, -0.022824276, 0.09675148, 0.027000414, -0.10451104, -0.024415737, -0.13894948, -0.05768862, 0.082830854, 0.06221253, -0.2545634, -0.14260367, 0.091374844, 
-0.0071491837, -0.13828793) * inp_5_0_1; + result6 += M4(0.028257204, -0.04447945, 0.13823047, -0.09031003, 0.1818435, -0.16005519, -0.075830966, 0.26581088, 0.03027853, 0.06225854, -0.17510638, 0.12744462, 0.019942556, 0.065034024, -0.10274122, -0.07896024) * inp_5_1_1; + result6 += M4(0.038249422, -0.029685864, -0.0094582075, -0.10248129, -0.008710387, -0.026165457, 0.005976542, -0.0066294908, -0.046754308, 0.0018705112, 0.061219167, 0.0062646423, -0.10355338, -0.112634316, 0.042089604, -0.103306025) * inp_5_2_1; + result6 += M4(-0.045211665, -0.033496004, 0.07130816, -0.093034185, -0.024511328, 0.078480706, 0.022099065, -0.0063585923, 0.08217455, -0.068966866, -0.06517585, 0.1392229, -0.09056001, -0.052128717, 0.015343711, -0.12273842) * inp_5_0_2; + result6 += M4(-0.041267555, -0.0121253915, 0.047172245, -0.030350387, 0.12069247, 0.12190868, -0.00843262, -0.012527678, 0.060970213, -0.012181705, 0.03164267, 0.062954076, -0.078739755, 0.036241636, 7.553352e-05, -0.12768728) * inp_5_1_2; + result6 += M4(0.009428621, 0.03308015, -0.020445896, -0.121635035, 0.12464413, -0.012552904, 0.018786203, -0.061635923, 0.02892714, -0.04556199, 0.009078409, 0.08156567, 0.07953163, 0.14660418, 0.03281469, -0.10681093) * inp_5_2_2; + result7 += M4(-0.07755879, 0.001409955, 0.080113985, 0.044837657, -0.02902784, 0.0453789, -0.19918056, -0.13519815, 0.06071678, -0.017768841, -0.107843705, -0.028775323, 0.078276545, -0.00448468, 0.011384543, -0.07118215) * inp_5_0_0; + result7 += M4(0.020012148, 0.06290545, 0.08594064, -0.059813794, -0.071024366, 0.02439831, 0.022521794, -0.05762041, -0.079059206, 0.03366543, 0.06894578, 0.04634653, -0.018088952, -0.055296224, 0.048158336, 0.00052413566) * inp_5_1_0; + result7 += M4(0.06857875, 0.04631308, 0.063786946, -0.12448301, -0.05874095, -0.04511761, 0.11245571, -0.17079069, 0.05397501, -0.007799154, -0.03738197, 0.004935458, 0.06348767, -0.044503845, 0.029091693, 0.021400971) * inp_5_2_0; + result7 += M4(-0.012583525, -0.018320743, 
0.055667475, -0.14299099, 0.053300552, 0.03134462, -0.053179096, 0.086316325, 0.0009091387, -0.015577178, 0.019550147, -0.10241137, -0.12569317, 0.013249083, 0.06836901, 0.0133160055) * inp_5_0_1; + result7 += M4(-0.03420927, 0.23104991, 0.47808087, 0.060338102, -0.19527173, -0.2905466, 0.09608559, -0.124330826, -0.096963815, -0.29860568, -0.49789473, -0.09644599, -0.0034421296, -0.058462963, -0.14370023, 0.02043516) * inp_5_1_1; + result7 += M4(0.105033144, 0.055408422, 0.15040505, 0.042433683, -0.09824583, 0.014011664, 0.0780022, -0.010407359, -0.069793984, -0.026357459, -0.050134815, -0.0056409263, 0.13164721, -0.023186551, -0.034109626, -0.08412489) * inp_5_2_1; + result7 += M4(-0.000686607, 0.015475212, -0.0076115374, -0.030022096, 0.09115867, 0.0049877916, 0.028928516, 0.024060426, 0.09289277, -0.025827307, -0.0028435676, -0.036280386, -0.009932912, -0.0026674443, -4.2211093e-05, -0.09942692) * inp_5_0_2; + result7 += M4(-0.080379285, 0.08226599, 0.06263767, 0.02839101, -0.2889866, 0.0071601234, 0.11777941, -0.1139161, -0.02848327, -0.054467835, 0.029276526, 0.06994259, 0.2020753, -0.05809008, -0.047375616, -0.15917233) * inp_5_1_2; + result7 += M4(0.017120434, 0.061842583, 0.16634838, -0.048323035, 0.015774501, 0.02568165, 0.19701882, 0.056263637, -0.0083325235, -0.00514872, -0.07123524, 0.0025612267, -0.17592408, -0.004829901, 0.16188622, -0.010181982) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.022662565, 
0.02176172, 0.031047488, -0.11067613, 0.010133441, 0.033218984, -0.033945628, -0.077870145, -0.008262249, 0.032401863, -0.031276446, -0.016952295, -0.043772437, 0.056907352, -0.0946162, 0.09006121) * inp_6_0_0; + result0 += M4(0.017040696, -0.044044662, 0.13394083, -0.09612405, -0.08078334, 0.07400945, -0.020238824, 0.029793039, -0.07849465, -0.02886134, 0.055123046, -0.010653626, 0.16018832, -0.036940917, -0.06712302, -0.12673457) * inp_6_1_0; + result0 += M4(0.12287229, -0.015073312, 0.15345484, -0.13125063, -0.017165022, 0.4159603, -0.097369164, -0.1395624, -0.008073821, 0.013593207, 0.021631084, 0.040323455, 0.06321758, -0.028390089, -0.07807858, -0.021472875) * inp_6_2_0; + result0 += M4(-0.07047176, 0.032713864, 0.0137235, -0.04372021, 0.045677308, 0.09478718, -0.026812516, -0.030567927, -0.057995263, -0.049896773, 0.0059265587, 0.033297904, -0.020974014, 0.21497244, -0.23850913, -0.07458344) * inp_6_0_1; + result0 += M4(0.093734205, 0.048767734, 0.08533877, -0.1599017, 0.0831247, -0.42410544, 0.06197638, -0.025946354, 0.01345063, 0.1433013, 0.124061465, -0.1340586, -0.1532807, 0.0071958816, 0.11053866, -0.17644954) * inp_6_1_1; + result0 += M4(-0.12367105, 0.09430558, -0.28992137, 0.093805075, -0.044040952, 0.095564984, 0.109782256, 0.0437214, -0.027480988, -0.03442494, -0.13606414, -0.0033933218, -0.07537912, 0.20092618, 0.16240402, 0.07673302) * inp_6_2_1; + result0 += M4(-0.031000234, 0.03345831, -0.085711, -0.10966906, -0.007225471, -0.00018210147, -0.027986502, -0.034326024, 0.19785415, 0.14977622, -0.07502296, 0.07963666, -0.07693806, -0.1751338, 0.017238509, 0.13737452) * inp_6_0_2; + result0 += M4(-0.033897035, -0.060299773, -0.047966577, -0.16041975, -0.018925058, -0.0069016516, 0.065542795, -0.10214473, -0.023588412, 0.023308706, -0.12040352, 0.09502946, 0.16837138, 0.027456043, 0.11100462, -0.1577611) * inp_6_1_2; + result0 += M4(-0.28854597, 0.069381654, -0.10589031, 0.059290722, -0.048073024, -0.072590716, -0.030349195, -0.06293276, 0.007873924, 
-0.005269388, -0.11836302, 0.07247899, -0.07915952, -0.01155746, -0.12287877, -0.031772703) * inp_6_2_2; + result1 += M4(-0.1492508, 0.04419659, 0.08584264, -0.09106756, 0.040658787, -0.0068975417, -0.08413319, -0.007948746, -0.104236335, -0.015870739, -0.076965615, -0.027703, -0.11968809, 0.0036426606, -0.13528155, -0.06675776) * inp_6_0_0; + result1 += M4(0.046767768, 0.14498001, 0.0137019195, -0.2762634, -0.08301796, -0.0381739, -0.122010425, -0.049715903, 0.012905702, 0.032977697, 0.06306705, -0.027665475, 0.12606758, -0.00935986, 0.06770101, 0.12946673) * inp_6_1_0; + result1 += M4(-0.47543922, 0.06766018, 0.05186825, -0.09191922, 0.15787455, -0.121539526, 0.31240228, -0.14566931, 0.0008109791, 0.041136768, -0.03195533, 0.04042247, -0.016029973, 0.0940737, 0.040516343, 0.004909924) * inp_6_2_0; + result1 += M4(0.07979845, -0.06353748, 0.030827152, 0.041357685, -0.0800338, -0.106950775, -0.06833297, -0.12957431, -0.036484595, 0.013483876, 0.1311274, 0.14309974, 0.18997373, 0.030550603, -0.1454263, -0.077398196) * inp_6_0_1; + result1 += M4(-0.08351891, 0.087970376, 0.15670797, -0.07483462, 0.4136507, 0.23026279, -0.1595789, 0.1342068, 0.20100828, -0.15992345, 0.24500774, -0.06217506, -0.13873757, -0.10639632, -0.25519928, 0.12289211) * inp_6_1_1; + result1 += M4(0.05649937, -0.13829966, -0.06926285, 0.16086845, 0.11136481, -0.13024735, -0.11109521, 0.17485645, 0.01666002, 0.09547379, -0.024069212, 0.047422227, -0.17598514, -0.103104554, -0.009266948, 0.09092815) * inp_6_2_1; + result1 += M4(-0.10474804, 0.016698934, 0.029720983, -0.13150644, -0.063225284, -0.05904626, -0.009949913, 0.00018698188, 0.07028293, -0.033586286, -0.07864628, 0.033227555, 0.16869347, -0.081360534, 0.094108135, 0.2211802) * inp_6_0_2; + result1 += M4(-0.26949, -0.044507578, 0.1477516, 0.036132596, -0.043683667, -0.076060124, 0.026270686, 0.06416137, -0.1283779, -0.13623863, -0.042199202, -0.05594856, 0.3736512, 0.08141126, -0.23937687, -0.119359955) * inp_6_1_2; + result1 += 
M4(0.084934175, 0.061839666, 0.010982163, -0.26843917, 0.004296467, 0.09378715, 0.09337865, -0.03648232, 0.020570103, 0.09742387, -0.00092384644, -0.05229222, 0.029906118, 0.058147784, -0.004575042, -0.0021433174) * inp_6_2_2; + result2 += M4(-0.09728809, 0.12705815, -0.028977007, -0.13854632, 0.07775079, -0.01154811, -0.054849498, 0.042522572, -0.013445212, 0.025924275, 0.027557472, -0.043836106, -0.03986896, -0.117435925, 0.062532805, -0.1545375) * inp_6_0_0; + result2 += M4(-0.14383373, 0.18368949, -0.10276375, -0.09745836, 0.057789564, -0.033151116, -0.07986056, -0.17011829, 0.006027637, 0.034716703, -0.070138164, -0.003411713, -0.007138873, 0.0833064, -0.044077292, -0.030886922) * inp_6_1_0; + result2 += M4(-0.10252342, 0.056591894, -0.023250006, -0.22413959, 0.05353864, -0.06627729, -0.0886889, -0.10153446, -0.03933207, 0.009793733, -0.0045435447, -0.004461575, 0.017490178, 0.080378845, -0.0071444563, -0.05331926) * inp_6_2_0; + result2 += M4(-0.098941, 0.040722124, 0.027304756, -0.16025057, 0.2098127, -0.07817846, 0.04404543, -0.18956026, -0.08948699, 0.01230849, 0.07202974, 0.050348695, 0.048572678, -0.168869, 0.045545164, -0.24809511) * inp_6_0_1; + result2 += M4(-0.09936324, 0.31672347, -0.13130951, 0.045155503, 0.36198738, -0.12747245, 0.074202925, -0.3330781, -0.1464172, -0.1622254, 0.090740085, -0.10589896, -0.085408434, -0.16782056, 0.11473101, -0.3355733) * inp_6_1_1; + result2 += M4(0.010354405, 0.123217784, 0.15721191, -0.45024335, 0.04826859, -0.012769763, 0.06803188, -0.04514185, 0.021900792, -0.01662945, -0.12624656, 0.044610206, -0.00435643, -0.008694052, -0.047312513, 0.007757288) * inp_6_2_1; + result2 += M4(-0.08055778, 0.07800522, -0.053581987, -0.10969689, 0.080745876, 0.042631555, -0.09987554, -0.099668436, 0.085227326, 0.070624724, 0.08070706, -0.0028242047, -0.12818842, -0.075480625, -0.015591966, -0.10367721) * inp_6_0_2; + result2 += M4(0.027008172, 0.14759146, -0.1670905, -0.15166657, 0.21059166, -0.0551149, -0.15026438, 0.07846565, 
-0.041948162, -0.06116516, -0.10198152, 0.0049422076, -0.22084834, 0.026073638, -0.012006051, -0.23930168) * inp_6_1_2; + result2 += M4(-0.37885672, 0.09818381, -0.15209103, -0.21781725, 0.14618927, -0.0040617506, 0.05117922, -0.02672699, 0.042790525, 0.07494308, -0.10597002, -0.050133295, -0.05204497, 0.061795615, 0.014891126, -0.036957268) * inp_6_2_2; + result3 += M4(0.185546, -0.032288086, 0.03415255, 0.10309088, 0.12632178, -0.0089605255, -0.00026329645, -0.05788586, -0.013285484, 0.014707667, -0.0064637004, -0.034020472, -0.025541177, -0.012849491, 0.052110005, -0.02604595) * inp_6_0_0; + result3 += M4(0.41292533, -0.0627427, 0.01737347, -0.057093598, -0.16102254, -0.037011318, -0.007919761, -0.025018075, 0.0450738, -0.026855862, -0.049001496, -0.02301973, 0.07580025, -0.037616286, -0.032519244, -0.06378584) * inp_6_1_0; + result3 += M4(0.3346523, -0.017829685, 0.33904034, -0.10046771, -0.2506381, 0.06847256, -0.16621499, -0.037054002, -0.06243941, 0.03671546, 0.011701322, -0.028419089, 0.041693617, 0.00808051, -0.055128235, -0.1270356) * inp_6_2_0; + result3 += M4(0.14584646, 0.040582735, -0.03203946, 0.029161131, 0.1569903, 0.031786006, 0.02203093, 0.052464753, -0.17344344, -0.05616043, -0.02038793, 0.16157192, -0.00088637654, -0.08918169, -0.21939383, 0.02132507) * inp_6_0_1; + result3 += M4(0.22482826, 0.18882215, -0.2109867, 0.20965013, -0.21185277, 0.08119736, -0.094712876, 0.36543417, -0.032067187, 0.03824958, 0.07664706, -0.11212712, 0.1502659, 0.14563361, -0.08573973, -0.09569288) * inp_6_1_1; + result3 += M4(0.5668292, 0.07864384, -0.15851574, 0.2253648, 0.36334848, -0.06548732, -0.02119428, -0.23140793, -0.03483558, -0.029035846, -0.011677813, -0.0063593257, 0.043029856, 0.041056473, 0.054387067, 0.15371555) * inp_6_2_1; + result3 += M4(0.18089499, -0.047573827, 0.005182853, 0.12310185, 0.0988627, -0.022082662, -0.074445374, 0.031603467, -0.10876057, 0.034450483, -0.21183711, 0.27282053, 0.023163272, -0.05425671, 0.21672472, -0.06922515) * 
inp_6_0_2; + result3 += M4(0.3654263, -0.060631882, 0.18439434, 0.12481628, 0.04861879, 0.022381956, 0.025325563, 0.012068141, 0.25170138, -0.040667526, -0.054647002, 0.0020854932, 0.047459282, 0.037005134, -0.22579049, 0.1441387) * inp_6_1_2; + result3 += M4(0.31363022, 0.017053004, 0.033711996, 0.2867573, 0.101877645, -0.025373004, 0.04963279, 0.033481166, -0.07591163, -0.0007023842, -0.06795067, -0.09677775, 0.0070751975, 0.0111449305, -0.106338166, 0.037016667) * inp_6_2_2; + result4 += M4(0.03351123, -0.11655427, -0.03357911, -0.07020249, -0.09868351, 0.020003919, 0.15566629, 0.111611955, 0.03797199, 0.0100544365, 0.01791509, -0.028324421, -0.08026222, -0.088658996, 0.079744495, -0.05380528) * inp_6_0_0; + result4 += M4(0.2093525, -0.19591491, -0.041430935, -0.1769227, 0.19246429, 0.026085977, -0.05653853, 0.07229085, -0.021525076, -0.012955541, 0.05822974, 0.022376334, 0.10470525, -0.043411467, 0.08422375, -0.08633609) * inp_6_1_0; + result4 += M4(-0.113138996, -0.29777002, 0.097035415, -0.17521766, -0.12739336, -0.017126556, -0.0025361879, -0.091820754, 0.010870739, 0.040008564, 0.010054603, -0.008001849, 0.0048292037, -0.08841783, 0.061841697, -0.03285206) * inp_6_2_0; + result4 += M4(0.15313675, 0.10109318, 0.05147042, -0.101560265, 0.1182915, -0.02052267, 0.059898324, 0.11955758, -0.0039292537, 0.10427425, 0.12080389, 0.052777626, 0.04190581, 0.16115965, -0.18883778, -0.04855676) * inp_6_0_1; + result4 += M4(0.1106125, 0.06403678, -0.03785207, -0.2804395, -0.23224425, 0.0776971, 0.102057956, -0.07645924, -0.12819959, -0.13052844, -0.15730965, -0.12691382, -0.13231787, -0.21864872, -0.20197552, 0.120350175) * inp_6_1_1; + result4 += M4(-0.028920438, 0.30645525, -0.09111205, 0.0016827547, -0.21038549, 0.12553698, -0.07064634, -0.08422061, 0.05563499, 0.08968355, -0.026228696, 0.017037652, -0.098600306, 0.063330404, -0.008508259, 0.027112292) * inp_6_2_1; + result4 += M4(0.020318398, -0.1082526, -0.046913218, -0.0086583495, 0.1518727, -0.06683231, 
-0.040266704, -0.07956474, 0.071654856, 0.039180983, 0.26956534, 0.064652994, -0.016598048, 0.010794737, -0.010483676, 0.16300574) * inp_6_0_2; + result4 += M4(0.11134099, -0.05475089, -0.08916288, -0.0788205, -0.05166639, 0.14720303, -0.051651753, 0.18677604, -0.13057844, 0.14725175, -0.06957975, 0.044068716, 0.11644188, 0.16409175, 0.11227571, 0.3046591) * inp_6_1_2; + result4 += M4(0.34201884, -0.14044404, -0.04303451, 0.025608726, -0.085761964, 0.0022005555, 0.0053634727, -0.06099608, 0.022460181, -0.0020911195, -0.10174249, -0.01883417, -0.10148095, 0.0049525136, 0.047242865, 0.12056862) * inp_6_2_2; + result5 += M4(-0.03084787, -0.043743838, 0.0013361761, 0.0010635621, -0.0006340321, 0.14626092, -0.062524706, -0.056714725, -0.046213068, 0.008212069, -0.038495477, -0.052282322, 0.13648538, 0.10985524, -0.034487, 0.03140544) * inp_6_0_0; + result5 += M4(-0.11180962, 0.07738783, 0.00013493697, 0.069898434, -0.014950715, -0.034949496, -0.045437455, 0.040848527, 0.056710213, 0.023578113, -0.041299984, 0.034865517, 0.09137486, 0.044838328, -0.011997275, 0.09208104) * inp_6_1_0; + result5 += M4(0.21378994, 0.20275737, 0.08551785, -0.03031537, 0.23998004, -0.1881181, 0.03192166, 0.11558745, -0.007510867, 0.005142982, -0.0186586, -0.054318935, 0.13884911, -0.080374055, 0.07896791, -0.13564576) * inp_6_2_0; + result5 += M4(0.010643287, -0.050605524, 0.0893235, -0.036525786, 0.040669795, -0.03025073, -0.06990102, -0.0415294, -0.08315493, 0.10482798, 0.017328838, 0.01531095, 0.0717909, 0.047141626, 0.016256347, -0.19347054) * inp_6_0_1; + result5 += M4(-0.067926444, -0.036405887, 0.054175954, -0.22704571, -0.031879175, -0.094859935, -0.0075357556, -0.009981205, 0.06891248, -0.3400711, 0.042274006, -0.13024047, -0.29953814, 0.29648513, -0.0837207, -0.13472189) * inp_6_1_1; + result5 += M4(-0.17257512, -0.035090223, 0.22645073, -0.19988519, -0.01734958, 0.013582395, 0.009763802, 0.0021932905, 0.044697754, 0.11186724, -0.054914236, 0.04331771, -0.13643798, 0.015042445, 
-0.050239883, 0.106387116) * inp_6_2_1; + result5 += M4(0.017438427, -0.0083507905, 0.010537823, -0.04127759, -0.0062385714, 0.04496947, -0.11327308, 0.082287, 0.07574159, 0.17377695, -0.022043332, -0.09117809, -0.075235374, -0.068843804, 0.03966712, 0.17877273) * inp_6_0_2; + result5 += M4(0.00517535, 0.040186256, 0.013450924, 0.078003824, 0.029452236, -0.06100186, -0.037188433, -0.04982236, -0.094965905, -0.120676585, 0.10076764, 0.02894041, 0.11453628, -0.20461118, 0.05865534, 0.027957011) * inp_6_1_2; + result5 += M4(-0.052163508, 0.09756601, -0.054054465, 0.16970202, -0.0024914322, 0.16250038, -0.030870328, -0.027966816, -0.02453819, 0.03823494, -0.012348601, -0.042337127, 0.040229857, 0.079429656, -0.03855773, 0.05825826) * inp_6_2_2; + result6 += M4(0.03146201, -0.077358946, -0.009481048, 0.09710753, 0.043762375, -0.041047815, 0.023138152, -0.11795152, 0.0030393472, -0.04231185, 0.0029345278, 0.0078117833, -0.028776566, -0.07412193, 0.06371752, 0.06826864) * inp_6_0_0; + result6 += M4(0.058841508, 0.11625898, 0.042352494, 0.1264791, 0.100371085, -0.046975877, -0.014642208, 0.02348159, 0.035280276, 0.006505467, 0.053266108, 0.066343956, -0.03194247, 0.050474428, 0.092937015, 0.036239758) * inp_6_1_0; + result6 += M4(-0.12247129, -0.054473232, -0.034500774, 0.040724248, -0.024916235, -0.06906076, 0.042794775, -0.099764116, -0.0015231459, 0.06014854, 0.008951344, 0.009885078, 0.06924082, 0.039011408, 0.014870041, 0.059346154) * inp_6_2_0; + result6 += M4(0.07254418, 0.059764046, -0.0020460703, 0.18339461, 0.08526254, 0.0022531361, 0.037749656, -0.01943397, -0.10345676, 0.101171695, 0.04093941, 0.058882628, 0.04914567, 0.096198894, 0.02462599, 0.067873724) * inp_6_0_1; + result6 += M4(0.20057377, -0.16678156, 0.07223634, 0.2106842, -0.17483, -0.04045807, 0.1341446, -0.23947048, 0.21032043, -0.20521832, -0.16874912, -0.010895902, 0.055160496, -0.03556664, 0.1067081, 0.040328085) * inp_6_1_1; + result6 += M4(-0.0597152, 0.04561408, -0.07391488, 0.24235682, 
-0.09921651, -0.13398564, 0.02576114, -0.08956477, -0.06787527, 0.012861433, -0.034934904, 0.07118085, 0.0150615545, -0.052876145, 0.007870862, 0.16341296) * inp_6_2_1; + result6 += M4(0.033775102, -0.07671312, 0.012382573, 0.121964484, 0.14321166, 0.035436336, 0.0481375, -0.032273855, 0.111287475, 0.08795221, -0.10027117, 0.10220403, -0.16663294, -0.14994253, 0.024246393, 0.09996502) * inp_6_0_2; + result6 += M4(-0.1047591, -0.052500725, 0.10865591, -0.02306723, 0.033228405, -0.005258342, 0.013029212, -0.11010327, -0.15415265, 0.08881764, -0.03938417, 0.08686939, -0.13690643, -0.18577002, 0.05901176, 0.08083571) * inp_6_1_2; + result6 += M4(0.07044876, -0.065358914, -0.12994884, 0.26130137, 0.008974159, 0.011586497, 0.07753359, -0.07690641, -0.014970455, -0.0409436, -0.021933433, 0.055242892, -0.0860284, 0.11282399, 0.0029614477, -0.028931513) * inp_6_2_2; + result7 += M4(0.05293374, -0.034820583, -0.06703012, 0.06325874, -0.022009883, 0.06587183, -0.1410693, -0.09765959, 0.05999544, -0.022391513, -0.04569822, -0.015547883, -0.10717338, 0.035043966, 0.100084364, -0.077007905) * inp_6_0_0; + result7 += M4(-0.05390019, 0.012426201, 0.019088764, 0.05139499, -0.1787579, 0.017130725, -0.041534886, 0.1716623, -0.030412016, 0.011566945, 0.06312229, -0.016118886, -0.053645458, 0.017684467, 0.15130924, -0.103701614) * inp_6_1_0; + result7 += M4(-0.045972627, 0.00783866, -0.016245978, -0.21848169, -0.03677847, 0.13728806, -0.05128183, 0.115026064, 0.023616668, 0.0046225972, -0.02629118, -0.0065984633, 0.017711861, -0.0076629, 0.009504906, -0.03888971) * inp_6_2_0; + result7 += M4(0.0011861536, -0.028205145, -0.003721589, 0.011130133, 0.036028538, -0.021428093, -0.06982834, -0.045311913, 0.18088165, 0.052478503, 0.09143515, 0.0017651046, 0.13371183, -0.044848405, 0.21105206, -0.12305451) * inp_6_0_1; + result7 += M4(0.19593745, 0.03210811, -0.114854224, 0.22755061, -0.28998613, 0.118310034, -0.52791077, 0.1544713, 0.14201693, 0.1977915, -0.31013045, 0.024472913, 0.07843247, 
0.1989355, 0.23659293, 0.0866097) * inp_6_1_1; + result7 += M4(-0.020790655, -0.014497923, 0.18173507, -0.1529637, 0.26787937, -0.05265967, -0.09187476, 0.09301387, -0.063401826, -0.034877323, -0.0010457438, -0.065697156, 0.02080821, -0.034697264, -0.057621155, 0.12996827) * inp_6_2_1; + result7 += M4(0.054232243, -0.0003540933, -0.08789266, -0.014577661, -0.06187757, 0.019614697, -0.024848888, 0.023302058, 0.16288719, -0.018200437, -0.11264242, 0.03584354, -0.21507101, -0.008851964, 0.074968085, 0.108757906) * inp_6_0_2; + result7 += M4(0.1375424, 0.054197382, -0.03428461, -0.08468458, 0.021722917, 0.0034591001, -0.062179934, 0.08813356, -0.007602519, -0.05286331, -0.07144538, -0.020984, 0.31013587, 0.11048175, 0.06766904, 0.05246831) * inp_6_1_2; + result7 += M4(-0.14231342, -0.051772982, -0.053020842, 0.16402012, -0.11601745, 0.0093022045, 0.0012165563, 0.08256463, 0.12014372, 0.0039739157, -0.034550488, 0.0368548, -0.020246841, -0.008722948, 0.027616262, -0.043535452) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.11022096, 0.011482773, 0.039873466, 0.015228517, 0.056417406, 0.06373515, -0.11187405, -0.09049438, -0.04402273, 0.09030303, -0.2376386, -0.11208759, -0.07346641, -0.027435657, 0.0050526243, -0.00019081912) * inp_7_0_0; + result0 += M4(0.09013321, 0.08215407, -0.09750597, -0.021216216, -0.13443422, -0.21532916, 0.056260515, 0.029428372, -0.070409745, -0.11779351, 0.07556854, 0.059305828, 0.0891374, 0.05234228, 
0.17114203, 0.0074714324) * inp_7_1_0; + result0 += M4(-0.028173164, 0.07556595, -0.09262134, -0.0077569564, -0.010631451, 0.021527193, 0.09270138, -0.060953435, 0.004196015, 0.11433513, 0.018561658, -0.11694085, -0.0058117625, -0.091905855, -0.078881845, -0.107506305) * inp_7_2_0; + result0 += M4(-0.03187561, -0.021113746, -0.07477762, -0.012591281, 0.012346929, 0.02665705, -0.043360375, -0.040885903, -0.09451367, -0.011944276, 0.18507242, -0.0920411, -0.13992557, 0.055390105, 0.15251854, -0.17506237) * inp_7_0_1; + result0 += M4(-0.1555577, -0.10397788, 0.05424246, -0.014995283, -0.06352323, 0.007809084, 0.17071044, -0.05167155, 0.022469448, 0.05773306, -0.009096258, -0.09406734, 0.22249402, -0.20213959, -0.012580843, -0.10672017) * inp_7_1_1; + result0 += M4(-0.11183928, 0.0028043718, 0.16121423, 0.05857266, 0.048791114, -0.055762686, 0.06332813, -0.0006916623, 0.025087772, -0.05771214, -0.07257306, -0.07195575, -0.14890692, 0.0036384193, -0.03936884, -0.10538251) * inp_7_2_1; + result0 += M4(0.10405207, -0.0016909636, -0.01495242, 0.007569798, 0.005287026, -0.0061448645, -0.12386408, -0.021777894, 0.065546274, 0.01808067, 0.011864633, -0.045296848, -0.067812555, -0.10803324, 0.24383216, 0.0093610175) * inp_7_0_2; + result0 += M4(0.0884318, -0.027104398, 0.013594732, 0.029033976, 0.07884433, -0.1712009, 0.0826759, 0.023523081, 0.12975687, -0.08164581, 0.08321164, -0.00020502675, 0.28008497, -0.10125179, 0.20977367, -0.24806002) * inp_7_1_2; + result0 += M4(0.117803596, 0.016670883, 0.2681313, -0.039233547, -0.12944682, 0.063220635, -0.018049292, 0.07075836, -0.045880605, -0.0021113674, 0.094006605, 0.025561247, -0.050408095, 0.020062549, -0.14858866, 0.0053829835) * inp_7_2_2; + result1 += M4(-0.038750425, -0.035261627, 0.032208346, -0.085805334, -0.15405802, 0.04878469, -0.09173975, -0.0071753953, -0.17335176, -0.03724122, -0.06007797, -0.054613985, 0.0065317773, -0.10838213, -0.011641486, -0.04792059) * inp_7_0_0; + result1 += M4(-0.036310017, -0.034187578, 
-0.028452702, -0.10241997, -0.06146276, 0.117450446, 0.079410054, 0.08022572, 0.04140629, -0.0121517, 0.089955114, 0.027275046, 0.01531277, 0.07248514, 0.071419254, 0.008395838) * inp_7_1_0; + result1 += M4(0.081174605, 0.09528748, -0.2238008, 0.12270269, 0.05815606, 0.02410455, -0.0048464807, -0.0067078983, 0.07424298, -0.121125326, -0.06281625, -0.10278789, -0.04710438, -0.0038722854, -0.040362097, -0.029764604) * inp_7_2_0; + result1 += M4(0.050712507, 0.027368419, 0.008513996, 0.07460419, -0.021956451, -0.00053891493, -0.08340941, -0.047463886, 0.06599599, -0.06234021, -0.12184921, -0.046419006, -0.19751067, 0.07278192, -0.015982216, -0.14425221) * inp_7_0_1; + result1 += M4(-0.12677167, -0.024302546, 0.25301355, 0.24907334, -0.14745091, 0.0123119, 0.03315016, -0.12604839, 0.02104371, 0.03689506, 0.081811585, 0.08363414, 0.1222896, 0.09136149, -0.17691818, -0.06523168) * inp_7_1_1; + result1 += M4(0.42910525, 0.0426603, -0.18015476, 0.060419783, 0.07315737, 0.02736246, 0.0031960397, 0.049161665, -0.051263805, 0.009277149, -0.05801566, 0.058256052, -0.09557392, -0.11019185, 0.07357578, 0.10300213) * inp_7_2_1; + result1 += M4(0.0076170317, 0.017688349, -0.06172023, 0.0018221186, -0.1785554, -0.022142278, 0.06663555, 0.046899498, -0.07946061, 0.019766206, 0.008300228, 0.04099154, 0.19570711, 0.028938306, 0.005188872, 0.09505019) * inp_7_0_2; + result1 += M4(0.1728114, 0.05928747, -0.22721566, -0.13097271, 0.05977639, 0.06833878, -0.09385581, -0.21699071, -0.035750587, -0.019792644, 0.008943096, -0.015955642, -0.040257793, -0.11289454, 0.1052812, -0.01123072) * inp_7_1_2; + result1 += M4(0.29802194, 0.04513804, -0.21758196, -0.15869115, 0.043702345, -0.02264359, -0.027486468, -0.020602042, 0.066951565, -0.03860428, -0.031131841, 0.027195996, -0.14034495, 0.054269828, 0.07415559, -0.1069007) * inp_7_2_2; + result2 += M4(0.052797157, -0.020076701, 0.03573245, -0.050302766, -0.048102334, 0.0543038, -0.16020842, -0.013800323, 0.13463417, -0.012401103, -0.051421653, 
0.0022438113, 0.18893264, 0.017786704, 0.010133415, 0.011534617) * inp_7_0_0; + result2 += M4(0.04592096, -0.10930645, 0.047207676, 0.060161136, -0.052191216, -0.014479013, 0.065343685, -0.03444602, 0.19656916, -0.015796266, -0.032448865, 0.049579673, 0.21404935, 0.107823774, -0.22215053, -0.06535876) * inp_7_1_0; + result2 += M4(-0.05690197, -0.11155782, 0.19012444, 0.026279641, -0.03171601, -0.07634178, 0.04033474, -0.07088044, 0.15690391, -0.09723734, 0.124490164, -0.072359726, 0.22667551, 0.0052638124, -0.012935682, -0.05421189) * inp_7_2_0; + result2 += M4(-0.013069922, -0.118209556, 0.004201549, -0.03968757, 0.19180593, 0.04374746, -0.07282215, 0.030352551, 0.30208516, -0.049557123, 0.12146452, -0.14485435, 0.112649664, -0.010713434, 0.1611247, -0.16300488) * inp_7_0_1; + result2 += M4(-0.031452656, 0.07456825, -0.0443281, 0.10157587, -0.018472794, 0.06993026, 0.059775315, -0.21900661, 0.1678983, -0.072115056, 0.10735342, -0.29979613, 0.17353845, 0.13813142, -0.18877776, -0.10629891) * inp_7_1_1; + result2 += M4(0.08179209, -0.047584996, 0.26713505, 0.22933918, 0.11315587, -0.09299391, -0.004207574, 0.106423035, 0.13896208, -0.14027683, 0.029845243, -0.052466318, 0.0036428093, -0.076062515, 0.0543791, 0.053804114) * inp_7_2_1; + result2 += M4(0.059942096, 0.011214699, -0.03698835, -0.02760338, 0.020503722, -0.03803051, -0.064014696, -0.08796878, 0.17849848, -0.06559597, -0.038528904, -0.13167964, 0.061552744, 0.03322383, 0.06599091, -0.040332813) * inp_7_0_2; + result2 += M4(-0.0050247153, -0.033658862, 0.083789095, 0.01603673, 0.039516848, 0.019611977, -0.017596444, -0.014390076, 0.24864224, -0.075751014, -0.0901808, -0.14308771, 0.12755138, -0.1403204, 0.033521403, -0.16512023) * inp_7_1_2; + result2 += M4(0.06304413, 0.19934912, 0.14972568, 0.07063272, -0.03589309, 0.03259011, 0.12179023, 0.01988989, 0.13880207, -0.04782535, 0.083721, -0.052201588, 0.14937533, -0.02124665, 0.046289448, -0.10333444) * inp_7_2_2; + result3 += M4(-0.014162571, 0.022528606, 
-0.021292126, 0.013722922, -0.026890505, 0.05631975, -0.10062739, -0.08847613, 0.08882607, 0.049216077, -0.118859775, -0.008137586, 0.10595997, 0.010337946, -0.07013328, -0.038930215) * inp_7_0_0; + result3 += M4(0.034575455, 0.08361816, -0.10919548, 0.17638136, 0.18224913, 0.046795767, 0.018567959, 0.14453304, 0.0335291, 0.050131854, -0.009804896, 0.06362119, 0.087263234, 0.07719271, 0.09225559, 0.23594186) * inp_7_1_0; + result3 += M4(0.049647845, -0.09350715, 0.034789413, -0.16308914, 0.0208552, 0.009179951, 0.0770476, -0.031192025, 0.17365715, 0.050686467, 0.036260754, 0.038846176, 0.26197204, -0.03973592, -0.016903615, 0.012020142) * inp_7_2_0; + result3 += M4(-0.026583632, 0.0013850909, 0.08024547, -0.031676076, 0.047013383, -0.022702007, -0.18380836, 0.09443742, 0.14200814, -0.037908416, 0.054748967, -0.10782969, 0.026259264, -0.017020205, 0.0017113617, -0.18204968) * inp_7_0_1; + result3 += M4(0.013689261, 0.18524802, -0.030867858, -0.05774088, 0.10711539, -0.09515505, 0.22342813, -0.094552, -0.15552238, -0.09500935, 0.012716829, 0.156438, -0.12898937, 0.16744038, 0.1940056, 0.1469972) * inp_7_1_1; + result3 += M4(0.37122875, -0.32382846, 0.028528692, -0.13682099, 0.010868172, 0.02463163, 0.030062033, -0.017400049, 0.17285028, -0.01587462, -0.119849585, -0.05350483, 0.39955628, -0.020757338, -0.06740248, -0.052394763) * inp_7_2_1; + result3 += M4(0.037440807, 0.022528477, -0.048126973, 0.00017738802, 0.017091148, -0.018729787, -0.0069110454, 0.011290475, 0.10123653, -0.0038787266, -0.062889926, -0.027114239, 0.15313332, -0.041154493, 0.17189945, -0.14410292) * inp_7_0_2; + result3 += M4(0.030311767, 0.18222551, 0.10998553, -0.08351889, -0.08203493, 0.0143294735, -0.007684832, -0.07510801, 0.05418675, 0.007856149, -0.15420091, -0.023835426, 0.13697478, -0.07019518, -0.042528722, 0.09751385) * inp_7_1_2; + result3 += M4(0.26491177, -0.112983905, -0.007609828, -0.12998493, 0.036402006, 0.007275075, 0.042161185, 0.09351155, 0.0003693852, 0.03934608, 
-0.010582391, -0.015830005, 0.014427005, 0.009677277, -0.06288287, 0.23942441) * inp_7_2_2; + result4 += M4(0.05266788, 0.027158823, -0.014034541, -0.009965593, 0.24604249, 0.012403979, -0.08652453, -0.020045457, 0.07192276, 0.050629944, -0.093924254, 0.024841465, -0.015011351, 0.15076591, -0.011793535, -0.014103332) * inp_7_0_0; + result4 += M4(-0.10568932, -0.03767174, -0.13513038, 0.0914478, 0.030558135, -0.0075513315, 0.09578352, 0.25301346, -0.1565884, 0.0038170163, 0.08188047, 0.15906128, -0.12059487, 0.0042721555, -0.06668525, 0.12577975) * inp_7_1_0; + result4 += M4(0.08938064, -0.044811964, -0.15163065, -0.040140662, -0.06713511, -0.018461373, 0.04495951, -0.094427675, -0.10349378, 0.025671815, -0.051892366, -0.06280779, -0.023974685, -0.05006379, 0.021145446, -0.11373016) * inp_7_2_0; + result4 += M4(-0.06279524, -0.026311915, 0.027277492, 0.060682897, 0.006103371, 0.09189192, -0.041464116, -0.0697834, -0.18994297, -0.011132484, -0.07862491, -0.024247596, -0.14507513, 0.09190709, 0.041282136, -0.113652304) * inp_7_0_1; + result4 += M4(0.3497865, -0.030769339, 0.12593327, -0.16335618, 0.0060147024, -0.1861027, 0.043191463, -0.04540035, 0.016091045, 0.08277523, 0.055683367, -0.006602088, -0.13116595, 0.039121456, -0.097923495, 0.1096506) * inp_7_1_1; + result4 += M4(-0.11811273, 0.26734427, -0.026286134, -0.053799637, 0.010350008, -0.08110212, -0.018327205, -0.102141015, 0.049078543, 0.065229535, -0.069745116, 0.11258639, 0.1404141, 0.11233924, 0.04683271, 0.021124389) * inp_7_2_1; + result4 += M4(-0.0010085531, -0.04498275, -0.04986057, -0.0040743, -0.013810281, -0.07274953, 0.0012835872, 0.018870972, 0.026488658, 0.08273377, 0.026578818, 0.090879664, -0.09691592, 0.12268741, -0.06423878, 0.054662813) * inp_7_0_2; + result4 += M4(-0.23530272, 0.029757394, -0.017722711, 0.072323896, 0.057143938, 0.023623768, 0.10339405, 0.057755485, -0.027147548, 0.017620232, 0.105267964, 6.799308e-05, -0.016083946, -0.14741136, -0.11125042, 0.13146009) * inp_7_1_2; + 
result4 += M4(-0.013640705, -0.14611275, -0.015377387, 0.06866489, -0.012629134, -0.10099124, -0.085796155, -0.047821183, 0.07384608, 0.016671525, -0.03840764, -0.039736804, -0.026625872, 0.10741123, 0.11415058, 0.06206821) * inp_7_2_2; + result5 += M4(0.05254084, -0.03618419, 0.023501085, 0.0056306478, -0.100311495, -0.13521314, 0.031401906, -0.08381413, 0.12670153, -0.016282525, -0.013178172, -0.08223539, 0.09254608, -0.034764078, -0.029238414, -0.013276624) * inp_7_0_0; + result5 += M4(0.06647183, -0.09633117, 0.12872927, -0.043654773, -0.033849824, 0.029661471, 0.018389048, -0.076479696, 0.13080731, 0.1384392, 0.0184105, -0.085272565, -0.0060437256, -0.07819326, 0.08589423, -0.0700786) * inp_7_1_0; + result5 += M4(-0.022850612, -0.044623993, 0.079330996, -0.009538862, 0.006363927, -0.046481546, 0.020831624, -0.003924319, 0.014489123, -0.11144054, 0.07664926, 0.087895356, 0.06953369, 0.06760292, 0.091705956, 0.17266676) * inp_7_2_0; + result5 += M4(-0.014408775, 0.02914897, -0.0033331045, -0.07358319, 0.0072816038, 0.08571597, 0.042665605, 0.043397482, -0.01727832, -0.1982741, 0.14628245, -0.16529793, -0.10693148, -0.20501375, -0.012105054, 0.03013684) * inp_7_0_1; + result5 += M4(-0.054995872, 0.07685547, -0.1569899, -0.0023547648, 0.058497522, 0.20743807, 0.14692727, 0.010326364, 0.12803675, 0.18334745, 0.033009302, -0.06388357, 0.18871413, 0.2798391, -0.027372744, -0.017254217) * inp_7_1_1; + result5 += M4(0.20483567, 0.114196286, 0.17187226, 0.09272362, -0.0058950544, -0.07003576, 0.04160463, 0.044610906, 0.030789075, -0.03595957, 0.029076457, 0.028777014, -0.14943944, -0.06678312, -0.06306165, 0.22895761) * inp_7_2_1; + result5 += M4(-0.023096116, -0.006917437, 0.0021108715, 0.041196633, -0.019993216, -0.001894041, -0.045894228, 0.024407577, 0.074497215, -0.06217066, -0.050677497, -0.013254962, 0.011975119, -0.11239947, 0.032038398, 0.13186377) * inp_7_0_2; + result5 += M4(0.01742654, -0.03852992, -0.03729594, 0.07947045, -0.048096783, -0.098710634, 
-0.01726188, 0.11849713, 0.017860059, 0.13130726, -0.0025118445, -0.05278241, 0.069821626, 0.15241168, -0.05023817, -0.08602724) * inp_7_1_2; + result5 += M4(-0.03396705, 0.2799761, -0.0929207, -0.066131175, -0.0460967, -0.016618725, 0.10093002, -0.01057141, 0.042762898, -0.0845663, 0.03090186, -0.014841956, -0.070289955, 0.013369748, 0.18829757, 0.119572245) * inp_7_2_2; + result6 += M4(-0.0071559725, 0.07536959, 0.00026839742, -0.016584475, -0.09725099, 0.1392313, -0.023261173, -0.11467251, 0.0905596, 0.054679852, 0.024681402, -0.16289128, 0.046488147, -0.11445065, 0.036976665, -0.07590544) * inp_7_0_0; + result6 += M4(-0.08670319, -0.041526556, -0.0941201, 0.037765447, 0.0046336106, 0.06339999, -0.066575885, -0.069352746, 0.040602203, -0.123128735, -0.01903979, -0.13627307, -0.0007248225, -0.017895356, -0.018853044, -0.11512713) * inp_7_1_0; + result6 += M4(-0.096611865, -0.11682056, -0.039424088, -0.030300787, 0.015231648, 0.0458185, 0.051526282, -0.06569795, 0.08748213, -0.0002701986, 0.05107693, -0.24146003, 0.049040336, 0.017540535, -0.024997583, -0.09934556) * inp_7_2_0; + result6 += M4(-0.035219774, -0.032697555, -0.059689417, 0.045763858, 0.0020797334, -0.01705579, 0.016583934, -0.20581028, -0.08171271, 0.09913759, 0.14018895, -0.26824296, -0.03941014, -0.0017919509, 0.12647048, -0.1974253) * inp_7_0_1; + result6 += M4(0.14142707, 0.105095565, -0.12100015, -0.17409892, -0.039365645, -0.14624794, 0.25097856, -0.19304596, 0.03673455, -0.07840369, 0.28851572, -0.2402052, -0.05521226, -0.20060153, 0.18241851, -0.37887594) * inp_7_1_1; + result6 += M4(-0.3049196, -0.0765604, -0.05726946, 0.04906905, -0.06441495, 0.090938956, -0.012081342, -0.11954974, 0.0015079661, 0.107147, 0.117364705, -0.32942018, -0.011466697, 0.26969522, 0.105870984, -0.17526019) * inp_7_2_1; + result6 += M4(0.014619589, -0.028079614, 0.02073476, -0.055835027, 0.048343558, -0.006500031, 0.0478469, -0.03542944, 0.10161081, -0.06341167, 0.064226255, -0.049521063, -0.03686742, 0.026317399, 
0.050769668, 0.03707769) * inp_7_0_2; + result6 += M4(-0.0149490535, -0.08933156, -0.1246248, -0.07752168, -0.0014393497, -0.032868005, 0.012045632, 0.07724925, 0.06565778, 0.059539903, 0.02893959, -0.01473295, -0.0524063, 0.08517658, 0.1877856, 0.04533674) * inp_7_1_2; + result6 += M4(-0.13004984, -0.15174131, -0.11309212, -0.15254354, -0.054834303, 0.021882122, -0.012051568, 0.008080886, -0.042497925, 0.0294425, 0.04106712, -0.09667882, 0.09549975, -0.017691262, 0.042142697, 0.022984017) * inp_7_2_2; + result7 += M4(-0.0077916672, -0.027966924, 0.03468131, -0.067923024, -0.057723507, 0.040405888, -0.21148612, -0.05582302, -0.0076574115, 0.0670587, -0.20746379, -0.042938404, -0.10752802, 0.021326538, 0.04150565, 0.04923152) * inp_7_0_0; + result7 += M4(0.08102916, -0.052608807, 0.09266592, -0.010365845, 0.114378475, -0.0505393, 0.022057299, -0.039993554, 0.08132919, -0.019973908, 0.040771905, -0.001818081, 0.073593006, -0.08648303, 0.08805889, 0.03136114) * inp_7_1_0; + result7 += M4(0.29631892, 0.05282411, -0.118613176, -0.15662101, -0.0065989047, 0.06710252, -0.06422556, -0.04665918, 0.012305429, 0.09719638, -0.13023031, 0.025091173, -0.055439446, 0.018266166, 0.027750297, -0.013691361) * inp_7_2_0; + result7 += M4(-0.020559523, -0.038350347, 0.033233337, 0.012717172, 0.035103276, -0.018585201, -0.102326125, -0.112207465, -0.061808314, 0.08301896, -0.2150042, -0.07788801, -0.015529255, -0.04170462, -0.03692421, -0.002797482) * inp_7_0_1; + result7 += M4(-0.052067265, 0.17229162, -0.11679125, -0.026611092, 0.033428237, 0.08556734, -0.746378, 0.037271217, 0.053675238, 0.19858685, -0.49936712, 0.13117796, -0.13473603, 0.017219624, -0.26075226, 0.17999813) * inp_7_1_1; + result7 += M4(-0.04627403, -0.16542645, -0.40278998, -0.01836751, -0.08184449, 0.03158726, 0.030242775, -0.06568364, 0.00017920652, 0.12186311, -0.20341, -0.046461523, -0.08162309, -0.012435354, -0.17582749, -0.055916633) * inp_7_2_1; + result7 += M4(0.03419231, -0.013769477, -0.057379484, 
-0.005457218, -0.02622803, 0.015990876, -0.004157733, 0.016983222, 0.023646917, 0.0027527115, -0.07274222, -0.016722947, -0.21292742, -0.03911355, 0.05032142, -0.052389875) * inp_7_0_2; + result7 += M4(-0.056231152, -0.03131215, -0.120435156, 0.055342045, 0.07679648, 0.049795173, 0.03567084, -0.03335904, 0.0040013855, 0.049628217, -0.067027554, 0.08025685, -0.122372925, 0.08895673, -0.240034, 0.15934667) * inp_7_1_2; + result7 += M4(0.06257615, -0.059765525, -0.0941319, 0.100090675, -0.051750794, -0.01381247, -0.078400746, -0.02342833, 0.029323364, 0.028017256, -0.046246424, -0.07830525, -0.15122958, 0.0084200865, 0.009015041, 0.012911715) * inp_7_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(4, 2); + imageStore(out_image, output_base + ivec2(0, 0), result0); + imageStore(out_image, output_base + ivec2(1, 0), result1); + imageStore(out_image, output_base + ivec2(2, 0), result2); + imageStore(out_image, output_base + ivec2(3, 0), result3); + imageStore(out_image, output_base + ivec2(0, 1), result4); + imageStore(out_image, output_base + ivec2(1, 1), result5); + imageStore(out_image, output_base + ivec2(2, 1), result6); + imageStore(out_image, output_base + ivec2(3, 1), result7); +} + +//!DESC ArtCNN C4F32 DS (Conv2D-6) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d +//!BIND conv2d_5 +//!SAVE conv2d_6 +//!WIDTH LUMA.w 1.0 * +//!HEIGHT LUMA.h 1.0 * +//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +const ivec2 ksize = ivec2(3, 3); +const ivec2 offset = ksize / 2; +const ivec2 wg_size = ivec2(gl_WorkGroupSize); +const ivec2 isize = wg_size + ksize - 1; +shared V4 inp[8][isize.y][isize.x]; +void hook() { + const uvec2 local_xy = gl_LocalInvocationID.xy; + 
ivec2 base = ivec2(gl_WorkGroupID) * wg_size; + for (uint y = local_xy.y; y < isize.y; y += wg_size.y) { + for (uint x = local_xy.x; x < isize.x; x += wg_size.x) { + const ivec2 input_base = (base + ivec2(x,y) - offset) * ivec2(4, 2); + inp[0][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 0), 0)); + inp[1][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 0), 0)); + inp[2][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(2, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(2, 0), 0)); + inp[3][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(3, 0), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(3, 0), 0)); + inp[4][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(0, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(0, 1), 0)); + inp[5][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(1, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(1, 1), 0)); + inp[6][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(2, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(2, 1), 0)); + inp[7][y][x] = V4(conv2d_5_mul * texelFetch(conv2d_5_raw, input_base + ivec2(3, 1), 0) + conv2d_mul * texelFetch(conv2d_raw, input_base + ivec2(3, 1), 0)); + } + } + + barrier(); + V4 result0 = V4(0.0959251, 0.09110822, 0.09650877, 0.09255176); + const V4 inp_0_0_0 = inp[0][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_0_1_0 = inp[0][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_0_2_0 = inp[0][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_0_0_1 = inp[0][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_0_1_1 = inp[0][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_0_2_1 = inp[0][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_0_0_2 = 
inp[0][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_0_1_2 = inp[0][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_0_2_2 = inp[0][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.0024803148, 0.0061496943, -0.012449193, 0.0073621483, -0.045883644, -0.028469354, -0.021872455, -0.013641374, 0.048815586, -0.027767755, 0.02023503, -0.019092541, -0.11619551, -0.008204599, -0.031663228, 0.004230975) * inp_0_0_0; + result0 += M4(-0.0154742785, 0.001580846, 0.030910095, 0.026366804, 0.014976256, -0.008040035, -0.0343701, -0.029946564, 0.00802191, 0.009333432, 0.0071688807, 0.03446165, -0.030649843, -0.09222414, -0.006500449, -0.03616832) * inp_0_1_0; + result0 += M4(0.0014083753, -0.020643668, 0.03291238, 0.031495478, -4.888124e-06, -0.016903343, 0.016248288, 0.0045557297, -0.020466309, 0.0124922125, 0.015675034, 0.009169885, -0.06222808, -0.11944605, -0.006970385, -0.0057183346) * inp_0_2_0; + result0 += M4(0.022844896, -0.022662897, 0.018163698, -0.02237418, 0.01051026, 0.047844805, -0.04638999, -0.005816182, -0.0094567975, 0.007950851, -0.017502684, -0.0014783115, 0.008181939, 0.049455367, 0.0035870285, 0.035811253) * inp_0_0_1; + result0 += M4(0.012149711, 0.002857962, -0.020723958, -0.014262196, -0.0731076, 0.016717864, 0.050864466, 0.039048813, -0.050111603, 0.032852042, 0.0264944, -0.070120804, 0.23030543, 0.21245444, 0.2514827, 0.21681325) * inp_0_1_1; + result0 += M4(0.00026614024, -0.014592406, -0.052835893, -0.009333221, 0.027286464, 0.01788344, -0.028332489, 0.012026034, 0.0195929, -0.057542615, -0.004489864, 0.027690006, 0.0017270166, -0.032714684, -0.020642947, -0.0243522) * inp_0_2_1; + result0 += M4(-0.003605971, -0.0037990278, 0.013443389, 0.0032558083, 0.014250842, -0.022822047, 0.088929966, 0.01906915, -0.0117064025, -0.012363594, -0.024934087, 0.015533799, 0.016953493, 0.021677295, -0.08007897, 0.0136948535) * inp_0_0_2; + result0 += M4(-0.010370639, 0.024111917, -0.0429522, -0.024620702, 0.044366717, 0.0014879879, -0.023410184, 0.0032722626, 
0.017069954, 0.01791276, -9.927996e-05, 0.03784902, 0.04688709, 0.05669612, 0.031083766, 0.02205755) * inp_0_1_2; + result0 += M4(-0.00498235, 0.02581799, 0.035523787, 0.0015227398, 0.0014288066, -0.0047221635, -0.0020985513, -0.023438053, 0.0022145351, 0.01736244, -0.023317814, -0.039515197, 0.015297988, -0.008451679, -0.02760897, -0.13545682) * inp_0_2_2; + const V4 inp_1_0_0 = inp[1][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_1_1_0 = inp[1][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_1_2_0 = inp[1][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_1_0_1 = inp[1][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_1_1_1 = inp[1][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_1_2_1 = inp[1][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_1_0_2 = inp[1][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_1_1_2 = inp[1][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_1_2_2 = inp[1][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.020167993, -0.011707798, 0.0052746953, -0.0025438035, -0.03900516, -0.027827376, -0.06808679, -0.016391763, -0.055144995, 0.009080459, -0.025470305, 0.0034430495, 0.019877076, -0.027499162, 0.01735567, -0.021593254) * inp_1_0_0; + result0 += M4(0.026026038, -0.016657133, 0.00051480625, 0.0027274373, 0.026398936, -0.020757765, -0.013426359, -0.027223574, 0.037935305, 0.056971017, -0.01697824, 0.000212611, 0.040871743, 0.02722182, -0.017228011, -0.030938586) * inp_1_1_0; + result0 += M4(0.012312127, 0.015262848, -0.015563217, 0.008229303, -0.019722743, 0.04133501, 0.01658207, 0.006229595, 0.011189575, -0.04199504, -0.0060323775, -0.010775301, 0.0057308204, -0.05988524, 0.03452266, -0.045770258) * inp_1_2_0; + result0 += M4(0.0072394228, -0.020105828, 0.021175856, -0.004134102, 0.055959962, 0.00492456, 0.058467004, 0.031046674, 0.045348175, 0.004603531, -0.022029502, -0.00011847204, -0.009968324, 0.015092161, -0.011953061, -0.016064638) * inp_1_0_1; + result0 += M4(0.028076487, 0.0035854043, -0.060402386, -0.029058471, -0.0072221295, 
0.057470273, 0.019654285, 0.0011732208, 0.003916707, -0.039282702, 0.09103609, 0.0022973546, 0.050179973, 0.058690213, 0.012151577, 0.065982126) * inp_1_1_1; + result0 += M4(-0.030709263, 0.014990504, 0.03154153, 0.05089986, -0.004910079, -0.055143367, -0.022346955, -0.004397486, -0.030800344, 0.005695878, 0.0035220806, 0.020010155, -0.050312437, 0.014153254, 0.00183779, 0.018095266) * inp_1_2_1; + result0 += M4(3.7243535e-05, -0.000986496, 0.04947859, -0.00044930333, -0.02260156, 0.004070056, -0.0068188934, -0.017675867, -0.0012635521, 0.010501988, 0.07379109, 0.0036660777, -0.010059596, 0.0070117684, 0.0008917458, -0.016142484) * inp_1_0_2; + result0 += M4(-0.034091663, 0.020721935, -0.0563292, -0.00031147193, 0.01600523, -0.00076478475, 0.011453966, 0.058299642, -0.0057894327, -0.030628685, -0.04329043, 0.0049181534, -0.052465882, -0.029118914, -0.015184712, 0.01648398) * inp_1_1_2; + result0 += M4(0.0127214035, -0.0010161864, 0.018413868, -0.023975352, -0.004263343, -0.003388053, 0.0046015806, -0.031919565, 0.00040597055, 0.02559611, -0.048390925, -0.034250475, 0.0027305828, -0.008735211, -0.017057508, 0.034712195) * inp_1_2_2; + const V4 inp_2_0_0 = inp[2][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_2_1_0 = inp[2][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_2_2_0 = inp[2][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_2_0_1 = inp[2][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_2_1_1 = inp[2][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_2_2_1 = inp[2][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_2_0_2 = inp[2][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_2_1_2 = inp[2][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_2_2_2 = inp[2][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.046517123, -0.03144731, -0.013003455, -0.0144427195, -0.026888411, -0.019632282, -0.0022917655, 0.023907091, -0.033237234, -0.03246015, -0.01762068, 0.008442245, 0.011746117, 0.009625908, -0.016068695, 0.014444248) * inp_2_0_0; + result0 += M4(-0.0017242148, 
0.036009163, 0.03872198, 0.08203957, -0.027689282, -0.034052547, -0.0530817, -0.00090698246, 0.0009306031, 0.015914964, -0.014899198, 0.013926757, 0.06857021, -0.004917596, 0.0026890791, -0.0064454577) * inp_2_1_0; + result0 += M4(0.0368235, -0.016642114, 0.0060480977, -0.014503015, -0.016500719, -0.01615307, -0.012411641, -0.04918024, 0.018010553, 0.03379412, 0.014476691, -0.0031881856, 0.0076076966, 0.09234624, -0.0150485765, 0.019926859) * inp_2_2_0; + result0 += M4(0.03721801, 0.04649571, 0.05185349, 0.016636897, 0.025164919, -0.082934745, 0.01659212, -0.037209753, -0.03874437, -0.05868011, -0.03918787, -0.029960385, -0.04982479, 0.047894415, -0.023677306, 0.005803603) * inp_2_0_1; + result0 += M4(0.014214814, -0.122045755, -0.04091448, -0.09923212, 0.1825342, 0.06708852, 0.21284619, 0.04525967, 0.016581232, 0.1308973, 0.06391266, 0.021281907, 0.10081535, -0.2297843, 0.20921506, -0.054864246) * inp_2_1_1; + result0 += M4(0.03683215, 0.085150585, 0.050251767, 0.03877321, -0.123000294, 0.0010182575, -0.12104044, 0.0381896, 0.030854423, -0.010185459, -0.014670957, -0.008536624, -0.0769851, 0.009933245, -0.0834486, 0.0030970199) * inp_2_2_1; + result0 += M4(-0.017967954, -0.018456286, -0.02938185, -0.02457528, 0.013047364, 0.03651452, 0.018712142, 0.0018768593, -0.014925934, -0.003460091, 0.014484092, -0.01407737, 0.01265772, 0.014692806, -0.008226725, 0.020290695) * inp_2_0_2; + result0 += M4(0.024245752, 0.006800942, -0.04863811, -0.051620487, 0.025180908, 0.012563389, 0.002786174, -0.09517265, 0.0048836106, -0.06677479, -0.019171556, 0.010917907, -0.008704971, 0.0060687275, 0.06200121, -0.038049277) * inp_2_1_2; + result0 += M4(-0.016914193, 0.0003756224, -0.0075365487, -0.007128756, -0.013107135, 0.016854344, -0.04599476, 0.04629266, 0.013610901, -0.007050954, 0.010291758, 0.004635868, -0.03869191, -0.010872149, -0.04360142, 0.022049412) * inp_2_2_2; + const V4 inp_3_0_0 = inp[3][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_3_1_0 = inp[3][local_xy.y + 
0][local_xy.x + 1]; + const V4 inp_3_2_0 = inp[3][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_3_0_1 = inp[3][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_3_1_1 = inp[3][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_3_2_1 = inp[3][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_3_0_2 = inp[3][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_3_1_2 = inp[3][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_3_2_2 = inp[3][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(-0.018057039, -0.0056532323, -0.004921754, -0.012813976, 0.09519288, 0.015642338, 0.034959156, 0.0061383033, -0.024794618, 0.0033005886, -0.02530454, 0.0104278, 0.0015168404, -0.011411513, -0.004112359, 0.0014673101) * inp_3_0_0; + result0 += M4(0.038401797, 0.005379411, 0.0070208795, -0.018810933, 0.17417842, 0.19247055, 0.12278762, 0.14103527, -0.006320876, 0.0024225677, -0.008491686, 0.004179332, 0.049641743, -0.026433079, 0.019399887, 0.0020980397) * inp_3_1_0; + result0 += M4(0.0012757385, 0.012202646, 0.0035623172, 0.018136656, 0.09881706, 0.15917927, 0.0151400855, 0.00028577476, 0.04524848, -0.041263968, -0.017249944, -0.033683904, -0.01698196, 0.028303217, 0.02324336, 0.028754951) * inp_3_2_0; + result0 += M4(-0.052198302, 0.04360304, -0.02999543, 0.0030104658, 0.18560326, 0.0930691, 0.18070237, 0.16930774, 0.02439472, -0.008087286, 0.03613677, -0.015432936, -0.04436675, 0.0016982829, 0.0010508823, 0.022050397) * inp_3_0_1; + result0 += M4(0.007704695, -0.020238692, 0.01664558, 0.062356647, 0.15066172, 0.21183403, 0.18684728, 0.18240704, 0.006795045, 0.014074486, -0.008198805, -0.011049521, 0.07712641, -0.040222466, -0.033840235, -0.029639326) * inp_3_1_1; + result0 += M4(-0.026629766, 0.00077255396, -0.029040106, 0.0016355875, 0.013167326, 0.056489877, 0.07705183, 0.14948712, -0.043355707, 0.038330242, 0.042948004, 0.074978165, -0.046013735, 0.012165618, 0.028225949, -0.062387478) * inp_3_2_1; + result0 += M4(0.010352451, 0.0042662695, -0.018839378, -0.012445232, 0.046970673, 0.059868846, 
0.1182908, 0.055844508, -0.0026135112, -0.013493774, -0.049471732, 0.008198826, 0.009780549, -0.0149789825, -0.027584512, 0.032418776) * inp_3_0_2; + result0 += M4(0.024346182, 0.0128713865, 0.016823815, -0.00078594836, 0.18802495, 0.15259756, 0.19018641, 0.111326836, 0.011781, -0.001944474, 0.0057664015, -0.005663143, -0.02084346, 0.037947528, 0.008893353, 0.016256006) * inp_3_1_2; + result0 += M4(-0.008431248, -0.003988211, -0.023087665, -0.014284694, 0.027970873, 0.04896214, 0.053775385, 0.1719036, -0.012696675, 0.006055201, 0.025086151, -0.030800432, -0.008749005, 0.013912466, -0.01604956, -0.013278638) * inp_3_2_2; + const V4 inp_4_0_0 = inp[4][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_4_1_0 = inp[4][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_4_2_0 = inp[4][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_4_0_1 = inp[4][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_4_1_1 = inp[4][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_4_2_1 = inp[4][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_4_0_2 = inp[4][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_4_1_2 = inp[4][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_4_2_2 = inp[4][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.027035957, -0.001727983, -0.038058687, 0.0019215011, -0.016602492, 0.04142214, -0.031124985, 0.008754783, 0.024437508, 0.023904093, -0.0073170806, 0.029633144, 0.053886887, -0.000786443, 0.0011853979, -0.0018102605) * inp_4_0_0; + result0 += M4(0.025673365, 0.0045333095, -0.023430139, 0.01593989, 0.017856536, -0.008548894, -0.009236777, 0.032396384, -0.037782874, -0.010345727, -0.0089425985, -0.025484724, -0.011748494, -0.019960396, 0.022057177, 0.010870722) * inp_4_1_0; + result0 += M4(-0.0132035995, -0.023796497, -0.0124581745, 0.025035223, -0.014144588, 0.011791141, 0.006945861, 0.010792054, 0.019469071, -0.030315429, 0.011015117, 0.029947242, 0.02119249, -0.03689373, 0.0088984305, -0.030573372) * inp_4_2_0; + result0 += M4(0.0023931018, -0.023345822, 0.040904418, 
-0.015035632, 0.01703145, 0.00425396, 0.0140907345, -0.0140721705, -0.027787715, 0.0075224033, 0.022050116, -0.026504023, -0.034039967, -0.003643743, -0.006023711, 0.039483856) * inp_4_0_1; + result0 += M4(-0.029590117, -0.021141862, 0.071957596, -0.0336122, -0.04172074, 0.024803123, -0.036530722, -0.040557653, 0.06285093, -0.021099618, -0.10349131, 0.0707771, -0.030481586, 0.036682453, 0.024502464, -0.061435662) * inp_4_1_1; + result0 += M4(0.011174801, 0.046214238, -0.0021442403, -0.029147811, 0.009365192, -0.029595075, 0.013788462, -0.0015760353, -0.04568219, 0.035792053, 0.05072393, -0.06544221, 0.023942366, 0.03853977, 0.022735637, 0.06610698) * inp_4_2_1; + result0 += M4(0.006338041, 0.020361701, -0.0067824423, -0.003947627, 0.032704953, -0.006698835, -0.0035317035, 0.0057447855, -0.0006970734, 0.008827609, 0.0139317615, 0.010289846, 0.01783806, 0.011726625, -0.004648798, -0.0010518747) * inp_4_0_2; + result0 += M4(-0.027534317, -0.002725158, -0.021682195, 0.009276546, 0.00465403, -0.020062914, 0.022039669, -0.02260507, 0.0144522535, 0.013655418, 0.061702747, -0.0226064, 0.008605401, -0.0073773633, -0.057404615, 0.019998875) * inp_4_1_2; + result0 += M4(-0.005678357, -0.0049298555, 0.0009996515, 0.02981446, 0.006154661, -0.012960902, 0.013703339, 0.008300753, -0.008354904, -0.028808627, -0.039570443, -0.00041028977, -0.03499294, -0.013585765, -0.017727628, -0.059121564) * inp_4_2_2; + const V4 inp_5_0_0 = inp[5][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_5_1_0 = inp[5][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_5_2_0 = inp[5][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_5_0_1 = inp[5][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_5_1_1 = inp[5][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_5_2_1 = inp[5][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_5_0_2 = inp[5][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_5_1_2 = inp[5][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_5_2_2 = inp[5][local_xy.y + 2][local_xy.x + 2]; + result0 += 
M4(0.04170388, -0.019529209, -0.018018834, -0.019438146, -0.02083078, -0.0033040587, 0.0100842295, -0.0050027166, -0.0003378173, 0.06727183, 0.04650859, 0.048375327, 0.038303796, 0.027663454, -0.039137155, 0.009171028) * inp_5_0_0; + result0 += M4(0.019982602, -0.0249459, -0.012751955, 0.0045725615, 0.01627793, -0.014319806, -0.014722928, 0.021963373, -0.011650147, -0.07553433, -0.011966025, 0.01771322, -0.007950032, -0.013973676, 0.006713495, 0.011459011) * inp_5_1_0; + result0 += M4(-0.014447713, 0.008614453, 0.011193385, 0.007141866, 0.009824456, -0.00089666364, -0.002548852, 0.007748586, -0.011388673, 0.020810105, -0.0060611335, 0.014017124, 0.0023328953, -0.01573938, 0.01285341, -0.01807662) * inp_5_2_0; + result0 += M4(0.056046084, -0.023535885, -0.068331786, 0.02717778, 0.017807333, 0.0019748374, -0.0068850107, 0.038708404, 0.04318588, 0.0015067973, -0.03975645, 0.015628079, -0.014467969, 0.04084449, -0.0070325895, 0.012846049) * inp_5_0_1; + result0 += M4(-0.027800586, -0.020602718, 0.029230159, 0.0044212798, -0.05378062, 0.0642442, 0.043125078, -0.083871625, -0.051508404, 0.016264955, 0.04234981, -0.08965283, -0.0052434076, -0.0038138004, 0.0007658168, -0.019944321) * inp_5_1_1; + result0 += M4(-0.03192375, 0.053306185, 0.0049367724, 0.022651577, -0.027063776, 0.012003454, 0.005051003, -0.016263183, 0.00873581, -0.031931564, 0.0043969397, -0.0099551575, -0.023384333, -0.027997399, -0.021852894, 0.022383798) * inp_5_2_1; + result0 += M4(-0.019426594, 0.034683526, 0.0296715, 0.010804579, -0.0040897997, -0.0060237497, -0.0071962196, -0.0019908044, -0.019693485, 0.01076535, 0.017219638, -0.018238243, -0.012853426, -0.016389381, 0.05436375, -0.0121085895) * inp_5_0_2; + result0 += M4(-0.03382291, 0.002641697, 0.0019049572, -0.028393315, 0.015440549, -0.0018384404, 0.011452913, 0.004228759, 0.0362448, -0.02262268, -0.060999524, 0.01705417, 0.001508362, -0.021008112, -0.030081322, -0.019391933) * inp_5_1_2; + result0 += M4(0.009400724, -0.009104288, 0.0203178, 
-0.028126992, 0.0034908918, -0.004305072, -0.010145071, -0.001757641, 0.006817819, 0.014272401, 0.008344729, 0.004703456, 0.025134873, 0.031027516, 0.024994971, 0.007308565) * inp_5_2_2; + const V4 inp_6_0_0 = inp[6][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_6_1_0 = inp[6][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_6_2_0 = inp[6][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_6_0_1 = inp[6][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_6_1_1 = inp[6][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_6_2_1 = inp[6][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_6_0_2 = inp[6][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_6_1_2 = inp[6][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_6_2_2 = inp[6][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.046216406, 0.04013223, 0.022637717, 0.037999507, -0.0044159004, -0.00794685, 0.024207864, 0.0025732666, 0.043559026, 0.03873699, 0.01724756, 0.038473018, 0.023778522, 0.031236663, 0.025550468, 0.012978487) * inp_6_0_0; + result0 += M4(-0.0077000028, 0.026568945, -0.032858387, -0.020589037, -0.012868758, 0.013613979, -0.0020443846, 0.02042987, -0.09788121, -0.087637395, 0.00041312847, 0.00019147444, 0.08031381, 0.03283401, 0.12233605, 0.110899396) * inp_6_1_0; + result0 += M4(-0.042462565, -0.054496534, -0.0042801765, -0.029539658, 0.01379497, 0.0046376577, -0.016495699, 0.025020067, 0.01520732, -0.018245175, -0.0032068873, -0.010169325, 0.04624384, 0.07442156, 0.022851434, 0.014711161) * inp_6_2_0; + result0 += M4(-0.024853684, -0.025812684, 0.017901164, -0.042111825, -0.025046045, 0.036586355, -0.017606065, 0.020700235, 0.054814752, 0.08914263, 0.07000427, 0.15368068, 0.014881902, 0.03106977, 0.0012084277, 0.044843007) * inp_6_0_1; + result0 += M4(0.049438998, 0.0050062365, 0.047619678, -0.019605236, 0.014014792, -0.028813789, 0.008099111, -0.019973837, -0.22015119, -0.18944478, -0.35285142, -0.33329636, -0.21391287, -0.16782136, -0.13154778, -0.12509756) * inp_6_1_1; + result0 += M4(-0.02102647, 
0.03372183, -0.048304737, 0.07164249, 0.026282452, -0.044945322, -0.013348963, -0.0110169565, -0.14309788, -0.12572491, -0.10030742, -0.08777088, -0.019639987, -0.03769315, -0.034074374, -0.010990223) * inp_6_2_1; + result0 += M4(-0.011997156, 0.0013695782, -0.045060657, -0.007001333, 0.01274352, 0.01616127, -0.0030261306, -0.011585007, 0.10423707, 0.10118122, 0.1123679, 0.11356589, 0.012429659, 0.018145185, 0.013008774, -0.0007892717) * inp_6_0_2; + result0 += M4(-0.00245833, -0.014636837, 0.05095593, 0.051648714, -0.012071569, -0.005331082, -0.00559285, 0.029061157, 0.20002998, 0.1608516, 0.15972093, 0.028499007, -0.017951163, -0.016680818, -0.015706625, -0.0057914127) * inp_6_1_2; + result0 += M4(0.01927152, -0.006052032, -0.008298531, -0.050855458, -0.011943485, 0.016552849, 0.027173173, -0.059561986, 0.022545243, 0.042098846, -0.0028235172, 0.035457514, -0.0149872275, -0.0134542575, 0.0010188918, 0.003915661) * inp_6_2_2; + const V4 inp_7_0_0 = inp[7][local_xy.y + 0][local_xy.x + 0]; + const V4 inp_7_1_0 = inp[7][local_xy.y + 0][local_xy.x + 1]; + const V4 inp_7_2_0 = inp[7][local_xy.y + 0][local_xy.x + 2]; + const V4 inp_7_0_1 = inp[7][local_xy.y + 1][local_xy.x + 0]; + const V4 inp_7_1_1 = inp[7][local_xy.y + 1][local_xy.x + 1]; + const V4 inp_7_2_1 = inp[7][local_xy.y + 1][local_xy.x + 2]; + const V4 inp_7_0_2 = inp[7][local_xy.y + 2][local_xy.x + 0]; + const V4 inp_7_1_2 = inp[7][local_xy.y + 2][local_xy.x + 1]; + const V4 inp_7_2_2 = inp[7][local_xy.y + 2][local_xy.x + 2]; + result0 += M4(0.01986294, 0.0013975124, -0.021860953, -0.023892097, 0.026175946, 0.0031710062, -0.0047705346, 0.010474724, 0.051030103, -0.0055353106, 0.00083526655, -0.0073956363, 0.006312569, -0.0132266125, 0.008836988, -0.0071050567) * inp_7_0_0; + result0 += M4(-0.026274044, -0.064851485, -0.0033733554, -0.015098632, 0.09444398, 0.07071972, 0.05556516, 0.07357374, 0.019003304, 0.056178555, -0.04381748, -0.035710856, 0.047391187, -0.009564349, 0.017872961, -0.008098228) * 
inp_7_1_0; + result0 += M4(0.029733414, -0.018371698, -0.0125034135, 0.02052616, -0.040687542, -0.020336702, -0.009098794, -0.018565234, 0.015604587, 0.02960498, -0.012892026, 0.0037323094, 0.00053185824, 0.0025688836, -0.008037344, 0.02582504) * inp_7_2_0; + result0 += M4(0.022677144, 0.024004947, 0.044669386, -0.018299077, 0.13872012, 0.011745517, 0.071726315, -0.044237614, 0.018301947, -0.008789172, 0.081117205, -0.03719678, -0.019320574, 0.015496215, -0.0009444586, 0.014418554) * inp_7_0_1; + result0 += M4(-0.04247576, 0.0041989894, 0.013913582, 0.100882426, 0.34981325, 0.4189776, 0.21993862, 0.3714919, -0.23627701, -0.061629415, 0.05012969, 0.23213203, 0.011181464, 0.04809275, -0.031068724, -0.013325444) * inp_7_1_1; + result0 += M4(-0.045233317, 0.028607037, 0.020917512, -0.05380463, -0.15105844, -0.016501931, -0.17456064, -0.13417023, -0.0028739634, -0.080853365, -0.00080034445, -0.02251335, -0.049287587, 0.0016940259, -0.0017634231, -0.041333154) * inp_7_2_1; + result0 += M4(0.015168607, 0.011885032, -0.02304455, -0.014429955, -0.08853672, -0.065099955, 0.025816185, -0.050758783, 0.024936106, 0.018456984, -0.00069481827, 0.001492164, -0.0069567575, -0.0025601152, 0.01969471, 0.0057533914) * inp_7_0_2; + result0 += M4(0.015999861, -0.018546596, 0.014207756, 0.033255726, -0.18008111, -0.21260013, 0.0057166554, -0.0055222693, 0.041074067, 0.01763359, -0.08603409, -0.051240996, 0.018637924, -0.03223119, -0.06413628, -0.022618188) * inp_7_1_2; + result0 += M4(0.008689513, 0.031285986, -0.0359882, -0.02487851, -0.15231301, -0.13464579, -0.1711299, -0.11705904, 0.043780815, 0.031348348, 0.016351987, -0.04400004, 0.013258273, 0.0038718034, 0.04604814, 0.025674326) * inp_7_2_2; + const ivec2 output_base = ivec2(gl_GlobalInvocationID) * ivec2(1, 1); + imageStore(out_image, output_base + ivec2(0, 0), result0); +} + +//!DESC ArtCNN C4F32 DS (Depth-To-Space) +//!COMPUTE 12 16 12 16 +//!HOOK LUMA +//!BIND conv2d_6 +//!WIDTH LUMA.w 2.0 * +//!HEIGHT LUMA.h 2.0 * 
+//!COMPONENTS 4 +//!WHEN OUTPUT.w LUMA.w / 1.3 > OUTPUT.h LUMA.h / 1.3 > * +#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable +#ifdef GL_EXT_shader_explicit_arithmetic_types_float16 +# define V4 f16vec4 +# define M4 f16mat4 +# define F float16_t +#else +# define V4 vec4 +# define M4 mat4 +# define F float +#endif + +void hook() { + vec4 result = vec4(0.0, 0.0, 0.0, 1.0); + vec2 f0 = fract(conv2d_6_pos * conv2d_6_size); + ivec2 i0 = ivec2(f0 * vec2(2.0)); + result.x = conv2d_6_tex((vec2(0.5) - f0) * conv2d_6_pt + conv2d_6_pos)[i0.y * 2 + i0.x]; + imageStore(out_image, ivec2(gl_GlobalInvocationID), clamp(result, 0.0, 1.0)); +}