Coverage Report

Created: 2024-10-01 06:54

/src/Simd/src/Simd/SimdAvx512bwSynetConvolution8iDirect1x1.cpp
Line
Count
Source (jump to first uncovered line)
1
/*
2
* Simd Library (http://ermig1979.github.io/Simd).
3
*
4
* Copyright (c) 2011-2024 Yermalayeu Ihar.
5
*
6
* Permission is hereby granted, free of charge, to any person obtaining a copy
7
* of this software and associated documentation files (the "Software"), to deal
8
* in the Software without restriction, including without limitation the rights
9
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10
* copies of the Software, and to permit persons to whom the Software is
11
* furnished to do so, subject to the following conditions:
12
*
13
* The above copyright notice and this permission notice shall be included in
14
* all copies or substantial portions of the Software.
15
*
16
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22
* SOFTWARE.
23
*/
24
#include "Simd/SimdSynetConvolution8i.h"
25
#include "Simd/SimdSynetConvolution8iCommon.h"
26
#include "Simd/SimdSynet.h"
27
#include "Simd/SimdMath.h"
28
#include "Simd/SimdBase.h"
29
#include "Simd/SimdAvx512bw.h"
30
#include "Simd/SimdCpu.h"
31
32
namespace Simd
33
{
34
#if defined(SIMD_AVX512BW_ENABLE) && defined(SIMD_SYNET_ENABLE)  
35
    namespace Avx512bw
36
    {
37
        // Local shorthands for two types nested in SynetConvolution8iNhwcDirect, so the kernel
        // signatures below stay readable. (Their definitions are not visible in this listing.)
        using AlgParam = SynetConvolution8iNhwcDirect::AlgParam;
38
        using ConvolutionPtr = SynetConvolution8iNhwcDirect::ConvolutionPtr;
39
40
        //---------------------------------------------------------------------
41
42
        // Inner kernel of the direct 1x1 8-bit convolution (NHWC, per the function name).
        //
        // Handles up to M source positions ("rows") in one call; the M > 0x0 .. M > 0xB guards
        // allow M from 1 to 12. For every row it keeps one or two __m512i accumulators
        // (dX0 and, when dstC > F, dX1), walks the source channels 4 bytes at a time,
        // accumulates with Madd4 against the weight vectors w0/w1, and finally hands each
        // row's accumulators to Save1/Save2.
        //
        // Template parameters:
        //   term - forwarded to Save1/Save2 as their first template argument.
        //   type - activation type, forwarded to Save1/Save2 as their second template argument.
        //   M    - compile-time number of rows processed; rows >= M are skipped by the guards.
        //
        // Parameters:
        //   src0    - first source row; row k is read at src0 + k * dS, dS = p.srcC * p.strideX bytes.
        //   p       - convolution parameters; srcC, strideX, dstC and compatibility are read here.
        //   a       - algorithm parameters; size and upper are read here.
        //   srcC    - upper bound of the channel loop (bytes consumed per row, stepped by 4).
        //   dstC    - selects the two-accumulator path (dstC > F) or the one-accumulator path,
        //             and determines the tail mask passed to Save1/Save2.
        //   weight0 - weights for the first accumulator, read A bytes per loop step. Weights for
        //             the second accumulator start DivHi(p.srcC, 4) * A bytes further.
        //   norm, bias, params, scale, shift - forwarded unchanged to Save1/Save2.
        //   buf     - int32 partial sums; reloaded as the starting accumulators when first == 0,
        //             and passed to Save1/Save2. Row stride is dB = p.dstC elements.
        //   dst     - output pointer passed to Save1/Save2. Row stride is dD = p.dstC * a.size bytes.
        //   first   - non-zero: accumulators start from zero; zero: they are loaded from buf.
        //
        // NOTE(review): Set4, Madd4, Save1, Save2, TailMask16, DivHi, A and F are defined outside
        // this listing; statements about them below are limited to how they are called here.
        template<Term8iType term, SimdConvolutionActivationType type, int M> void ConvolutionNhwcDirect1x1_2xM(
43
            const uint8_t* src0, const ConvParam& p, const AlgParam& a, size_t srcC, size_t dstC, const int8_t* weight0,
44
            const __m512* norm, const __m512* bias, const __m512* params, const __m512* scale, const __m512* shift, int32_t* buf, uint8_t* dst, int first)
45
0
        {
46
0
            // dXY: accumulator for row X (0..B, hexadecimal) and output vector Y (0 or 1).
            // s0 holds the current source value, w0/w1 the current weight vectors.
            __m512i d00, d01, d10, d11, d20, d21, d30, d31, d40, d41, d50, d51, d60, d61, d70, d71, d80, d81, d90, d91, dA0, dA1, dB0, dB1, s0, w0, w1;
47
0
            // Strides: dS between source rows (bytes), dD between dst rows (bytes),
            // dB between buf rows (int32 elements). Note that dB (stride) is unrelated to dB0/dB1.
            size_t dS = p.srcC * p.strideX, dD = p.dstC * a.size, dB = p.dstC;
48
0
            // Weights of the second output vector follow the whole block used by the first one.
            const int8_t* weight1 = weight0 + DivHi(p.srcC, 4) * A;
49
0
            // Only six row pointers are kept; rows 6..11 are reached through src0..src5 plus
            // the extra offset offs6 = offs0 + 6 * dS inside the loops below.
            const uint8_t* src1 = src0 + 1 * dS;
50
0
            const uint8_t* src2 = src0 + 2 * dS;
51
0
            const uint8_t* src3 = src0 + 3 * dS;
52
0
            const uint8_t* src4 = src0 + 4 * dS;
53
0
            const uint8_t* src5 = src0 + 5 * dS;
54
0
            // a.upper broadcast to four 32-bit lanes; only forwarded to Save1/Save2.
            __m128i upper = _mm_set1_epi32(a.upper);
55
0
            // Two-accumulator path: each row produces output vectors at offsets 0 and F.
            if (dstC > F)
56
0
            {
57
0
                // Initialise the accumulators: zero on the first pass, otherwise resume from buf.
                if (first)
58
0
                {
59
0
                    if (M > 0x0) d00 = _mm512_setzero_si512(), d01 = _mm512_setzero_si512();
60
0
                    if (M > 0x1) d10 = _mm512_setzero_si512(), d11 = _mm512_setzero_si512();
61
0
                    if (M > 0x2) d20 = _mm512_setzero_si512(), d21 = _mm512_setzero_si512();
62
0
                    if (M > 0x3) d30 = _mm512_setzero_si512(), d31 = _mm512_setzero_si512();
63
0
                    if (M > 0x4) d40 = _mm512_setzero_si512(), d41 = _mm512_setzero_si512();
64
0
                    if (M > 0x5) d50 = _mm512_setzero_si512(), d51 = _mm512_setzero_si512();
65
0
                    if (M > 0x6) d60 = _mm512_setzero_si512(), d61 = _mm512_setzero_si512();
66
0
                    if (M > 0x7) d70 = _mm512_setzero_si512(), d71 = _mm512_setzero_si512();
67
0
                    if (M > 0x8) d80 = _mm512_setzero_si512(), d81 = _mm512_setzero_si512();
68
0
                    if (M > 0x9) d90 = _mm512_setzero_si512(), d91 = _mm512_setzero_si512();
69
0
                    if (M > 0xA) dA0 = _mm512_setzero_si512(), dA1 = _mm512_setzero_si512();
70
0
                    if (M > 0xB) dB0 = _mm512_setzero_si512(), dB1 = _mm512_setzero_si512();
71
0
                }
72
0
                else
73
0
                {
74
0
                    if (M > 0x0) d00 = _mm512_loadu_si512(buf + 0x0 * dB + 0), d01 = _mm512_loadu_si512(buf + 0x0 * dB + F);
75
0
                    if (M > 0x1) d10 = _mm512_loadu_si512(buf + 0x1 * dB + 0), d11 = _mm512_loadu_si512(buf + 0x1 * dB + F);
76
0
                    if (M > 0x2) d20 = _mm512_loadu_si512(buf + 0x2 * dB + 0), d21 = _mm512_loadu_si512(buf + 0x2 * dB + F);
77
0
                    if (M > 0x3) d30 = _mm512_loadu_si512(buf + 0x3 * dB + 0), d31 = _mm512_loadu_si512(buf + 0x3 * dB + F);
78
0
                    if (M > 0x4) d40 = _mm512_loadu_si512(buf + 0x4 * dB + 0), d41 = _mm512_loadu_si512(buf + 0x4 * dB + F);
79
0
                    if (M > 0x5) d50 = _mm512_loadu_si512(buf + 0x5 * dB + 0), d51 = _mm512_loadu_si512(buf + 0x5 * dB + F);
80
0
                    if (M > 0x6) d60 = _mm512_loadu_si512(buf + 0x6 * dB + 0), d61 = _mm512_loadu_si512(buf + 0x6 * dB + F);
81
0
                    if (M > 0x7) d70 = _mm512_loadu_si512(buf + 0x7 * dB + 0), d71 = _mm512_loadu_si512(buf + 0x7 * dB + F);
82
0
                    if (M > 0x8) d80 = _mm512_loadu_si512(buf + 0x8 * dB + 0), d81 = _mm512_loadu_si512(buf + 0x8 * dB + F);
83
0
                    if (M > 0x9) d90 = _mm512_loadu_si512(buf + 0x9 * dB + 0), d91 = _mm512_loadu_si512(buf + 0x9 * dB + F);
84
0
                    if (M > 0xA) dA0 = _mm512_loadu_si512(buf + 0xA * dB + 0), dA1 = _mm512_loadu_si512(buf + 0xA * dB + F);
85
0
                    if (M > 0xB) dB0 = _mm512_loadu_si512(buf + 0xB * dB + 0), dB1 = _mm512_loadu_si512(buf + 0xB * dB + F);
86
0
                }
87
0
                // The compatibility flags choose between Madd4<true> and Madd4<false>; the two
                // loops are otherwise identical.
                if (Base::Overflow(p.compatibility) || Base::Narrowed(p.compatibility))
88
0
                {
89
0
                    // One iteration consumes 4 source bytes per row and A bytes of each weight block.
                    for (size_t offs0 = 0, offs6 = offs0 + 6 * dS; offs0 < srcC; offs0 += 4, offs6 += 4)
90
0
                    {
91
0
                        w0 = _mm512_loadu_si512((__m512i*)weight0);
92
0
                        w1 = _mm512_loadu_si512((__m512i*)weight1);
93
0
                        if (M > 0x0) s0 = Set4(src0 + offs0), Madd4<true>(d00, s0, w0), Madd4<true>(d01, s0, w1);
94
0
                        if (M > 0x1) s0 = Set4(src1 + offs0), Madd4<true>(d10, s0, w0), Madd4<true>(d11, s0, w1);
95
0
                        if (M > 0x2) s0 = Set4(src2 + offs0), Madd4<true>(d20, s0, w0), Madd4<true>(d21, s0, w1);
96
0
                        if (M > 0x3) s0 = Set4(src3 + offs0), Madd4<true>(d30, s0, w0), Madd4<true>(d31, s0, w1);
97
0
                        if (M > 0x4) s0 = Set4(src4 + offs0), Madd4<true>(d40, s0, w0), Madd4<true>(d41, s0, w1);
98
0
                        if (M > 0x5) s0 = Set4(src5 + offs0), Madd4<true>(d50, s0, w0), Madd4<true>(d51, s0, w1);
99
0
                        if (M > 0x6) s0 = Set4(src0 + offs6), Madd4<true>(d60, s0, w0), Madd4<true>(d61, s0, w1);
100
0
                        if (M > 0x7) s0 = Set4(src1 + offs6), Madd4<true>(d70, s0, w0), Madd4<true>(d71, s0, w1);
101
0
                        if (M > 0x8) s0 = Set4(src2 + offs6), Madd4<true>(d80, s0, w0), Madd4<true>(d81, s0, w1);
102
0
                        if (M > 0x9) s0 = Set4(src3 + offs6), Madd4<true>(d90, s0, w0), Madd4<true>(d91, s0, w1);
103
0
                        if (M > 0xA) s0 = Set4(src4 + offs6), Madd4<true>(dA0, s0, w0), Madd4<true>(dA1, s0, w1);
104
0
                        if (M > 0xB) s0 = Set4(src5 + offs6), Madd4<true>(dB0, s0, w0), Madd4<true>(dB1, s0, w1);
105
0
                        weight0 += A, weight1 += A;
106
0
                    }
107
0
                }
108
0
                else
109
0
                {
110
0
                    for (size_t offs0 = 0, offs6 = offs0 + 6 * dS; offs0 < srcC; offs0 += 4, offs6 += 4)
111
0
                    {
112
0
                        w0 = _mm512_loadu_si512((__m512i*)weight0);
113
0
                        w1 = _mm512_loadu_si512((__m512i*)weight1);
114
0
                        if (M > 0x0) s0 = Set4(src0 + offs0), Madd4<false>(d00, s0, w0), Madd4<false>(d01, s0, w1);
115
0
                        if (M > 0x1) s0 = Set4(src1 + offs0), Madd4<false>(d10, s0, w0), Madd4<false>(d11, s0, w1);
116
0
                        if (M > 0x2) s0 = Set4(src2 + offs0), Madd4<false>(d20, s0, w0), Madd4<false>(d21, s0, w1);
117
0
                        if (M > 0x3) s0 = Set4(src3 + offs0), Madd4<false>(d30, s0, w0), Madd4<false>(d31, s0, w1);
118
0
                        if (M > 0x4) s0 = Set4(src4 + offs0), Madd4<false>(d40, s0, w0), Madd4<false>(d41, s0, w1);
119
0
                        if (M > 0x5) s0 = Set4(src5 + offs0), Madd4<false>(d50, s0, w0), Madd4<false>(d51, s0, w1);
120
0
                        if (M > 0x6) s0 = Set4(src0 + offs6), Madd4<false>(d60, s0, w0), Madd4<false>(d61, s0, w1);
121
0
                        if (M > 0x7) s0 = Set4(src1 + offs6), Madd4<false>(d70, s0, w0), Madd4<false>(d71, s0, w1);
122
0
                        if (M > 0x8) s0 = Set4(src2 + offs6), Madd4<false>(d80, s0, w0), Madd4<false>(d81, s0, w1);
123
0
                        if (M > 0x9) s0 = Set4(src3 + offs6), Madd4<false>(d90, s0, w0), Madd4<false>(d91, s0, w1);
124
0
                        if (M > 0xA) s0 = Set4(src4 + offs6), Madd4<false>(dA0, s0, w0), Madd4<false>(dA1, s0, w1);
125
0
                        if (M > 0xB) s0 = Set4(src5 + offs6), Madd4<false>(dB0, s0, w0), Madd4<false>(dB1, s0, w1);
126
0
                        weight0 += A, weight1 += A;
127
0
                    }
128
0
                }
129
0
                // Mask built from the channel count beyond the first F; passed to Save2.
                // NOTE(review): presumably it limits the second vector's store - confirm in Save2.
                __mmask16 tail = TailMask16(dstC - F);
130
0
                // FmaAvoid only selects the third template argument of Save2. Each call is followed
                // by advancing dst and buf to the next row.
                if (Base::FmaAvoid(p.compatibility))
131
0
                {
132
0
                    if (M > 0x0) Save2<term, type, true>(dst, buf, d00, d01, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
133
0
                    if (M > 0x1) Save2<term, type, true>(dst, buf, d10, d11, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
134
0
                    if (M > 0x2) Save2<term, type, true>(dst, buf, d20, d21, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
135
0
                    if (M > 0x3) Save2<term, type, true>(dst, buf, d30, d31, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
136
0
                    if (M > 0x4) Save2<term, type, true>(dst, buf, d40, d41, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
137
0
                    if (M > 0x5) Save2<term, type, true>(dst, buf, d50, d51, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
138
0
                    if (M > 0x6) Save2<term, type, true>(dst, buf, d60, d61, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
139
0
                    if (M > 0x7) Save2<term, type, true>(dst, buf, d70, d71, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
140
0
                    if (M > 0x8) Save2<term, type, true>(dst, buf, d80, d81, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
141
0
                    if (M > 0x9) Save2<term, type, true>(dst, buf, d90, d91, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
142
0
                    if (M > 0xA) Save2<term, type, true>(dst, buf, dA0, dA1, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
143
0
                    if (M > 0xB) Save2<term, type, true>(dst, buf, dB0, dB1, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
144
0
                }
145
0
                else
146
0
                {
147
0
                    if (M > 0x0) Save2<term, type, false>(dst, buf, d00, d01, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
148
0
                    if (M > 0x1) Save2<term, type, false>(dst, buf, d10, d11, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
149
0
                    if (M > 0x2) Save2<term, type, false>(dst, buf, d20, d21, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
150
0
                    if (M > 0x3) Save2<term, type, false>(dst, buf, d30, d31, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
151
0
                    if (M > 0x4) Save2<term, type, false>(dst, buf, d40, d41, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
152
0
                    if (M > 0x5) Save2<term, type, false>(dst, buf, d50, d51, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
153
0
                    if (M > 0x6) Save2<term, type, false>(dst, buf, d60, d61, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
154
0
                    if (M > 0x7) Save2<term, type, false>(dst, buf, d70, d71, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
155
0
                    if (M > 0x8) Save2<term, type, false>(dst, buf, d80, d81, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
156
0
                    if (M > 0x9) Save2<term, type, false>(dst, buf, d90, d91, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
157
0
                    if (M > 0xA) Save2<term, type, false>(dst, buf, dA0, dA1, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
158
0
                    if (M > 0xB) Save2<term, type, false>(dst, buf, dB0, dB1, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
159
0
                }
160
0
            }
161
0
            else
162
0
            {
163
0
                // One-accumulator path (dstC <= F): same structure as above, but only dX0 and w0
                // are used; dX1, w1 and weight1 are left untouched.
                if (first)
164
0
                {
165
0
                    if (M > 0x0) d00 = _mm512_setzero_si512();
166
0
                    if (M > 0x1) d10 = _mm512_setzero_si512();
167
0
                    if (M > 0x2) d20 = _mm512_setzero_si512();
168
0
                    if (M > 0x3) d30 = _mm512_setzero_si512();
169
0
                    if (M > 0x4) d40 = _mm512_setzero_si512();
170
0
                    if (M > 0x5) d50 = _mm512_setzero_si512();
171
0
                    if (M > 0x6) d60 = _mm512_setzero_si512();
172
0
                    if (M > 0x7) d70 = _mm512_setzero_si512();
173
0
                    if (M > 0x8) d80 = _mm512_setzero_si512();
174
0
                    if (M > 0x9) d90 = _mm512_setzero_si512();
175
0
                    if (M > 0xA) dA0 = _mm512_setzero_si512();
176
0
                    if (M > 0xB) dB0 = _mm512_setzero_si512();
177
0
                }
178
0
                else
179
0
                {
180
0
                    if (M > 0x0) d00 = _mm512_loadu_si512(buf + 0x0 * dB + 0);
181
0
                    if (M > 0x1) d10 = _mm512_loadu_si512(buf + 0x1 * dB + 0);
182
0
                    if (M > 0x2) d20 = _mm512_loadu_si512(buf + 0x2 * dB + 0);
183
0
                    if (M > 0x3) d30 = _mm512_loadu_si512(buf + 0x3 * dB + 0);
184
0
                    if (M > 0x4) d40 = _mm512_loadu_si512(buf + 0x4 * dB + 0);
185
0
                    if (M > 0x5) d50 = _mm512_loadu_si512(buf + 0x5 * dB + 0);
186
0
                    if (M > 0x6) d60 = _mm512_loadu_si512(buf + 0x6 * dB + 0);
187
0
                    if (M > 0x7) d70 = _mm512_loadu_si512(buf + 0x7 * dB + 0);
188
0
                    if (M > 0x8) d80 = _mm512_loadu_si512(buf + 0x8 * dB + 0);
189
0
                    if (M > 0x9) d90 = _mm512_loadu_si512(buf + 0x9 * dB + 0);
190
0
                    if (M > 0xA) dA0 = _mm512_loadu_si512(buf + 0xA * dB + 0);
191
0
                    if (M > 0xB) dB0 = _mm512_loadu_si512(buf + 0xB * dB + 0);
192
0
                }
193
0
                // Same Madd4<true>/Madd4<false> selection as in the two-accumulator path.
                if (Base::Overflow(p.compatibility) || Base::Narrowed(p.compatibility))
194
0
                {
195
0
                    for (size_t offs0 = 0, offs6 = offs0 + 6 * dS; offs0 < srcC; offs0 += 4, offs6 += 4)
196
0
                    {
197
0
                        w0 = _mm512_loadu_si512((__m512i*)weight0);
198
0
                        if (M > 0x0) s0 = Set4(src0 + offs0), Madd4<true>(d00, s0, w0);
199
0
                        if (M > 0x1) s0 = Set4(src1 + offs0), Madd4<true>(d10, s0, w0);
200
0
                        if (M > 0x2) s0 = Set4(src2 + offs0), Madd4<true>(d20, s0, w0);
201
0
                        if (M > 0x3) s0 = Set4(src3 + offs0), Madd4<true>(d30, s0, w0);
202
0
                        if (M > 0x4) s0 = Set4(src4 + offs0), Madd4<true>(d40, s0, w0);
203
0
                        if (M > 0x5) s0 = Set4(src5 + offs0), Madd4<true>(d50, s0, w0);
204
0
                        if (M > 0x6) s0 = Set4(src0 + offs6), Madd4<true>(d60, s0, w0);
205
0
                        if (M > 0x7) s0 = Set4(src1 + offs6), Madd4<true>(d70, s0, w0);
206
0
                        if (M > 0x8) s0 = Set4(src2 + offs6), Madd4<true>(d80, s0, w0);
207
0
                        if (M > 0x9) s0 = Set4(src3 + offs6), Madd4<true>(d90, s0, w0);
208
0
                        if (M > 0xA) s0 = Set4(src4 + offs6), Madd4<true>(dA0, s0, w0);
209
0
                        if (M > 0xB) s0 = Set4(src5 + offs6), Madd4<true>(dB0, s0, w0);
210
0
                        weight0 += A;
211
0
                    }
212
0
                }
213
0
                else
214
0
                {
215
0
                    for (size_t offs0 = 0, offs6 = offs0 + 6 * dS; offs0 < srcC; offs0 += 4, offs6 += 4)
216
0
                    {
217
0
                        w0 = _mm512_loadu_si512((__m512i*)weight0);
218
0
                        if (M > 0x0) s0 = Set4(src0 + offs0), Madd4<false>(d00, s0, w0);
219
0
                        if (M > 0x1) s0 = Set4(src1 + offs0), Madd4<false>(d10, s0, w0);
220
0
                        if (M > 0x2) s0 = Set4(src2 + offs0), Madd4<false>(d20, s0, w0);
221
0
                        if (M > 0x3) s0 = Set4(src3 + offs0), Madd4<false>(d30, s0, w0);
222
0
                        if (M > 0x4) s0 = Set4(src4 + offs0), Madd4<false>(d40, s0, w0);
223
0
                        if (M > 0x5) s0 = Set4(src5 + offs0), Madd4<false>(d50, s0, w0);
224
0
                        if (M > 0x6) s0 = Set4(src0 + offs6), Madd4<false>(d60, s0, w0);
225
0
                        if (M > 0x7) s0 = Set4(src1 + offs6), Madd4<false>(d70, s0, w0);
226
0
                        if (M > 0x8) s0 = Set4(src2 + offs6), Madd4<false>(d80, s0, w0);
227
0
                        if (M > 0x9) s0 = Set4(src3 + offs6), Madd4<false>(d90, s0, w0);
228
0
                        if (M > 0xA) s0 = Set4(src4 + offs6), Madd4<false>(dA0, s0, w0);
229
0
                        if (M > 0xB) s0 = Set4(src5 + offs6), Madd4<false>(dB0, s0, w0);
230
0
                        weight0 += A;
231
0
                    }
232
0
                }
233
0
                // Mask built from the whole dstC (there is no second vector here); passed to Save1.
                __mmask16 tail = TailMask16(dstC);
234
0
                if (Base::FmaAvoid(p.compatibility))
235
0
                {
236
0
                    if (M > 0x0) Save1<term, type, true>(dst, buf, d00, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
237
0
                    if (M > 0x1) Save1<term, type, true>(dst, buf, d10, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
238
0
                    if (M > 0x2) Save1<term, type, true>(dst, buf, d20, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
239
0
                    if (M > 0x3) Save1<term, type, true>(dst, buf, d30, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
240
0
                    if (M > 0x4) Save1<term, type, true>(dst, buf, d40, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
241
0
                    if (M > 0x5) Save1<term, type, true>(dst, buf, d50, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
242
0
                    if (M > 0x6) Save1<term, type, true>(dst, buf, d60, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
243
0
                    if (M > 0x7) Save1<term, type, true>(dst, buf, d70, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
244
0
                    if (M > 0x8) Save1<term, type, true>(dst, buf, d80, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
245
0
                    if (M > 0x9) Save1<term, type, true>(dst, buf, d90, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
246
0
                    if (M > 0xA) Save1<term, type, true>(dst, buf, dA0, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
247
0
                    if (M > 0xB) Save1<term, type, true>(dst, buf, dB0, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
248
0
                }
249
0
                else
250
0
                {
251
0
                    if (M > 0x0) Save1<term, type, false>(dst, buf, d00, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
252
0
                    if (M > 0x1) Save1<term, type, false>(dst, buf, d10, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
253
0
                    if (M > 0x2) Save1<term, type, false>(dst, buf, d20, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
254
0
                    if (M > 0x3) Save1<term, type, false>(dst, buf, d30, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
255
0
                    if (M > 0x4) Save1<term, type, false>(dst, buf, d40, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
256
0
                    if (M > 0x5) Save1<term, type, false>(dst, buf, d50, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
257
0
                    if (M > 0x6) Save1<term, type, false>(dst, buf, d60, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
258
0
                    if (M > 0x7) Save1<term, type, false>(dst, buf, d70, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
259
0
                    if (M > 0x8) Save1<term, type, false>(dst, buf, d80, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
260
0
                    if (M > 0x9) Save1<term, type, false>(dst, buf, d90, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
261
0
                    if (M > 0xA) Save1<term, type, false>(dst, buf, dA0, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
262
0
                    if (M > 0xB) Save1<term, type, false>(dst, buf, dB0, norm, bias, params, scale, shift, upper, tail), dst += dD, buf += dB;
263
0
                }
264
0
            }
265
0
        }
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 1>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 2>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 11>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10, 12>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
266
267
        typedef void(*ConvolutionNhwcDirect1x1_2xM_Ptr)(const uint8_t* src0, const ConvParam& p, const AlgParam& a, size_t srcC, size_t dstC,
268
            const int8_t* weight0, const __m512* norm, const __m512* bias, const __m512* params, const __m512* scale, const __m512* shift, int32_t* buf, uint8_t* dst, int first);
269
270
        // Returns the ConvolutionNhwcDirect1x1_2xM<term, type, M> kernel for a run-time value of M.
        //  - M == 0      : returns NULL (there is no kernel for an empty block).
        //  - M in 1..12  : returns the matching template instantiation.
        //  - otherwise   : triggers assert(0) and returns NULL.
        template<Term8iType term, SimdConvolutionActivationType type> ConvolutionNhwcDirect1x1_2xM_Ptr GetConvolutionNhwcDirect1x1_2xM(size_t M)
        {
            // Table indexed directly by M; slot 0 is intentionally empty.
            static const ConvolutionNhwcDirect1x1_2xM_Ptr kernels[] =
            {
                NULL,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x1>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x2>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x3>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x4>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x5>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x6>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x7>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x8>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0x9>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0xA>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0xB>,
                ConvolutionNhwcDirect1x1_2xM<term, type, 0xC>
            };
            const size_t count = sizeof(kernels) / sizeof(kernels[0]);
            if (M < count)
                return kernels[M];
            // Unsupported block size.
            assert(0);
            return NULL;
        }
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)3>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)3>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)2, (SimdConvolutionActivationType)0>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)4>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)4>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)5>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)5>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)6>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)6>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)7>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)7>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)8>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)8>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)9>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)9>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)0, (SimdConvolutionActivationType)10>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
Unexecuted instantiation: void (*Simd::Avx512bw::GetConvolutionNhwcDirect1x1_2xM<(Simd::Term8iType)1, (SimdConvolutionActivationType)10>(unsigned long))(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, signed char const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, float __vector(16) const*, int*, unsigned char*, int)
291
292
        template<Term8iType term, SimdConvolutionActivationType type> void ConvolutionNhwcDirect1x1_2(const uint8_t* src,
293
            const ConvParam& p, const AlgParam& a, size_t dstC, size_t yBeg, size_t yEnd, size_t srcC, const int8_t* weight,
294
            const float* norm, const float* bias, const float* params, const float* scale, const float* shift, int32_t* buf, uint8_t* dst, int first)
295
0
        {
296
0
            size_t n = 12, n1 = (yEnd - yBeg) * p.dstW, nn = AlignLoAny(n1, n), m = n1 - nn;
297
0
            ConvolutionNhwcDirect1x1_2xM_Ptr convolutionNhwcDirect1x1_2xN = GetConvolutionNhwcDirect1x1_2xM<term, type>(n);
298
0
            ConvolutionNhwcDirect1x1_2xM_Ptr convolutionNhwcDirect1x1_2xM = GetConvolutionNhwcDirect1x1_2xM<term, type>(m);
299
0
            __m512 _norm[2], _bias[2], _params[2], _scale[2], _shift[2];
300
0
            _params[0] = _mm512_set1_ps(params[0]);
301
0
            _params[1] = _mm512_set1_ps(params[1]);
302
0
            for (size_t dc = 0; dc < dstC; dc += DF)
303
0
            {
304
0
                size_t dC = Simd::Min(DF, dstC - dc);
305
0
                _norm[0] = _mm512_loadu_ps(norm + dc + 0);
306
0
                _norm[1] = _mm512_loadu_ps(norm + dc + F);
307
0
                _bias[0] = _mm512_loadu_ps(bias + dc + 0);
308
0
                _bias[1] = _mm512_loadu_ps(bias + dc + F);
309
0
                if (type == ::SimdConvolutionActivationPrelu)
310
0
                {
311
0
                    _params[0] = _mm512_loadu_ps(params + dc + 0);
312
0
                    _params[1] = _mm512_loadu_ps(params + dc + F);
313
0
                }
314
0
                _scale[0] = _mm512_loadu_ps(scale + dc + 0);
315
0
                _scale[1] = _mm512_loadu_ps(scale + dc + F);
316
0
                _shift[0] = _mm512_loadu_ps(shift + dc + 0);
317
0
                _shift[1] = _mm512_loadu_ps(shift + dc + F);
318
0
                const uint8_t* s = src + yBeg * p.srcW * p.srcC;
319
0
                uint8_t* d = dst + (dc + yBeg * p.dstW * p.dstC) * a.size;
320
0
                int32_t* b = buf + dc + yBeg * p.dstW * p.dstC;
321
0
                size_t i = 0;
322
0
                for (; i < nn; i += n, s += p.srcC * n, b += p.dstC * n, d += p.dstC * a.size * n)
323
0
                    convolutionNhwcDirect1x1_2xN(s, p, a, srcC, dC, weight, _norm, _bias, _params, _scale, _shift, b, d, first);
324
0
                for (; i < n1; i += m, s += p.srcC * m, b += p.dstC * m, d += p.dstC * a.size * m)
325
0
                    convolutionNhwcDirect1x1_2xM(s, p, a, srcC, dC, weight, _norm, _bias, _params, _scale, _shift, b, d, first);
326
0
                weight += DivHi(p.srcC, 4) * DA;
327
0
            }
328
0
        }
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)3>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)2, (SimdConvolutionActivationType)0>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)4>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)5>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)6>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)7>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)8>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)9>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)0, (SimdConvolutionActivationType)10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
Unexecuted instantiation: void Simd::Avx512bw::ConvolutionNhwcDirect1x1_2<(Simd::Term8iType)1, (SimdConvolutionActivationType)10>(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int)
329
330
        //---------------------------------------------------------------------
331
332
        template <Term8iType term, SimdConvolutionActivationType activation> void SetDirect1x1(const ConvParam& p, const AlgParam& a, ConvolutionPtr* d)
333
0
        {
334
0
            assert(a.microD == 2 * F && p.Is1x1() == true);
335
0
            d[term] = ConvolutionNhwcDirect1x1_2<term, activation>;
336
0
        }
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)3>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)3>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)2, (SimdConvolutionActivationType)0>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)4>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)4>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)5>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)5>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)6>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)6>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)7>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)7>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)8>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)8>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)9>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)9>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)0, (SimdConvolutionActivationType)10>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(Simd::Term8iType)1, (SimdConvolutionActivationType)10>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
337
338
        template<SimdConvolutionActivationType activation> void SetDirect1x1(const ConvParam& p, const AlgParam& a, ConvolutionPtr* d)
339
0
        {
340
0
            SetDirect1x1<Term8iLast8u, activation>(p, a, d);
341
0
            SetDirect1x1<Term8iLast32f, activation>(p, a, d);
342
0
            SetDirect1x1<Term8iInterim, SimdConvolutionActivationIdentity>(p, a, d);
343
0
        }
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)3>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)4>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)5>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)6>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)7>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)8>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)9>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
Unexecuted instantiation: void Simd::Avx512bw::SetDirect1x1<(SimdConvolutionActivationType)10>(Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, void (**)(unsigned char const*, Simd::ConvParam const&, Simd::Base::SynetConvolution8iNhwcDirect::AlgParam const&, unsigned long, unsigned long, unsigned long, unsigned long, signed char const*, float const*, float const*, float const*, float const*, float const*, int*, unsigned char*, int))
344
345
        void SetDirect1x1(const ConvParam& p, const AlgParam& a, ConvolutionPtr* d)
346
0
        {
347
0
            switch (p.activation)
348
0
            {
349
0
            case SimdConvolutionActivationIdentity: SetDirect1x1<SimdConvolutionActivationRestrictRange>(p, a, d); break;
350
0
            case SimdConvolutionActivationRelu: SetDirect1x1<SimdConvolutionActivationRestrictRange>(p, a, d); break;
351
0
            case SimdConvolutionActivationLeakyRelu: SetDirect1x1<SimdConvolutionActivationPrelu>(p, a, d); break;
352
0
            case SimdConvolutionActivationRestrictRange: SetDirect1x1<SimdConvolutionActivationRestrictRange>(p, a, d); break;
353
0
            case SimdConvolutionActivationPrelu: SetDirect1x1<SimdConvolutionActivationPrelu>(p, a, d); break;
354
0
            case SimdConvolutionActivationElu: SetDirect1x1<SimdConvolutionActivationElu>(p, a, d); break;
355
0
            case SimdConvolutionActivationHswish: SetDirect1x1<SimdConvolutionActivationHswish>(p, a, d); break;
356
0
            case SimdConvolutionActivationMish: SetDirect1x1<SimdConvolutionActivationMish>(p, a, d); break;
357
0
            case SimdConvolutionActivationHardSigmoid: SetDirect1x1<SimdConvolutionActivationHardSigmoid>(p, a, d); break;
358
0
            case SimdConvolutionActivationSwish: SetDirect1x1<SimdConvolutionActivationSwish>(p, a, d); break;
359
0
            case SimdConvolutionActivationGelu: SetDirect1x1<SimdConvolutionActivationGelu>(p, a, d); break;
360
0
            default: assert(0);
361
0
            }
362
0
        }
363
    }
364
#endif
365
}