avxvnniint16intrin.h - OpenGrok cross reference for /freebsd/contrib/llvm-project/clang/lib/Headers/avxvnniint16intrin.h

Lines Matching +full:- +full:j
1 /*===----------- avxvnniint16intrin.h - AVXVNNIINT16 intrinsics-------------===
5  * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7  *===-----------------------------------------------------------------------===
26 /// Multiply groups of 2 adjacent pairs of signed 16-bit integers in \a __A with
27 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
28 ///    signed 32-bit results. Sum these 2 results with the corresponding
29 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
40 ///    A 128-bit vector of [4 x int].
42 ///    A 128-bit vector of [8 x short].
44 ///    A 128-bit vector of [8 x unsigned short].
46 ///    A 128-bit vector of [4 x int].
49 /// FOR j := 0 to 3
50 /// 	tmp1.dword := SignExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
51 /// 	tmp2.dword := SignExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
52 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
63 /// Multiply groups of 2 adjacent pairs of signed 16-bit integers in \a __A with
64 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
65 ///    signed 32-bit results. Sum these 2 results with the corresponding
66 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
77 ///    A 256-bit vector of [8 x int].
79 ///    A 256-bit vector of [16 x short].
81 ///    A 256-bit vector of [16 x unsigned short].
83 ///    A 256-bit vector of [8 x int].
86 /// FOR j := 0 to 7
87 /// 	tmp1.dword := SignExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
88 /// 	tmp2.dword := SignExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
89 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
99 /// Multiply groups of 2 adjacent pairs of signed 16-bit integers in \a __A with
100 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
101 ///    signed 32-bit results. Sum these 2 results with the corresponding
102 ///    32-bit integer in \a __W with signed saturation, and store the packed
103 ///    32-bit results in \a dst.
114 ///    A 128-bit vector of [4 x int].
116 ///    A 128-bit vector of [8 x short].
118 ///    A 128-bit vector of [8 x unsigned short].
120 ///    A 128-bit vector of [4 x int].
123 /// FOR j := 0 to 3
124 /// 	tmp1.dword := SignExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
125 /// 	tmp2.dword := SignExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
126 /// 	dst.dword[j] := SIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)
137 /// Multiply groups of 2 adjacent pairs of signed 16-bit integers in \a __A with
138 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
139 ///    signed 32-bit results. Sum these 2 results with the corresponding
140 ///    32-bit integer in \a __W with signed saturation, and store the packed
141 ///    32-bit results in \a dst.
152 ///    A 256-bit vector of [8 x int].
154 ///    A 256-bit vector of [16 x short].
156 ///    A 256-bit vector of [16 x unsigned short].
158 ///    A 256-bit vector of [8 x int].
161 /// FOR j := 0 to 7
162 /// 	tmp1.dword := SignExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
163 /// 	tmp2.dword := SignExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
164 /// 	dst.dword[j] := SIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)
174 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
175 ///    corresponding signed 16-bit integers in \a __B, producing 2 intermediate
176 ///    signed 32-bit results. Sum these 2 results with the corresponding
177 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
188 ///    A 128-bit vector of [4 x int].
190 ///    A 128-bit vector of [8 x unsigned short].
192 ///    A 128-bit vector of [8 x short].
194 ///    A 128-bit vector of [4 x int].
197 /// FOR j := 0 to 3
198 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * SignExtend32(__B.word[2*j])
199 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * SignExtend32(__B.word[2*j+1])
200 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
211 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
212 ///    corresponding signed 16-bit integers in \a __B, producing 2 intermediate
213 ///    signed 32-bit results. Sum these 2 results with the corresponding
214 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
225 ///    A 256-bit vector of [8 x int].
227 ///    A 256-bit vector of [16 x unsigned short].
229 ///    A 256-bit vector of [16 x short].
231 ///    A 256-bit vector of [8 x int].
234 /// FOR j := 0 to 7
235 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * SignExtend32(__B.word[2*j])
236 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * SignExtend32(__B.word[2*j+1])
237 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
247 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
248 ///    corresponding signed 16-bit integers in \a __B, producing 2 intermediate
249 ///    signed 32-bit results. Sum these 2 results with the corresponding
250 ///    32-bit integer in \a __W with signed saturation, and store the packed
251 ///    32-bit results in \a dst.
262 ///    A 128-bit vector of [4 x int].
264 ///    A 128-bit vector of [8 x unsigned short].
266 ///    A 128-bit vector of [8 x short].
268 ///    A 128-bit vector of [4 x int].
271 /// FOR j := 0 to 3
272 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * SignExtend32(__B.word[2*j])
273 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * SignExtend32(__B.word[2*j+1])
274 /// 	dst.dword[j] := SIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)
285 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
286 ///    corresponding signed 16-bit integers in \a __B, producing 2 intermediate
287 ///    signed 32-bit results. Sum these 2 results with the corresponding
288 ///    32-bit integer in \a __W with signed saturation, and store the packed
289 ///    32-bit results in \a dst.
300 ///    A 256-bit vector of [8 x int].
302 ///    A 256-bit vector of [16 x unsigned short].
304 ///    A 256-bit vector of [16 x short].
306 ///    A 256-bit vector of [8 x int].
309 /// FOR j := 0 to 7
310 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * SignExtend32(__B.word[2*j])
311 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * SignExtend32(__B.word[2*j+1])
312 /// 	dst.dword[j] := SIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)
322 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
323 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
324 ///    unsigned 32-bit results. Sum these 2 results with the corresponding
325 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
336 ///    A 128-bit vector of [4 x unsigned int].
338 ///    A 128-bit vector of [8 x unsigned short].
340 ///    A 128-bit vector of [8 x unsigned short].
342 ///    A 128-bit vector of [4 x unsigned int].
345 /// FOR j := 0 to 3
346 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
347 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
348 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
359 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
360 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
361 ///    unsigned 32-bit results. Sum these 2 results with the corresponding
362 ///    32-bit integer in \a __W, and store the packed 32-bit results in \a dst.
373 ///    A 256-bit vector of [8 x unsigned int].
375 ///    A 256-bit vector of [16 x unsigned short].
377 ///    A 256-bit vector of [16 x unsigned short].
379 ///    A 256-bit vector of [8 x unsigned int].
382 /// FOR j := 0 to 7
383 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
384 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
385 /// 	dst.dword[j] := __W.dword[j] + tmp1 + tmp2
395 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
396 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
397 ///    unsigned 32-bit results. Sum these 2 results with the corresponding
398 ///    32-bit integer in \a __W with unsigned saturation, and store the packed
399 ///    32-bit results in \a dst.
410 ///    A 128-bit vector of [4 x unsigned int].
412 ///    A 128-bit vector of [8 x unsigned short].
414 ///    A 128-bit vector of [8 x unsigned short].
416 ///    A 128-bit vector of [4 x unsigned int].
419 /// FOR j := 0 to 3
420 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
421 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
422 /// 	dst.dword[j] := UNSIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)
433 /// Multiply groups of 2 adjacent pairs of unsigned 16-bit integers in \a __A with
434 ///    corresponding unsigned 16-bit integers in \a __B, producing 2 intermediate
435 ///    unsigned 32-bit results. Sum these 2 results with the corresponding
436 ///    32-bit integer in \a __W with unsigned saturation, and store the packed
437 ///    32-bit results in \a dst.
448 ///    A 256-bit vector of [8 x unsigned int].
450 ///    A 256-bit vector of [16 x unsigned short].
452 ///    A 256-bit vector of [16 x unsigned short].
454 ///    A 256-bit vector of [8 x unsigned int].
457 /// FOR j := 0 to 7
458 /// 	tmp1.dword := ZeroExtend32(__A.word[2*j]) * ZeroExtend32(__B.word[2*j])
459 /// 	tmp2.dword := ZeroExtend32(__A.word[2*j+1]) * ZeroExtend32(__B.word[2*j+1])
460 /// 	dst.dword[j] := UNSIGNED_DWORD_SATURATE(__W.dword[j] + tmp1 + tmp2)