Searched refs:loadu_128 (Results 1 – 2 of 2) sorted by relevance
13 INLINE uint32x4_t loadu_128(const uint8_t src[16]) { in loadu_128() function200 out[0] = loadu_128(&inputs[0][block_offset + 0 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()201 out[1] = loadu_128(&inputs[1][block_offset + 0 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()202 out[2] = loadu_128(&inputs[2][block_offset + 0 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()203 out[3] = loadu_128(&inputs[3][block_offset + 0 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()204 out[4] = loadu_128(&inputs[0][block_offset + 1 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()205 out[5] = loadu_128(&inputs[1][block_offset + 1 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()206 out[6] = loadu_128(&inputs[2][block_offset + 1 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()207 out[7] = loadu_128(&inputs[3][block_offset + 1 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()208 out[8] = loadu_128(&inputs[0][block_offset + 2 * sizeof(uint32x4_t)]); in transpose_msg_vecs4()[all …]
9 INLINE __m128i loadu_128(const uint8_t src[16]) { in loadu_128() function119 rows[0] = loadu_128((uint8_t *)&cv[0]); in compress_pre()120 rows[1] = loadu_128((uint8_t *)&cv[4]); in compress_pre()125 __m128i m0 = loadu_128(&block[sizeof(__m128i) * 0]); in compress_pre()126 __m128i m1 = loadu_128(&block[sizeof(__m128i) * 1]); in compress_pre()127 __m128i m2 = loadu_128(&block[sizeof(__m128i) * 2]); in compress_pre()128 __m128i m3 = loadu_128(&block[sizeof(__m128i) * 3]); in compress_pre()295 storeu_128(xor_128(rows[2], loadu_128((uint8_t *)&cv[0])), &out[32]); in blake3_compress_xof_avx512()296 storeu_128(xor_128(rows[3], loadu_128((uint8_t *)&cv[4])), &out[48]); in blake3_compress_xof_avx512()454 out[0] = loadu_128(&inputs[0][block_offset + 0 * sizeof(__m128i)]); in transpose_msg_vecs4()[all …]