/// <summary>
/// Wrapper named after the Intel intrinsic <c>_mm_clmulepi64_si128</c>.
/// Passes both operands through <c>v64u</c> and forwards them, together with
/// <paramref name="imm8"/>, to <c>CarrylessMultiply</c>.
/// </summary>
/// <param name="a">First operand.</param>
/// <param name="b">Second operand.</param>
/// <param name="imm8">Immediate control byte handed unchanged to <c>CarrylessMultiply</c>.</param>
/// <returns>The result of <c>CarrylessMultiply</c>, converted to <c>__m128i</c>.</returns>
public static __m128i _mm_clmulepi64_si128(__m128i a, __m128i b, byte imm8)
{
    // NOTE(review): v64u presumably reinterprets the register as two unsigned 64-bit lanes - confirm against its definition.
    var left = v64u(a);
    var right = v64u(b);
    return CarrylessMultiply(left, right, imm8);
}
/// <summary>
/// Wrapper named after the Intel intrinsic <c>_mm_abs_epi32</c>.
/// Passes <paramref name="a"/> through <c>v32i</c> and forwards it to <c>Abs</c>.
/// </summary>
/// <param name="a">Input register.</param>
/// <returns>
/// The result of <c>Abs</c> as <c>__m128i</c>, the same return type used by the
/// 8-bit and 16-bit <c>_mm_abs_*</c> wrappers, so the three overloads compose uniformly.
/// </returns>
// NOTE(review): v32i presumably reinterprets the register as four signed 32-bit lanes - confirm against its definition.
public static __m128i _mm_abs_epi32(__m128i a) => Abs(v32i(a));
/// <summary>
/// Wrapper named after the Intel intrinsic <c>_mm_abs_epi8</c>.
/// Passes <paramref name="a"/> through <c>v8i</c> and forwards it to <c>Abs</c>.
/// </summary>
/// <param name="a">Input register.</param>
/// <returns>The result of <c>Abs</c>, converted to <c>__m128i</c>.</returns>
public static __m128i _mm_abs_epi8(__m128i a)
{
    // NOTE(review): v8i presumably reinterprets the register as sixteen signed 8-bit lanes - confirm against its definition.
    var lanes = v8i(a);
    return Abs(lanes);
}
/// <summary>
/// Wrapper named after the Intel intrinsic <c>_mm_abs_epi16</c>.
/// Passes <paramref name="a"/> through <c>v16i</c> and forwards it to <c>Abs</c>.
/// </summary>
/// <param name="a">Input register.</param>
/// <returns>The result of <c>Abs</c>, converted to <c>__m128i</c>.</returns>
public static __m128i _mm_abs_epi16(__m128i a)
{
    // NOTE(review): v16i presumably reinterprets the register as eight signed 16-bit lanes - confirm against its definition.
    var lanes = v16i(a);
    return Abs(lanes);
}
/// <summary>
/// Wrapper named after the Intel intrinsic <c>_mm_shuffle_epi8</c>.
/// Passes both the data and the mask through <c>v8u</c> and forwards them to <c>Shuffle</c>.
/// </summary>
/// <param name="a">Data register.</param>
/// <param name="mask">Shuffle control register.</param>
/// <returns>The result of <c>Shuffle</c>, converted to <c>__m128i</c>.</returns>
public static __m128i _mm_shuffle_epi8(__m128i a, __m128i mask)
{
    // NOTE(review): v8u presumably reinterprets the register as sixteen unsigned 8-bit lanes - confirm against its definition.
    var data = v8u(a);
    var control = v8u(mask);
    return Shuffle(data, control);
}