using System; using System.Diagnostics; #if NETCOREAPP3_0_OR_GREATER using System.Runtime.Intrinsics; using System.Runtime.Intrinsics.X86; #endif using Org.BouncyCastle.Math.Raw; namespace Org.BouncyCastle.Math.EC.Custom.Sec { internal static class SecT409Field { private const ulong M25 = ulong.MaxValue >> 39; private const ulong M59 = ulong.MaxValue >> 5; #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Add(ReadOnlySpan x, ReadOnlySpan y, Span z) #else public static void Add(ulong[] x, ulong[] y, ulong[] z) #endif { z[0] = x[0] ^ y[0]; z[1] = x[1] ^ y[1]; z[2] = x[2] ^ y[2]; z[3] = x[3] ^ y[3]; z[4] = x[4] ^ y[4]; z[5] = x[5] ^ y[5]; z[6] = x[6] ^ y[6]; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void AddBothTo(ReadOnlySpan x, ReadOnlySpan y, Span z) #else public static void AddBothTo(ulong[] x, ulong[] y, ulong[] z) #endif { z[0] ^= x[0] ^ y[0]; z[1] ^= x[1] ^ y[1]; z[2] ^= x[2] ^ y[2]; z[3] ^= x[3] ^ y[3]; z[4] ^= x[4] ^ y[4]; z[5] ^= x[5] ^ y[5]; z[6] ^= x[6] ^ y[6]; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void AddExt(ReadOnlySpan xx, ReadOnlySpan yy, Span zz) #else public static void AddExt(ulong[] xx, ulong[] yy, ulong[] zz) #endif { for (int i = 0; i < 13; ++i) { zz[i] = xx[i] ^ yy[i]; } } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void AddOne(ReadOnlySpan x, Span z) #else public static void AddOne(ulong[] x, ulong[] z) #endif { z[0] = x[0] ^ 1UL; z[1] = x[1]; z[2] = x[2]; z[3] = x[3]; z[4] = x[4]; z[5] = x[5]; z[6] = x[6]; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void AddTo(ReadOnlySpan x, Span z) #else public static void AddTo(ulong[] x, ulong[] z) #endif { z[0] ^= x[0]; z[1] ^= x[1]; z[2] ^= x[2]; z[3] ^= x[3]; z[4] ^= x[4]; z[5] ^= x[5]; z[6] ^= x[6]; } public static ulong[] FromBigInteger(BigInteger x) { return Nat.FromBigInteger64(409, x); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void HalfTrace(ReadOnlySpan x, Span z) #else public static void HalfTrace(ulong[] x, ulong[] z) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[13]; #else ulong[] tt = Nat.Create64(13); #endif Nat448.Copy64(x, z); for (int i = 1; i < 409; i += 2) { ImplSquare(z, tt); Reduce(tt, z); ImplSquare(z, tt); Reduce(tt, z); AddTo(x, z); } } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Invert(ReadOnlySpan x, Span z) #else public static void Invert(ulong[] x, ulong[] z) #endif { if (Nat448.IsZero64(x)) throw new InvalidOperationException(); // Itoh-Tsujii inversion with bases { 2, 3 } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span t0 = stackalloc ulong[7]; Span t1 = stackalloc ulong[7]; Span t2 = stackalloc ulong[7]; #else ulong[] t0 = Nat448.Create64(); ulong[] t1 = Nat448.Create64(); ulong[] t2 = Nat448.Create64(); #endif Square(x, t0); // 3 | 408 SquareN(t0, 1, t1); Multiply(t0, t1, t0); SquareN(t1, 1, t1); Multiply(t0, t1, t0); // 2 | 136 SquareN(t0, 3, t1); Multiply(t0, t1, t0); // 2 | 68 SquareN(t0, 6, t1); Multiply(t0, t1, t0); // 2 | 34 SquareN(t0, 12, t1); Multiply(t0, t1, t2); // ! {2,3} | 17 SquareN(t2, 24, t0); SquareN(t0, 24, t1); Multiply(t0, t1, t0); // 2 | 8 SquareN(t0, 48, t1); Multiply(t0, t1, t0); // 2 | 4 SquareN(t0, 96, t1); Multiply(t0, t1, t0); // 2 | 2 SquareN(t0, 192, t1); Multiply(t0, t1, t0); Multiply(t0, t2, z); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Multiply(ReadOnlySpan x, ReadOnlySpan y, Span z) #else public static void Multiply(ulong[] x, ulong[] y, ulong[] z) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[14]; #else ulong[] tt = Nat448.CreateExt64(); #endif ImplMultiply(x, y, tt); Reduce(tt, z); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void MultiplyAddToExt(ReadOnlySpan x, ReadOnlySpan y, Span zz) #else public static void MultiplyAddToExt(ulong[] x, ulong[] y, ulong[] zz) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[14]; #else ulong[] tt = Nat448.CreateExt64(); #endif ImplMultiply(x, y, tt); AddExt(zz, tt, zz); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void MultiplyExt(ReadOnlySpan x, ReadOnlySpan y, Span zz) #else public static void MultiplyExt(ulong[] x, ulong[] y, ulong[] zz) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER zz[..14].Fill(0UL); #else Array.Clear(zz, 0, 10); #endif ImplMultiply(x, y, zz); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Reduce(ReadOnlySpan xx, Span z) #else public static void Reduce(ulong[] xx, ulong[] z) #endif { ulong x00 = xx[0], x01 = xx[1], x02 = xx[2], x03 = xx[3]; ulong x04 = xx[4], x05 = xx[5], x06 = xx[6], x07 = xx[7]; ulong u = xx[12]; x05 ^= (u << 39); x06 ^= (u >> 25) ^ (u << 62); x07 ^= (u >> 2); u = xx[11]; x04 ^= (u << 39); x05 ^= (u >> 25) ^ (u << 62); x06 ^= (u >> 2); u = xx[10]; x03 ^= (u << 39); x04 ^= (u >> 25) ^ (u << 62); x05 ^= (u >> 2); u = xx[9]; x02 ^= (u << 39); x03 ^= (u >> 25) ^ (u << 62); x04 ^= (u >> 2); u = xx[8]; x01 ^= (u << 39); x02 ^= (u >> 25) ^ (u << 62); x03 ^= (u >> 2); u = x07; x00 ^= (u << 39); x01 ^= (u >> 25) ^ (u << 62); x02 ^= (u >> 2); ulong t = x06 >> 25; z[0] = x00 ^ t; z[1] = x01 ^ (t << 23); z[2] = x02; z[3] = x03; z[4] = x04; z[5] = x05; z[6] = x06 & M25; } public static void Reduce39(ulong[] z, int zOff) { ulong z6 = z[zOff + 6], t = z6 >> 25; z[zOff ] ^= t; z[zOff + 1] ^= (t << 23); z[zOff + 6] = z6 & M25; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Sqrt(ReadOnlySpan x, Span z) #else public static void Sqrt(ulong[] x, ulong[] z) #endif { ulong c0 = Interleave.Unshuffle(x[0], x[1], out ulong e0); ulong c1 = Interleave.Unshuffle(x[2], x[3], out ulong e1); ulong c2 = Interleave.Unshuffle(x[4], x[5], out ulong e2); ulong c3 = Interleave.Unshuffle(x[6] , out ulong e3); z[0] = e0 ^ (c0 << 44); z[1] = e1 ^ (c1 << 44) ^ (c0 >> 20); z[2] = e2 ^ (c2 << 44) ^ (c1 >> 20); z[3] = e3 ^ (c3 << 44) ^ (c2 >> 20) ^ (c0 << 13); z[4] = (c3 >> 20) ^ (c1 << 13) ^ (c0 >> 51); z[5] = (c2 << 13) ^ (c1 >> 51); z[6] = (c3 << 13) ^ (c2 >> 51); Debug.Assert((c3 >> 51) == 0); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void Square(ReadOnlySpan x, Span z) #else public static void Square(ulong[] x, ulong[] z) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[13]; #else ulong[] tt = Nat.Create64(13); #endif ImplSquare(x, tt); Reduce(tt, z); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void SquareAddToExt(ReadOnlySpan x, Span zz) #else public static void SquareAddToExt(ulong[] x, ulong[] zz) #endif { #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[13]; #else ulong[] tt = Nat.Create64(13); #endif ImplSquare(x, tt); AddExt(zz, tt, zz); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void SquareExt(ReadOnlySpan x, Span zz) #else public static void SquareExt(ulong[] x, ulong[] zz) #endif { ImplSquare(x, zz); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static void SquareN(ReadOnlySpan x, int n, Span z) #else public static void SquareN(ulong[] x, int n, ulong[] z) #endif { Debug.Assert(n > 0); #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Span tt = stackalloc ulong[13]; #else ulong[] tt = Nat.Create64(13); #endif ImplSquare(x, tt); Reduce(tt, z); while (--n > 0) { ImplSquare(z, tt); Reduce(tt, z); } } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER public static uint Trace(ReadOnlySpan x) #else public static uint Trace(ulong[] x) #endif { // Non-zero-trace bits: 0 return (uint)(x[0]) & 1U; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER private static void ImplCompactExt(Span zz) #else private static void ImplCompactExt(ulong[] zz) #endif { ulong z00 = zz[ 0], z01 = zz[ 1], z02 = zz[ 2], z03 = zz[ 3], z04 = zz[ 4], z05 = zz[ 5], z06 = zz[ 6]; ulong z07 = zz[ 7], z08 = zz[ 8], z09 = zz[ 9], z10 = zz[10], z11 = zz[11], z12 = zz[12], z13 = zz[13]; zz[ 0] = z00 ^ (z01 << 59); zz[ 1] = (z01 >> 5) ^ (z02 << 54); zz[ 2] = (z02 >> 10) ^ (z03 << 49); zz[ 3] = (z03 >> 15) ^ (z04 << 44); zz[ 4] = (z04 >> 20) ^ (z05 << 39); zz[ 5] = (z05 >> 25) ^ (z06 << 34); zz[ 6] = (z06 >> 30) ^ (z07 << 29); zz[ 7] = (z07 >> 35) ^ (z08 << 24); zz[ 8] = (z08 >> 40) ^ (z09 << 19); zz[ 9] = (z09 >> 45) ^ (z10 << 14); zz[10] = (z10 >> 50) ^ (z11 << 9); zz[11] = (z11 >> 55) ^ (z12 << 4) ^ (z13 << 63); zz[12] = (z13 >> 1); //zz[13] = 0; } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER private static void ImplExpand(ReadOnlySpan x, Span z) #else private static void ImplExpand(ulong[] x, ulong[] z) #endif { ulong x0 = x[0], x1 = x[1], x2 = x[2], x3 = x[3], x4 = x[4], x5 = x[5], x6 = x[6]; z[0] = x0 & M59; z[1] = ((x0 >> 59) ^ (x1 << 5)) & M59; z[2] = ((x1 >> 54) ^ (x2 << 10)) & M59; z[3] = ((x2 >> 49) ^ (x3 << 15)) & M59; z[4] = ((x3 >> 44) ^ (x4 << 20)) & M59; z[5] = ((x4 >> 39) ^ (x5 << 25)) & M59; z[6] = ((x5 >> 34) ^ (x6 << 30)); } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER private static void ImplMultiply(ReadOnlySpan x, ReadOnlySpan y, Span zz) { Span a = stackalloc ulong[7], b = stackalloc ulong[7]; ImplExpand(x, a); ImplExpand(y, b); Span u = stackalloc ulong[8]; for (int i = 0; i < 7; ++i) { ImplMulwAcc(u, a[i], b[i], zz[(i << 1)..]); } ulong v0 = zz[0], v1 = zz[1]; v0 ^= zz[ 2]; zz[1] = v0 ^ v1; v1 ^= zz[ 3]; v0 ^= zz[ 4]; zz[2] = v0 ^ v1; v1 ^= zz[ 5]; v0 ^= zz[ 6]; zz[3] = v0 ^ v1; v1 ^= zz[ 7]; v0 ^= zz[ 8]; zz[4] = v0 ^ v1; v1 ^= zz[ 9]; v0 ^= zz[10]; zz[5] = v0 ^ v1; v1 ^= zz[11]; v0 ^= zz[12]; zz[6] = v0 ^ v1; v1 ^= zz[13]; ulong w = v0 ^ v1; zz[ 7] = zz[0] ^ w; zz[ 8] = zz[1] ^ w; zz[ 9] = zz[2] ^ w; zz[10] = zz[3] ^ w; zz[11] = zz[4] ^ w; zz[12] = zz[5] ^ w; zz[13] = zz[6] ^ w; ImplMulwAcc(u, a[0] ^ a[1], b[0] ^ b[1], zz[ 1..]); ImplMulwAcc(u, a[0] ^ a[2], b[0] ^ b[2], zz[ 2..]); ImplMulwAcc(u, a[0] ^ a[3], b[0] ^ b[3], zz[ 3..]); ImplMulwAcc(u, a[1] ^ a[2], b[1] ^ b[2], zz[ 3..]); ImplMulwAcc(u, a[0] ^ a[4], b[0] ^ b[4], zz[ 4..]); ImplMulwAcc(u, a[1] ^ a[3], b[1] ^ b[3], zz[ 4..]); ImplMulwAcc(u, a[0] ^ a[5], b[0] ^ b[5], zz[ 5..]); ImplMulwAcc(u, a[1] ^ a[4], b[1] ^ b[4], zz[ 5..]); ImplMulwAcc(u, a[2] ^ a[3], b[2] ^ b[3], zz[ 5..]); ImplMulwAcc(u, a[0] ^ a[6], b[0] ^ b[6], zz[ 6..]); ImplMulwAcc(u, a[1] ^ a[5], b[1] ^ b[5], zz[ 6..]); ImplMulwAcc(u, a[2] ^ a[4], b[2] ^ b[4], zz[ 6..]); ImplMulwAcc(u, a[1] ^ a[6], b[1] ^ b[6], zz[ 7..]); ImplMulwAcc(u, a[2] ^ a[5], b[2] ^ b[5], zz[ 7..]); ImplMulwAcc(u, a[3] ^ a[4], b[3] ^ b[4], zz[ 7..]); ImplMulwAcc(u, a[2] ^ a[6], b[2] ^ b[6], zz[ 8..]); ImplMulwAcc(u, a[3] ^ a[5], b[3] ^ b[5], zz[ 8..]); ImplMulwAcc(u, a[3] ^ a[6], b[3] ^ b[6], zz[ 9..]); ImplMulwAcc(u, a[4] ^ a[5], b[4] ^ b[5], zz[ 9..]); ImplMulwAcc(u, a[4] ^ a[6], b[4] ^ b[6], zz[10..]); ImplMulwAcc(u, a[5] ^ a[6], b[5] ^ b[6], zz[11..]); ImplCompactExt(zz); } #else private static void ImplMultiply(ulong[] x, ulong[] y, ulong[] zz) { ulong[] a = new ulong[7], b = new ulong[7]; ImplExpand(x, a); ImplExpand(y, b); ulong[] u = new ulong[8]; for (int i = 0; i < 7; ++i) { ImplMulwAcc(u, a[i], b[i], zz, i << 1); } ulong v0 = zz[0], v1 = zz[1]; v0 ^= zz[ 2]; zz[1] = v0 ^ v1; v1 ^= zz[ 3]; v0 ^= zz[ 4]; zz[2] = v0 ^ v1; v1 ^= zz[ 5]; v0 ^= zz[ 6]; zz[3] = v0 ^ v1; v1 ^= zz[ 7]; v0 ^= zz[ 8]; zz[4] = v0 ^ v1; v1 ^= zz[ 9]; v0 ^= zz[10]; zz[5] = v0 ^ v1; v1 ^= zz[11]; v0 ^= zz[12]; zz[6] = v0 ^ v1; v1 ^= zz[13]; ulong w = v0 ^ v1; zz[ 7] = zz[0] ^ w; zz[ 8] = zz[1] ^ w; zz[ 9] = zz[2] ^ w; zz[10] = zz[3] ^ w; zz[11] = zz[4] ^ w; zz[12] = zz[5] ^ w; zz[13] = zz[6] ^ w; ImplMulwAcc(u, a[0] ^ a[1], b[0] ^ b[1], zz, 1); ImplMulwAcc(u, a[0] ^ a[2], b[0] ^ b[2], zz, 2); ImplMulwAcc(u, a[0] ^ a[3], b[0] ^ b[3], zz, 3); ImplMulwAcc(u, a[1] ^ a[2], b[1] ^ b[2], zz, 3); ImplMulwAcc(u, a[0] ^ a[4], b[0] ^ b[4], zz, 4); ImplMulwAcc(u, a[1] ^ a[3], b[1] ^ b[3], zz, 4); ImplMulwAcc(u, a[0] ^ a[5], b[0] ^ b[5], zz, 5); ImplMulwAcc(u, a[1] ^ a[4], b[1] ^ b[4], zz, 5); ImplMulwAcc(u, a[2] ^ a[3], b[2] ^ b[3], zz, 5); ImplMulwAcc(u, a[0] ^ a[6], b[0] ^ b[6], zz, 6); ImplMulwAcc(u, a[1] ^ a[5], b[1] ^ b[5], zz, 6); ImplMulwAcc(u, a[2] ^ a[4], b[2] ^ b[4], zz, 6); ImplMulwAcc(u, a[1] ^ a[6], b[1] ^ b[6], zz, 7); ImplMulwAcc(u, a[2] ^ a[5], b[2] ^ b[5], zz, 7); ImplMulwAcc(u, a[3] ^ a[4], b[3] ^ b[4], zz, 7); ImplMulwAcc(u, a[2] ^ a[6], b[2] ^ b[6], zz, 8); ImplMulwAcc(u, a[3] ^ a[5], b[3] ^ b[5], zz, 8); ImplMulwAcc(u, a[3] ^ a[6], b[3] ^ b[6], zz, 9); ImplMulwAcc(u, a[4] ^ a[5], b[4] ^ b[5], zz, 9); ImplMulwAcc(u, a[4] ^ a[6], b[4] ^ b[6], zz, 10); ImplMulwAcc(u, a[5] ^ a[6], b[5] ^ b[6], zz, 11); ImplCompactExt(zz); } #endif #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER private static void ImplMulwAcc(Span u, ulong x, ulong y, Span z) #else private static void ImplMulwAcc(ulong[] u, ulong x, ulong y, ulong[] z, int zOff) #endif { Debug.Assert(x >> 59 == 0); Debug.Assert(y >> 59 == 0); #if NETCOREAPP3_0_OR_GREATER if (Org.BouncyCastle.Runtime.Intrinsics.X86.Pclmulqdq.IsEnabled) { var X = Vector128.CreateScalar(x); var Y = Vector128.CreateScalar(y); var Z = Pclmulqdq.CarrylessMultiply(X, Y, 0x00); ulong z0 = Z.GetElement(0); ulong z1 = Z.GetElement(1); z[0] ^= z0 & M59; z[1] ^= (z0 >> 59) ^ (z1 << 5); return; } #endif //u[0] = 0; u[1] = y; u[2] = u[1] << 1; u[3] = u[2] ^ y; u[4] = u[2] << 1; u[5] = u[4] ^ y; u[6] = u[3] << 1; u[7] = u[6] ^ y; uint j = (uint)x; ulong g, h = 0, l = u[(int)j & 7] ^ (u[(int)(j >> 3) & 7] << 3); int k = 54; do { j = (uint)(x >> k); g = u[(int)j & 7] ^ u[(int)(j >> 3) & 7] << 3; l ^= (g << k); h ^= (g >> -k); } while ((k -= 6) > 0); Debug.Assert(h >> 53 == 0); #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER z[0] ^= l & M59; z[1] ^= (l >> 59) ^ (h << 5); #else z[zOff ] ^= l & M59; z[zOff + 1] ^= (l >> 59) ^ (h << 5); #endif } #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER private static void ImplSquare(ReadOnlySpan x, Span zz) #else private static void ImplSquare(ulong[] x, ulong[] zz) #endif { zz[12] = Interleave.Expand32to64((uint)x[6]); #if NETCOREAPP3_0_OR_GREATER if (Org.BouncyCastle.Runtime.Intrinsics.X86.Bmi2.X64.IsEnabled) { zz[11] = Bmi2.X64.ParallelBitDeposit(x[5] >> 32, 0x5555555555555555UL); zz[10] = Bmi2.X64.ParallelBitDeposit(x[5] , 0x5555555555555555UL); zz[ 9] = Bmi2.X64.ParallelBitDeposit(x[4] >> 32, 0x5555555555555555UL); zz[ 8] = Bmi2.X64.ParallelBitDeposit(x[4] , 0x5555555555555555UL); zz[ 7] = Bmi2.X64.ParallelBitDeposit(x[3] >> 32, 0x5555555555555555UL); zz[ 6] = Bmi2.X64.ParallelBitDeposit(x[3] , 0x5555555555555555UL); zz[ 5] = Bmi2.X64.ParallelBitDeposit(x[2] >> 32, 0x5555555555555555UL); zz[ 4] = Bmi2.X64.ParallelBitDeposit(x[2] , 0x5555555555555555UL); zz[ 3] = Bmi2.X64.ParallelBitDeposit(x[1] >> 32, 0x5555555555555555UL); zz[ 2] = Bmi2.X64.ParallelBitDeposit(x[1] , 0x5555555555555555UL); zz[ 1] = Bmi2.X64.ParallelBitDeposit(x[0] >> 32, 0x5555555555555555UL); zz[ 0] = Bmi2.X64.ParallelBitDeposit(x[0] , 0x5555555555555555UL); return; } #endif #if NETCOREAPP2_1_OR_GREATER || NETSTANDARD2_1_OR_GREATER Interleave.Expand64To128(x[..6], zz[..12]); #else Interleave.Expand64To128(x, 0, 6, zz, 0); #endif } } }