-
Notifications
You must be signed in to change notification settings - Fork 4.8k
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Intel hardware intrinsic API change #27584
Comments
So far, the first two items (SSE4.2 STTNI intrinsic and 64-bit only intrinsic) needs more discussion for naming.
if (Popcnt.X64.IsSupported)
{
var res = Popcnt.X64.Popcnt(longVal);
...
} We think this is better than |
I think just |
Our personal opinions are heavily biased but the fact that already 3 discussion participants identified The point is that 3 discussion participants comprise 3/5 of whole group what should be alarming. |
X64 is no more ambiguous than the existing It is also already used elsewhere in .NET, alongside X86 in many cases, to differentiate in the same manner as we are trying to here (see https://source.dot.net/#q=X64 and https://source.dot.net/#q=X86) and in Roslyn (see http://source.roslyn.io/#q=X64 and http://source.roslyn.io/#q=X86) and other Microsoft products (the list could go on). |
I've requested another API review be scheduled to cover this and a few other questions. cc. @terrajobst |
For 3, the PR is here: dotnet/coreclr#20147 The current API in the PR is: public static class Vector64
{
public static unsafe Vector64<byte> Create(byte value);
public static unsafe Vector64<double> Create(double value);
public static unsafe Vector64<short> Create(short value);
public static unsafe Vector64<int> Create(int value);
public static unsafe Vector64<long> Create(long value);
public static unsafe Vector64<sbyte> Create(sbyte value);
public static unsafe Vector64<float> Create(float value);
public static unsafe Vector64<ushort> Create(ushort value);
public static unsafe Vector64<uint> Create(uint value);
public static unsafe Vector64<ulong> Create(ulong value);
public static unsafe Vector64<byte> Create(byte e0, byte e1, byte e2, byte e3, byte e4, byte e5, byte e6, byte e7);
public static unsafe Vector64<short> Create(short e0, short e1, short e2, short e3);
public static unsafe Vector64<int> Create(int e0, int e1);
public static unsafe Vector64<sbyte> Create(sbyte e0, sbyte e1, sbyte e2, sbyte e3, sbyte e4, sbyte e5, sbyte e6, sbyte e7);
public static unsafe Vector64<float> Create(float e0, float e1);
public static unsafe Vector64<ushort> Create(ushort e0, ushort e1, ushort e2, ushort e3);
public static unsafe Vector64<uint> Create(uint e0, uint e1);
public static unsafe Vector64<byte> CreateScalar(byte value);
public static unsafe Vector64<double> CreateScalar(double value);
public static unsafe Vector64<short> CreateScalar(short value);
public static unsafe Vector64<int> CreateScalar(int value);
public static unsafe Vector64<long> CreateScalar(long value);
public static unsafe Vector64<sbyte> CreateScalar(sbyte value);
public static unsafe Vector64<float> CreateScalar(float value);
public static unsafe Vector64<ushort> CreateScalar(ushort value);
public static unsafe Vector64<uint> CreateScalar(uint value);
public static unsafe Vector64<ulong> CreateScalar(ulong value);
}
public static partial struct Vector64<T>
{
public static Vector64<T> Zero { get; }
public Vector64<byte> AsByte();
public Vector64<double> AsDouble();
public Vector64<short> AsInt16();
public Vector64<int> AsInt32();
public Vector64<long> AsInt64();
public Vector64<sbyte> AsSByte();
public Vector64<float> AsSingle();
public Vector64<ushort> AsUInt16();
public Vector64<uint> AsUInt32();
public Vector64<ulong> AsUInt64();
public T AsScalar();
public T GetElement(int index);
public void SetElement(int index, T value);
}
public static class Vector128
{
public static unsafe Vector128<byte> Create(byte value);
public static unsafe Vector128<double> Create(double value);
public static unsafe Vector128<short> Create(short value);
public static unsafe Vector128<int> Create(int value);
public static unsafe Vector128<long> Create(long value);
public static unsafe Vector128<sbyte> Create(sbyte value);
public static unsafe Vector128<float> Create(float value);
public static unsafe Vector128<ushort> Create(ushort value);
public static unsafe Vector128<uint> Create(uint value);
public static unsafe Vector128<ulong> Create(ulong value);
public static unsafe Vector128<byte> Create(byte e0, byte e1, byte e2, byte e3, byte e4, byte e5, byte e6, byte e7, byte e8, byte e9, byte e10, byte e11, byte e12, byte e13, byte e14, byte e15);
public static unsafe Vector128<double> Create(double e0, double e1);
public static unsafe Vector128<short> Create(short e0, short e1, short e2, short e3, short e4, short e5, short e6, short e7);
public static unsafe Vector128<int> Create(int e0, int e1, int e2, int e3);
public static unsafe Vector128<long> Create(long e0, long e1);
public static unsafe Vector128<sbyte> Create(sbyte e0, sbyte e1, sbyte e2, sbyte e3, sbyte e4, sbyte e5, sbyte e6, sbyte e7, sbyte e8, sbyte e9, sbyte e10, sbyte e11, sbyte e12, sbyte e13, sbyte e14, sbyte e15);
public static unsafe Vector128<float> Create(float e0, float e1, float e2, float e3);
public static unsafe Vector128<ushort> Create(ushort e0, ushort e1, ushort e2, ushort e3, ushort e4, ushort e5, ushort e6, ushort e7);
public static unsafe Vector128<uint> Create(uint e0, uint e1, uint e2, uint e3);
public static unsafe Vector128<ulong> Create(ulong e0, ulong e1);
public static unsafe Vector128<T> Create<T>(Vector64<T> lower, Vector64<T> upper);
public static unsafe Vector128<byte> CreateScalar(byte value);
public static unsafe Vector128<double> CreateScalar(double value);
public static unsafe Vector128<short> CreateScalar(short value);
public static unsafe Vector128<int> CreateScalar(int value);
public static unsafe Vector128<long> CreateScalar(long value);
public static unsafe Vector128<sbyte> CreateScalar(sbyte value);
public static unsafe Vector128<float> CreateScalar(float value);
public static unsafe Vector128<ushort> CreateScalar(ushort value);
public static unsafe Vector128<uint> CreateScalar(uint value);
public static unsafe Vector128<ulong> CreateScalar(ulong value);
public static unsafe Vector128<T> CreateScalar<T>(Vector64<T> value);
}
public static partial struct Vector128<T>
{
public static Vector128<T> Zero { get; }
public Vector128<byte> AsByte();
public Vector128<double> AsDouble();
public Vector128<short> AsInt16();
public Vector128<int> AsInt32();
public Vector128<long> AsInt64();
public Vector128<sbyte> AsSByte();
public Vector128<float> AsSingle();
public Vector128<ushort> AsUInt16();
public Vector128<uint> AsUInt32();
public Vector128<ulong> AsUInt64();
public T AsScalar();
public T GetElement(int index);
public void SetElement(int index, T value);
public Vector64<T> GetLower();
public Vector64<T> GetUpper();
}
public static class Vector256
{
public static unsafe Vector256<byte> Create(byte value);
public static unsafe Vector256<double> Create(double value);
public static unsafe Vector256<short> Create(short value);
public static unsafe Vector256<int> Create(int value);
public static unsafe Vector256<long> Create(long value);
public static unsafe Vector256<sbyte> Create(sbyte value);
public static unsafe Vector256<float> Create(float value);
public static unsafe Vector256<ushort> Create(ushort value);
public static unsafe Vector256<uint> Create(uint value);
public static unsafe Vector256<ulong> Create(ulong value);
public static unsafe Vector256<byte> Create(byte e0, byte e1, byte e2, byte e3, byte e4, byte e5, byte e6, byte e7, byte e8, byte e9, byte e10, byte e11, byte e12, byte e13, byte e14, byte e15, byte e16, byte e17, byte e18, byte e19, byte e20, byte e21, byte e22, byte e23, byte e24, byte e25, byte e26, byte e27, byte e28, byte e29, byte e30, byte e31);
public static unsafe Vector256<double> Create(double e0, double e1, double e2, double e3);
public static unsafe Vector256<short> Create(short e0, short e1, short e2, short e3, short e4, short e5, short e6, short e7, short e8, short e9, short e10, short e11, short e12, short e13, short e14, short e15);
public static unsafe Vector256<int> Create(int e0, int e1, int e2, int e3, int e4, int e5, int e6, int e7);
public static unsafe Vector256<long> Create(long e0, long e1, long e2, long e3);
public static unsafe Vector256<sbyte> Create(sbyte e0, sbyte e1, sbyte e2, sbyte e3, sbyte e4, sbyte e5, sbyte e6, sbyte e7, sbyte e8, sbyte e9, sbyte e10, sbyte e11, sbyte e12, sbyte e13, sbyte e14, sbyte e15, sbyte e16, sbyte e17, sbyte e18, sbyte e19, sbyte e20, sbyte e21, sbyte e22, sbyte e23, sbyte e24, sbyte e25, sbyte e26, sbyte e27, sbyte e28, sbyte e29, sbyte e30, sbyte e31);
public static unsafe Vector256<float> Create(float e0, float e1, float e2, float e3, float e4, float e5, float e6, float e7);
public static unsafe Vector256<ushort> Create(ushort e0, ushort e1, ushort e2, ushort e3, ushort e4, ushort e5, ushort e6, ushort e7, ushort e8, ushort e9, ushort e10, ushort e11, ushort e12, ushort e13, ushort e14, ushort e15);
public static unsafe Vector256<uint> Create(uint e0, uint e1, uint e2, uint e3, uint e4, uint e5, uint e6, uint e7);
public static unsafe Vector256<ulong> Create(ulong e0, ulong e1, ulong e2, ulong e3);
public static unsafe Vector256<T> Create<T>(Vector128<T> lower, Vector128<T> upper);
public static unsafe Vector256<byte> CreateScalar(byte value);
public static unsafe Vector256<double> CreateScalar(double value);
public static unsafe Vector256<short> CreateScalar(short value);
public static unsafe Vector256<int> CreateScalar(int value);
public static unsafe Vector256<long> CreateScalar(long value);
public static unsafe Vector256<sbyte> CreateScalar(sbyte value);
public static unsafe Vector256<float> CreateScalar(float value);
public static unsafe Vector256<ushort> CreateScalar(ushort value);
public static unsafe Vector256<uint> CreateScalar(uint value);
public static unsafe Vector256<ulong> CreateScalar(ulong value);
public static unsafe Vector256<T> CreateScalar<T>(Vector128<T> value);
}
public static partial struct Vector256<T>
{
public static Vector256<T> Zero { get; }
public Vector256<byte> AsByte();
public Vector256<double> AsDouble();
public Vector256<short> AsInt16();
public Vector256<int> AsInt32();
public Vector256<long> AsInt64();
public Vector256<sbyte> AsSByte();
public Vector256<float> AsSingle();
public Vector256<ushort> AsUInt16();
public Vector256<uint> AsUInt32();
public Vector256<ulong> AsUInt64();
public T AsScalar();
public T GetElement(int index);
public void SetElement(int index, T value);
public Vector128<T> GetLower();
public Vector128<T> GetUpper();
} The open questions are:
|
For 2, the biggest question is the name. Is We also want to confirm that the nested
|
We will have an API review meeting at 11/6 to finalize the Intel hardware intrinsic APIs. There are three topics we need to go through in this review.
|
According to the second hw intrinsic API review meeting https://github.com/dotnet/apireviews/tree/master/2018/Hardware-Intrinsics-Intel, we need to change some intrinsic APIs and their implementation
StaticCast
and some other helpers into vector classes, and renameStaticCast
toAs
.The text was updated successfully, but these errors were encountered: