ff53dcf560
* dotnet format style --severity info Some changes were manually reverted. * dotnet format analyzers --serverity info Some changes have been minimally adapted. * Restore a few unused methods and variables * Silence dotnet format IDE0060 warnings * Silence dotnet format IDE0052 warnings * Address or silence dotnet format IDE1006 warnings * Address or silence dotnet format CA2208 warnings * Address dotnet format CA1822 warnings * Address or silence dotnet format CA1069 warnings * Silence CA1806 and CA1834 issues * Address dotnet format CA1401 warnings * Fix new dotnet-format issues after rebase * Address review comments * Address dotnet format CA2208 warnings properly * Fix formatting for switch expressions * Address most dotnet format whitespace warnings * Apply dotnet format whitespace formatting A few of them have been manually reverted and the corresponding warning was silenced * Add previously silenced warnings back I have no clue how these disappeared * Revert formatting changes for OpCodeTable.cs * Enable formatting for a few cases again * Format if-blocks correctly * Enable formatting for a few more cases again * Fix inline comment alignment * Run dotnet format after rebase and remove unused usings - analyzers - style - whitespace * Disable 'prefer switch expression' rule * Add comments to disabled warnings * Remove a few unused parameters * Adjust namespaces * Simplify properties and array initialization, Use const when possible, Remove trailing commas * Start working on disabled warnings * Fix and silence a few dotnet-format warnings again * Address IDE0251 warnings * Address a few disabled IDE0060 warnings * Silence IDE0060 in .editorconfig * Revert "Simplify properties and array initialization, Use const when possible, Remove trailing commas" This reverts commit 9462e4136c0a2100dc28b20cf9542e06790aa67e. 
* dotnet format whitespace after rebase * First dotnet format pass * Remove unnecessary formatting exclusion * Add unsafe dotnet format changes * Change visibility of JitSupportDarwin to internal
124 lines
5.5 KiB
C#
124 lines
5.5 KiB
C#
// https://www.intel.com/content/dam/www/public/us/en/documents/white-papers/fast-crc-computation-generic-polynomials-pclmulqdq-paper.pdf
|
|
|
|
using ARMeilleure.IntermediateRepresentation;
|
|
using ARMeilleure.Translation;
|
|
using System;
|
|
using System.Diagnostics;
|
|
using static ARMeilleure.Instructions.InstEmitSimdHelper;
|
|
using static ARMeilleure.IntermediateRepresentation.Operand.Factory;
|
|
|
|
namespace ARMeilleure.Instructions
|
|
{
|
|
static class InstEmitHashHelper
|
|
{
|
|
/// <summary>
/// CRC-32 generator polynomial 0x04C11DB7 written in bit-reversed order.
/// </summary>
public const uint Crc32RevPoly = 0xedb88320;
|
|
/// <summary>
/// CRC-32C (Castagnoli) generator polynomial 0x1EDC6F41 written in bit-reversed order.
/// </summary>
public const uint Crc32cRevPoly = 0x82f63b78;
|
|
|
|
/// <summary>
/// Emits the operations for one CRC32 accumulation step, picking a strategy from the host
/// capabilities: the SSE4.2 CRC32 intrinsic (CRC32C only), a PCLMULQDQ based sequence, or a
/// call into <c>SoftFallback</c>.
/// </summary>
/// <param name="context">Emitter context that receives the generated operations.</param>
/// <param name="crc">Current CRC accumulator; must be an integer operand.</param>
/// <param name="value">Data folded into the CRC; must be an integer operand, and I64 when <paramref name="size"/> is 3.</param>
/// <param name="size">Data width selector in the range 0-3 (the b/h/w/x variants of the software fallback).</param>
/// <param name="castagnoli">True selects the CRC32C variants, false the plain CRC32 variants.</param>
/// <returns>The operand produced by the selected strategy.</returns>
/// <exception cref="ArgumentOutOfRangeException">
/// The software fallback was selected and <paramref name="size"/> is outside 0-3.
/// </exception>
public static Operand EmitCrc32(ArmEmitterContext context, Operand crc, Operand value, int size, bool castagnoli)
{
    Debug.Assert(crc.Type.IsInteger() && value.Type.IsInteger());
    Debug.Assert(size >= 0 && size <= 3);
    Debug.Assert(size < 3 || value.Type == OperandType.I64);

    // Strategy 1: hardware CRC32 instruction, only usable for the Castagnoli variant.
    if (castagnoli && Optimizations.UseSse42)
    {
        // The CRC32 instruction has no immediate form, so constants are copied first
        // to make sure both inputs end up in registers.
        if (value.Kind == OperandKind.Constant)
        {
            value = context.Copy(value);
        }

        if (crc.Kind == OperandKind.Constant)
        {
            crc = context.Copy(crc);
        }

        Intrinsic crcInst;

        switch (size)
        {
            case 0:
                crcInst = Intrinsic.X86Crc32_8;
                break;
            case 1:
                crcInst = Intrinsic.X86Crc32_16;
                break;
            default:
                crcInst = Intrinsic.X86Crc32;
                break;
        }

        if (size == 3)
        {
            // The 64-bit form yields an I64 result that is converted back to I32.
            Operand wideResult = context.AddIntrinsicLong(crcInst, crc, value);

            return context.ConvertI64ToI32(wideResult);
        }

        return context.AddIntrinsicInt(crcInst, crc, value);
    }

    // Strategy 2: carry-less multiplication based sequence.
    if (Optimizations.UsePclmulqdq)
    {
        if (size == 3)
        {
            return EmitCrc32Optimized64(context, crc, value, castagnoli);
        }

        return EmitCrc32Optimized(context, crc, value, castagnoli, size);
    }

    // Strategy 3: call the managed software implementation matching width and polynomial.
    string fallbackName;

    switch (size)
    {
        case 0:
            fallbackName = castagnoli ? nameof(SoftFallback.Crc32cb) : nameof(SoftFallback.Crc32b);
            break;
        case 1:
            fallbackName = castagnoli ? nameof(SoftFallback.Crc32ch) : nameof(SoftFallback.Crc32h);
            break;
        case 2:
            fallbackName = castagnoli ? nameof(SoftFallback.Crc32cw) : nameof(SoftFallback.Crc32w);
            break;
        case 3:
            fallbackName = castagnoli ? nameof(SoftFallback.Crc32cx) : nameof(SoftFallback.Crc32x);
            break;
        default:
            throw new ArgumentOutOfRangeException(nameof(size));
    }

    return context.Call(typeof(SoftFallback).GetMethod(fallbackName), crc, value);
}
|
|
|
|
/// <summary>
/// Emits a PCLMULQDQ based CRC32 step for data narrower than 64 bits.
/// </summary>
/// <param name="context">Emitter context that receives the generated operations.</param>
/// <param name="crc">Current CRC accumulator.</param>
/// <param name="data">Data to fold into the CRC.</param>
/// <param name="castagnoli">True selects the CRC32C constants, false the CRC32 constants.</param>
/// <param name="size">Data width selector; the data width in bits is <c>8 &lt;&lt; size</c>.</param>
/// <returns>An I32 operand extracted from element 2 of the final vector.</returns>
private static Operand EmitCrc32Optimized(ArmEmitterContext context, Operand crc, Operand data, bool castagnoli, int size)
{
    long mu;         // mu' = floor(x^64/P(x))'
    long polynomial; // P'(x) << 1

    if (castagnoli)
    {
        mu = 0x0DEA713F1;
        polynomial = 0x105EC76F0;
    }
    else
    {
        mu = 0x1F7011641;
        polynomial = 0x1DB710641;
    }

    int widthBits = 8 << size;
    int alignShift = 64 - widthBits;

    // Place the CRC in element 0 of an otherwise zero vector.
    Operand crcVec = context.VectorInsert(context.VectorZero(), crc, 0);

    // Do the same for the data, using the insert that matches its width.
    Operand dataVec = data;

    if (size == 0)
    {
        dataVec = context.VectorInsert8(context.VectorZero(), data, 0);
    }
    else if (size == 1)
    {
        dataVec = context.VectorInsert16(context.VectorZero(), data, 0);
    }
    else if (size == 2)
    {
        dataVec = context.VectorInsert(context.VectorZero(), data, 0);
    }

    // Mix data into the CRC and move the result to the top of the low 64-bit lane.
    Operand acc = context.AddIntrinsic(Intrinsic.X86Pxor, crcVec, dataVec);
    acc = context.AddIntrinsic(Intrinsic.X86Psllq, acc, Const(alignShift));

    // Two carry-less multiplies: first by mu, then by the polynomial.
    Operand muScalar = X86GetScalar(context, mu);
    acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, acc, muScalar, Const(0));

    Operand polyScalar = X86GetScalar(context, polynomial);
    acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, acc, polyScalar, Const(0));

    if (widthBits < 32)
    {
        // For 8 and 16-bit data, the byte-shifted original CRC is xor-ed back into the result.
        Operand shiftedCrc = context.AddIntrinsic(Intrinsic.X86Pslldq, crcVec, Const(alignShift / 8));
        acc = context.AddIntrinsic(Intrinsic.X86Pxor, acc, shiftedCrc);
    }

    return context.VectorExtract(OperandType.I32, acc, 2);
}
|
|
|
|
/// <summary>
/// Emits a PCLMULQDQ based CRC32 step for 64-bit data, done as two multiply rounds
/// (each a carry-less multiply by mu followed by one by the polynomial).
/// </summary>
/// <param name="context">Emitter context that receives the generated operations.</param>
/// <param name="crc">Current CRC accumulator.</param>
/// <param name="data">Data to fold into the CRC.</param>
/// <param name="castagnoli">True selects the CRC32C constants, false the CRC32 constants.</param>
/// <returns>An I32 operand extracted from element 2 of the final vector.</returns>
private static Operand EmitCrc32Optimized64(ArmEmitterContext context, Operand crc, Operand data, bool castagnoli)
{
    long mu;         // mu' = floor(x^64/P(x))'
    long polynomial; // P'(x) << 1

    if (castagnoli)
    {
        mu = 0x0DEA713F1;
        polynomial = 0x105EC76F0;
    }
    else
    {
        mu = 0x1F7011641;
        polynomial = 0x1DB710641;
    }

    // Place each input in element 0 of an otherwise zero vector.
    Operand crcVec = context.VectorInsert(context.VectorZero(), crc, 0);
    Operand dataVec = context.VectorInsert(context.VectorZero(), data, 0);

    // Mix data into the CRC, then shift the whole vector left by 4 bytes.
    Operand mixed = context.AddIntrinsic(Intrinsic.X86Pxor, crcVec, dataVec);
    Operand shifted = context.AddIntrinsic(Intrinsic.X86Pslldq, mixed, Const(4));

    // First round: multiply by mu, then by the polynomial (low quadwords).
    Operand muFirst = X86GetScalar(context, mu);
    Operand acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, shifted, muFirst, Const(0));

    Operand polyFirst = X86GetScalar(context, polynomial);
    acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, acc, polyFirst, Const(0));

    // Xor the shifted input back in and move each 64-bit lane up by 32 bits.
    acc = context.AddIntrinsic(Intrinsic.X86Pxor, acc, shifted);
    acc = context.AddIntrinsic(Intrinsic.X86Psllq, acc, Const(32));

    // Second round: selector 1 makes the mu multiply read the high quadword of the accumulator.
    Operand muSecond = X86GetScalar(context, mu);
    acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, acc, muSecond, Const(1));

    Operand polySecond = X86GetScalar(context, polynomial);
    acc = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, acc, polySecond, Const(0));

    return context.VectorExtract(OperandType.I32, acc, 2);
}
|
|
}
|
|
}
|