diff --git a/clang/lib/Sema/OpenCLBuiltins.td b/clang/lib/Sema/OpenCLBuiltins.td index 38e07b21cb85d5..72b72f60a662fc 100644 --- a/clang/lib/Sema/OpenCLBuiltins.td +++ b/clang/lib/Sema/OpenCLBuiltins.td @@ -59,6 +59,10 @@ def FuncExtKhrLocalInt32BaseAtomics : FunctionExtension<"cl_khr_local_int32 def FuncExtKhrLocalInt32ExtendedAtomics : FunctionExtension<"cl_khr_local_int32_extended_atomics">; def FuncExtKhrInt64BaseAtomics : FunctionExtension<"cl_khr_int64_base_atomics">; def FuncExtKhrInt64ExtendedAtomics : FunctionExtension<"cl_khr_int64_extended_atomics">; +def FuncExtKhrMipmapImage : FunctionExtension<"cl_khr_mipmap_image">; + +// Multiple extensions +def FuncExtKhrMipmapAndWrite3d : FunctionExtension<"cl_khr_mipmap_image cl_khr_3d_image_writes">; // Qualified Type. These map to ASTContext::QualType. class QualType { @@ -1179,3 +1183,176 @@ let MinVersion = CL20 in { def get_num_sub_groups : Builtin<"get_num_sub_groups", [UInt]>; } } + +//-------------------------------------------------------------------- +// End of the builtin functions defined in the OpenCL C specification. +// Builtin functions defined in the OpenCL C Extension are below. +//-------------------------------------------------------------------- + + +// OpenCL Extension v2.0 s9.18 - Mipmaps +let Extension = FuncExtKhrMipmapImage in { + // Added to section 6.13.14.2. + foreach aQual = ["RO"] in { + foreach imgTy = [Image2d] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + foreach name = ["read_imagei"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + foreach name = ["read_imageui"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + } + foreach imgTy = [Image2dDepth] in { + foreach name = ["read_imagef"] in { + def : Builtin, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + } + foreach imgTy = [Image1d] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, Float, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, Float, Float, Float], Attr.Pure>; + } + foreach name = ["read_imagei"] in { + def : Builtin, ImageType, Sampler, Float, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, Float, Float, Float], Attr.Pure>; + } + foreach name = ["read_imageui"] in { + def : Builtin, ImageType, Sampler, Float, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, Float, Float, Float], Attr.Pure>; + } + } + foreach imgTy = [Image3d] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + } + foreach name = ["read_imagei"] in { + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + } + foreach name = ["read_imageui"] in { + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + } + } + foreach imgTy = [Image1dArray] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float, Float], Attr.Pure>; + } + foreach name = ["read_imagei"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float, Float], Attr.Pure>; + } + foreach name = ["read_imageui"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, Float, Float], Attr.Pure>; + } + } + foreach imgTy = [Image2dArray] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + foreach name = ["read_imagei"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + foreach name = ["read_imageui"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + } + foreach imgTy = [Image2dArrayDepth] in { + foreach name = ["read_imagef"] in { + def : Builtin, ImageType, Sampler, VectorType, Float], Attr.Pure>; + def : Builtin, ImageType, Sampler, VectorType, VectorType, VectorType], Attr.Pure>; + } + } + } + // Added to section 6.13.14.4. + foreach aQual = ["WO"] in { + foreach imgTy = [Image2d] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imagei"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imageui"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + } + foreach imgTy = [Image2dDepth] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, Float]>; + } + } + foreach imgTy = [Image1d] in { + foreach name = ["write_imagef"] in { + def : Builtin, Int, Int, VectorType]>; + } + foreach name = ["write_imagei"] in { + def : Builtin, Int, Int, VectorType]>; + } + foreach name = ["write_imageui"] in { + def : Builtin, Int, Int, VectorType]>; + } + } + foreach imgTy = [Image1dArray] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imagei"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imageui"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + } + foreach imgTy = [Image2dArray] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imagei"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imageui"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + } + foreach imgTy = [Image2dArrayDepth] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, Float]>; + } + } + let Extension = FuncExtKhrMipmapAndWrite3d in { + foreach imgTy = [Image3d] in { + foreach name = ["write_imagef"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imagei"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + foreach name = ["write_imageui"] in { + def : Builtin, VectorType, Int, VectorType]>; + } + } + } + } + // Added to section 6.13.14.5 + foreach aQual = ["RO", "WO", "RW"] in { + foreach name = ["get_image_num_mip_levels"] in { + foreach imgTy = [Image1d, Image2d, Image3d, Image1dArray, Image2dArray, Image2dDepth, Image2dArrayDepth] in { + def : Builtin]>; + } + } + } +} diff --git a/llvm/include/llvm/CodeGen/GlobalISel/LegalizerHelper.h b/llvm/include/llvm/CodeGen/GlobalISel/LegalizerHelper.h index fbfe71255a387f..a09edff41bb97d 100644 --- a/llvm/include/llvm/CodeGen/GlobalISel/LegalizerHelper.h +++ b/llvm/include/llvm/CodeGen/GlobalISel/LegalizerHelper.h @@ -237,6 +237,8 @@ class LegalizerHelper { LegalizeResult lowerExtract(MachineInstr &MI); LegalizeResult lowerInsert(MachineInstr &MI); LegalizeResult lowerSADDO_SSUBO(MachineInstr &MI); + LegalizeResult lowerBswap(MachineInstr &MI); + LegalizeResult lowerBitreverse(MachineInstr &MI); private: MachineRegisterInfo &MRI; diff --git a/llvm/lib/CodeGen/GlobalISel/LegalizerHelper.cpp b/llvm/lib/CodeGen/GlobalISel/LegalizerHelper.cpp index 5e1d5d9b579b67..8e49db7b7fc574 100644 --- a/llvm/lib/CodeGen/GlobalISel/LegalizerHelper.cpp +++ b/llvm/lib/CodeGen/GlobalISel/LegalizerHelper.cpp @@ -1075,6 +1075,28 @@ LegalizerHelper::LegalizeResult LegalizerHelper::narrowScalar(MachineInstr &MI, MI.eraseFromParent(); return Legalized; } + case TargetOpcode::G_BSWAP: + case TargetOpcode::G_BITREVERSE: { + if (SizeOp0 % NarrowSize != 0) + return UnableToLegalize; + + Observer.changingInstr(MI); + SmallVector SrcRegs, DstRegs; + unsigned NumParts = SizeOp0 / NarrowSize; + extractParts(MI.getOperand(1).getReg(), NarrowTy, NumParts, SrcRegs); + + for (unsigned i = 0; i < NumParts; ++i) { + auto DstPart = MIRBuilder.buildInstr(MI.getOpcode(), {NarrowTy}, + {SrcRegs[NumParts - 1 - i]}); + DstRegs.push_back(DstPart.getReg(0)); + } + + MIRBuilder.buildMerge(MI.getOperand(0).getReg(), DstRegs); + + Observer.changedInstr(MI); + MI.eraseFromParent(); + return Legalized; + } } } @@ -2289,6 +2311,10 @@ LegalizerHelper::lower(MachineInstr &MI, unsigned TypeIdx, LLT Ty) { return lowerExtract(MI); case G_INSERT: return lowerInsert(MI); + case G_BSWAP: + return lowerBswap(MI); + case G_BITREVERSE: + return lowerBitreverse(MI); } } @@ -4326,3 +4352,79 @@ LegalizerHelper::lowerSADDO_SSUBO(MachineInstr &MI) { MI.eraseFromParent(); return Legalized; } + +LegalizerHelper::LegalizeResult +LegalizerHelper::lowerBswap(MachineInstr &MI) { + Register Dst = MI.getOperand(0).getReg(); + Register Src = MI.getOperand(1).getReg(); + const LLT Ty = MRI.getType(Src); + unsigned SizeInBytes = Ty.getSizeInBytes(); + unsigned BaseShiftAmt = (SizeInBytes - 1) * 8; + + // Swap most and least significant byte, set remaining bytes in Res to zero. + auto ShiftAmt = MIRBuilder.buildConstant(Ty, BaseShiftAmt); + auto LSByteShiftedLeft = MIRBuilder.buildShl(Ty, Src, ShiftAmt); + auto MSByteShiftedRight = MIRBuilder.buildLShr(Ty, Src, ShiftAmt); + auto Res = MIRBuilder.buildOr(Ty, MSByteShiftedRight, LSByteShiftedLeft); + + // Set i-th high/low byte in Res to i-th low/high byte from Src. + for (unsigned i = 1; i < SizeInBytes / 2; ++i) { + // AND with Mask leaves byte i unchanged and sets remaining bytes to 0. + APInt APMask(SizeInBytes * 8, 0xFF << (i * 8)); + auto Mask = MIRBuilder.buildConstant(Ty, APMask); + auto ShiftAmt = MIRBuilder.buildConstant(Ty, BaseShiftAmt - 16 * i); + // Low byte shifted left to place of high byte: (Src & Mask) << ShiftAmt. + auto LoByte = MIRBuilder.buildAnd(Ty, Src, Mask); + auto LoShiftedLeft = MIRBuilder.buildShl(Ty, LoByte, ShiftAmt); + Res = MIRBuilder.buildOr(Ty, Res, LoShiftedLeft); + // High byte shifted right to place of low byte: (Src >> ShiftAmt) & Mask. + auto SrcShiftedRight = MIRBuilder.buildLShr(Ty, Src, ShiftAmt); + auto HiShiftedRight = MIRBuilder.buildAnd(Ty, SrcShiftedRight, Mask); + Res = MIRBuilder.buildOr(Ty, Res, HiShiftedRight); + } + Res.getInstr()->getOperand(0).setReg(Dst); + + MI.eraseFromParent(); + return Legalized; +} + +//{ (Src & Mask) >> N } | { (Src << N) & Mask } +static MachineInstrBuilder SwapN(unsigned N, DstOp Dst, MachineIRBuilder &B, + MachineInstrBuilder Src, APInt Mask) { + const LLT Ty = Dst.getLLTTy(*B.getMRI()); + MachineInstrBuilder C_N = B.buildConstant(Ty, N); + MachineInstrBuilder MaskLoNTo0 = B.buildConstant(Ty, Mask); + return B.buildOr(Dst, B.buildLShr(Ty, B.buildAnd(Ty, Src, MaskLoNTo0), C_N), + B.buildAnd(Ty, B.buildShl(Ty, Src, C_N), MaskLoNTo0)); +} + +LegalizerHelper::LegalizeResult +LegalizerHelper::lowerBitreverse(MachineInstr &MI) { + Register Dst = MI.getOperand(0).getReg(); + Register Src = MI.getOperand(1).getReg(); + const LLT Ty = MRI.getType(Src); + unsigned Size = Ty.getSizeInBits(); + + MachineInstrBuilder BSWAP = + MIRBuilder.buildInstr(TargetOpcode::G_BSWAP, {Ty}, {Src}); + + // swap high and low 4 bits in 8 bit blocks 7654|3210 -> 3210|7654 + // [(val & 0xF0F0F0F0) >> 4] | [(val & 0x0F0F0F0F) << 4] + // -> [(val & 0xF0F0F0F0) >> 4] | [(val << 4) & 0xF0F0F0F0] + MachineInstrBuilder Swap4 = + SwapN(4, Ty, MIRBuilder, BSWAP, APInt::getSplat(Size, APInt(8, 0xF0))); + + // swap high and low 2 bits in 4 bit blocks 32|10 76|54 -> 10|32 54|76 + // [(val & 0xCCCCCCCC) >> 2] & [(val & 0x33333333) << 2] + // -> [(val & 0xCCCCCCCC) >> 2] & [(val << 2) & 0xCCCCCCCC] + MachineInstrBuilder Swap2 = + SwapN(2, Ty, MIRBuilder, Swap4, APInt::getSplat(Size, APInt(8, 0xCC))); + + // swap high and low 1 bit in 2 bit blocks 1|0 3|2 5|4 7|6 -> 0|1 2|3 4|5 6|7 + // [(val & 0xAAAAAAAA) >> 1] & [(val & 0x55555555) << 1] + // -> [(val & 0xAAAAAAAA) >> 1] & [(val << 1) & 0xAAAAAAAA] + SwapN(1, Dst, MIRBuilder, Swap2, APInt::getSplat(Size, APInt(8, 0xAA))); + + MI.eraseFromParent(); + return Legalized; +} diff --git a/llvm/lib/CodeGen/MachineCopyPropagation.cpp b/llvm/lib/CodeGen/MachineCopyPropagation.cpp index 6db388c2564a2d..c316b167059bca 100644 --- a/llvm/lib/CodeGen/MachineCopyPropagation.cpp +++ b/llvm/lib/CodeGen/MachineCopyPropagation.cpp @@ -78,6 +78,7 @@ using namespace llvm; STATISTIC(NumDeletes, "Number of dead copies deleted"); STATISTIC(NumCopyForwards, "Number of copy uses forwarded"); +STATISTIC(NumCopyBackwardPropagated, "Number of copy defs backward propagated"); DEBUG_COUNTER(FwdCounter, "machine-cp-fwd", "Controls which register COPYs are forwarded"); @@ -793,6 +794,7 @@ void MachineCopyPropagation::propagateDefs(MachineInstr &MI) { LLVM_DEBUG(dbgs() << "MCP: After replacement: " << MI << "\n"); MaybeDeadCopies.insert(Copy); Changed = true; + ++NumCopyBackwardPropagated; } } @@ -849,8 +851,10 @@ void MachineCopyPropagation::BackwardCopyPropagateBlock( } } - for (auto *Copy : MaybeDeadCopies) + for (auto *Copy : MaybeDeadCopies) { Copy->eraseFromParent(); + ++NumDeletes; + } MaybeDeadCopies.clear(); CopyDbgUsers.clear(); diff --git a/llvm/lib/Target/Mips/MipsLegalizerInfo.cpp b/llvm/lib/Target/Mips/MipsLegalizerInfo.cpp index 36eb85e379a28b..39e53a75ac7e59 100644 --- a/llvm/lib/Target/Mips/MipsLegalizerInfo.cpp +++ b/llvm/lib/Target/Mips/MipsLegalizerInfo.cpp @@ -185,6 +185,23 @@ MipsLegalizerInfo::MipsLegalizerInfo(const MipsSubtarget &ST) { getActionDefinitionsBuilder(G_VASTART) .legalFor({p0}); + getActionDefinitionsBuilder(G_BSWAP) + .legalIf([=, &ST](const LegalityQuery &Query) { + if (ST.hasMips32r2() && CheckTyN(0, Query, {s32})) + return true; + return false; + }) + .lowerIf([=, &ST](const LegalityQuery &Query) { + if (!ST.hasMips32r2() && CheckTyN(0, Query, {s32})) + return true; + return false; + }) + .maxScalar(0, s32); + + getActionDefinitionsBuilder(G_BITREVERSE) + .lowerFor({s32}) + .maxScalar(0, s32); + // FP instructions getActionDefinitionsBuilder(G_FCONSTANT) .legalFor({s32, s64}); diff --git a/llvm/lib/Target/Mips/MipsRegisterBankInfo.cpp b/llvm/lib/Target/Mips/MipsRegisterBankInfo.cpp index 4abbc23e4cb2df..272fe9a8dd2233 100644 --- a/llvm/lib/Target/Mips/MipsRegisterBankInfo.cpp +++ b/llvm/lib/Target/Mips/MipsRegisterBankInfo.cpp @@ -451,6 +451,7 @@ MipsRegisterBankInfo::getInstrMapping(const MachineInstr &MI) const { case G_LSHR: case G_BRINDIRECT: case G_VASTART: + case G_BSWAP: OperandsMapping = &Mips::ValueMappings[Mips::GPRIdx]; break; case G_ADD: diff --git a/llvm/test/CodeGen/AMDGPU/GlobalISel/legalize-bitreverse.mir b/llvm/test/CodeGen/AMDGPU/GlobalISel/legalize-bitreverse.mir index c15388af69ac0d..ff5c65cfce10e5 100644 --- a/llvm/test/CodeGen/AMDGPU/GlobalISel/legalize-bitreverse.mir +++ b/llvm/test/CodeGen/AMDGPU/GlobalISel/legalize-bitreverse.mir @@ -1,5 +1,5 @@ # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py -# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer -global-isel-abort=0 %s -o - | FileCheck %s +# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - | FileCheck %s --- name: bitreverse_s8 @@ -131,8 +131,11 @@ body: | liveins: $vgpr0_vgpr1 ; CHECK-LABEL: name: bitreverse_s64 ; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1 - ; CHECK: [[BITREVERSE:%[0-9]+]]:_(s64) = G_BITREVERSE [[COPY]] - ; CHECK: $vgpr0_vgpr1 = COPY [[BITREVERSE]](s64) + ; CHECK: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[COPY]](s64) + ; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV1]] + ; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV]] + ; CHECK: [[MV:%[0-9]+]]:_(s64) = G_MERGE_VALUES [[BITREVERSE]](s32), [[BITREVERSE1]](s32) + ; CHECK: $vgpr0_vgpr1 = COPY [[MV]](s64) %0:_(s64) = COPY $vgpr0_vgpr1 %1:_(s64) = G_BITREVERSE %0 $vgpr0_vgpr1 = COPY %1 @@ -147,9 +150,15 @@ body: | ; CHECK-LABEL: name: bitreverse_v2s64 ; CHECK: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3 ; CHECK: [[UV:%[0-9]+]]:_(s64), [[UV1:%[0-9]+]]:_(s64) = G_UNMERGE_VALUES [[COPY]](<2 x s64>) - ; CHECK: [[BITREVERSE:%[0-9]+]]:_(s64) = G_BITREVERSE [[UV]] - ; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s64) = G_BITREVERSE [[UV1]] - ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s64>) = G_BUILD_VECTOR [[BITREVERSE]](s64), [[BITREVERSE1]](s64) + ; CHECK: [[UV2:%[0-9]+]]:_(s32), [[UV3:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[UV]](s64) + ; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV3]] + ; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV2]] + ; CHECK: [[MV:%[0-9]+]]:_(s64) = G_MERGE_VALUES [[BITREVERSE]](s32), [[BITREVERSE1]](s32) + ; CHECK: [[UV4:%[0-9]+]]:_(s32), [[UV5:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[UV1]](s64) + ; CHECK: [[BITREVERSE2:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV5]] + ; CHECK: [[BITREVERSE3:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV4]] + ; CHECK: [[MV1:%[0-9]+]]:_(s64) = G_MERGE_VALUES [[BITREVERSE2]](s32), [[BITREVERSE3]](s32) + ; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s64>) = G_BUILD_VECTOR [[MV]](s64), [[MV1]](s64) ; CHECK: $vgpr0_vgpr1_vgpr2_vgpr3 = COPY [[BUILD_VECTOR]](<2 x s64>) %0:_(<2 x s64>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3 %1:_(<2 x s64>) = G_BITREVERSE %0 diff --git a/llvm/test/CodeGen/Mips/GlobalISel/instruction-select/bswap.mir b/llvm/test/CodeGen/Mips/GlobalISel/instruction-select/bswap.mir new file mode 100644 index 00000000000000..2cec5eba3ba525 --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/instruction-select/bswap.mir @@ -0,0 +1,30 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=instruction-select -mattr=+mips32r2 -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32R2 +--- | + + define void @bswap_i32() { entry: ret void } + +... +--- +name: bswap_i32 +alignment: 4 +legalized: true +regBankSelected: true +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0 + + ; MIPS32R2-LABEL: name: bswap_i32 + ; MIPS32R2: liveins: $a0 + ; MIPS32R2: [[COPY:%[0-9]+]]:gpr32 = COPY $a0 + ; MIPS32R2: [[WSBH:%[0-9]+]]:gpr32 = WSBH [[COPY]] + ; MIPS32R2: [[ROTR:%[0-9]+]]:gpr32 = ROTR [[WSBH]], 16 + ; MIPS32R2: $v0 = COPY [[ROTR]] + ; MIPS32R2: RetRA implicit $v0 + %0:gprb(s32) = COPY $a0 + %1:gprb(s32) = G_BSWAP %0 + $v0 = COPY %1(s32) + RetRA implicit $v0 + +... diff --git a/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bitreverse.mir b/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bitreverse.mir new file mode 100644 index 00000000000000..ca874f5e49964d --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bitreverse.mir @@ -0,0 +1,215 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=legalizer -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32 +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=legalizer -mattr=+mips32r2 -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32R2 +--- | + + define void @bitreverse_i32() { entry: ret void } + define void @bitreverse_i64() { entry: ret void } + +... +--- +name: bitreverse_i32 +alignment: 4 +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0 + + ; MIPS32-LABEL: name: bitreverse_i32 + ; MIPS32: liveins: $a0 + ; MIPS32: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 24 + ; MIPS32: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[COPY]], [[C]](s32) + ; MIPS32: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C]](s32) + ; MIPS32: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[SHL]] + ; MIPS32: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 65280 + ; MIPS32: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 8 + ; MIPS32: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY]], [[C1]] + ; MIPS32: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[AND]], [[C2]](s32) + ; MIPS32: [[OR1:%[0-9]+]]:_(s32) = G_OR [[OR]], [[SHL1]] + ; MIPS32: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C2]](s32) + ; MIPS32: [[AND1:%[0-9]+]]:_(s32) = G_AND [[LSHR1]], [[C1]] + ; MIPS32: [[OR2:%[0-9]+]]:_(s32) = G_OR [[OR1]], [[AND1]] + ; MIPS32: [[C3:%[0-9]+]]:_(s32) = G_CONSTANT i32 4 + ; MIPS32: [[C4:%[0-9]+]]:_(s32) = G_CONSTANT i32 -252645136 + ; MIPS32: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[OR2]], [[C3]](s32) + ; MIPS32: [[AND2:%[0-9]+]]:_(s32) = G_AND [[SHL2]], [[C4]] + ; MIPS32: [[AND3:%[0-9]+]]:_(s32) = G_AND [[OR2]], [[C4]] + ; MIPS32: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[AND3]], [[C3]](s32) + ; MIPS32: [[OR3:%[0-9]+]]:_(s32) = G_OR [[LSHR2]], [[AND2]] + ; MIPS32: [[C5:%[0-9]+]]:_(s32) = G_CONSTANT i32 2 + ; MIPS32: [[C6:%[0-9]+]]:_(s32) = G_CONSTANT i32 -858993460 + ; MIPS32: [[SHL3:%[0-9]+]]:_(s32) = G_SHL [[OR3]], [[C5]](s32) + ; MIPS32: [[AND4:%[0-9]+]]:_(s32) = G_AND [[SHL3]], [[C6]] + ; MIPS32: [[AND5:%[0-9]+]]:_(s32) = G_AND [[OR3]], [[C6]] + ; MIPS32: [[LSHR3:%[0-9]+]]:_(s32) = G_LSHR [[AND5]], [[C5]](s32) + ; MIPS32: [[OR4:%[0-9]+]]:_(s32) = G_OR [[LSHR3]], [[AND4]] + ; MIPS32: [[C7:%[0-9]+]]:_(s32) = G_CONSTANT i32 1 + ; MIPS32: [[C8:%[0-9]+]]:_(s32) = G_CONSTANT i32 -1431655766 + ; MIPS32: [[SHL4:%[0-9]+]]:_(s32) = G_SHL [[OR4]], [[C7]](s32) + ; MIPS32: [[AND6:%[0-9]+]]:_(s32) = G_AND [[SHL4]], [[C8]] + ; MIPS32: [[AND7:%[0-9]+]]:_(s32) = G_AND [[OR4]], [[C8]] + ; MIPS32: [[LSHR4:%[0-9]+]]:_(s32) = G_LSHR [[AND7]], [[C7]](s32) + ; MIPS32: [[OR5:%[0-9]+]]:_(s32) = G_OR [[LSHR4]], [[AND6]] + ; MIPS32: $v0 = COPY [[OR5]](s32) + ; MIPS32: RetRA implicit $v0 + ; MIPS32R2-LABEL: name: bitreverse_i32 + ; MIPS32R2: liveins: $a0 + ; MIPS32R2: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32R2: [[BSWAP:%[0-9]+]]:_(s32) = G_BSWAP [[COPY]] + ; MIPS32R2: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 4 + ; MIPS32R2: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 -252645136 + ; MIPS32R2: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[BSWAP]], [[C]](s32) + ; MIPS32R2: [[AND:%[0-9]+]]:_(s32) = G_AND [[SHL]], [[C1]] + ; MIPS32R2: [[AND1:%[0-9]+]]:_(s32) = G_AND [[BSWAP]], [[C1]] + ; MIPS32R2: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[AND1]], [[C]](s32) + ; MIPS32R2: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[AND]] + ; MIPS32R2: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 2 + ; MIPS32R2: [[C3:%[0-9]+]]:_(s32) = G_CONSTANT i32 -858993460 + ; MIPS32R2: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[OR]], [[C2]](s32) + ; MIPS32R2: [[AND2:%[0-9]+]]:_(s32) = G_AND [[SHL1]], [[C3]] + ; MIPS32R2: [[AND3:%[0-9]+]]:_(s32) = G_AND [[OR]], [[C3]] + ; MIPS32R2: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[AND3]], [[C2]](s32) + ; MIPS32R2: [[OR1:%[0-9]+]]:_(s32) = G_OR [[LSHR1]], [[AND2]] + ; MIPS32R2: [[C4:%[0-9]+]]:_(s32) = G_CONSTANT i32 1 + ; MIPS32R2: [[C5:%[0-9]+]]:_(s32) = G_CONSTANT i32 -1431655766 + ; MIPS32R2: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[OR1]], [[C4]](s32) + ; MIPS32R2: [[AND4:%[0-9]+]]:_(s32) = G_AND [[SHL2]], [[C5]] + ; MIPS32R2: [[AND5:%[0-9]+]]:_(s32) = G_AND [[OR1]], [[C5]] + ; MIPS32R2: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[AND5]], [[C4]](s32) + ; MIPS32R2: [[OR2:%[0-9]+]]:_(s32) = G_OR [[LSHR2]], [[AND4]] + ; MIPS32R2: $v0 = COPY [[OR2]](s32) + ; MIPS32R2: RetRA implicit $v0 + %0:_(s32) = COPY $a0 + %1:_(s32) = G_BITREVERSE %0 + $v0 = COPY %1(s32) + RetRA implicit $v0 + +... +--- +name: bitreverse_i64 +alignment: 4 +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0, $a1 + + ; MIPS32-LABEL: name: bitreverse_i64 + ; MIPS32: liveins: $a0, $a1 + ; MIPS32: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32: [[COPY1:%[0-9]+]]:_(s32) = COPY $a1 + ; MIPS32: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 24 + ; MIPS32: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[COPY1]], [[C]](s32) + ; MIPS32: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[COPY1]], [[C]](s32) + ; MIPS32: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[SHL]] + ; MIPS32: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 65280 + ; MIPS32: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 8 + ; MIPS32: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C1]] + ; MIPS32: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[AND]], [[C2]](s32) + ; MIPS32: [[OR1:%[0-9]+]]:_(s32) = G_OR [[OR]], [[SHL1]] + ; MIPS32: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[COPY1]], [[C2]](s32) + ; MIPS32: [[AND1:%[0-9]+]]:_(s32) = G_AND [[LSHR1]], [[C1]] + ; MIPS32: [[OR2:%[0-9]+]]:_(s32) = G_OR [[OR1]], [[AND1]] + ; MIPS32: [[C3:%[0-9]+]]:_(s32) = G_CONSTANT i32 4 + ; MIPS32: [[C4:%[0-9]+]]:_(s32) = G_CONSTANT i32 -252645136 + ; MIPS32: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[OR2]], [[C3]](s32) + ; MIPS32: [[AND2:%[0-9]+]]:_(s32) = G_AND [[SHL2]], [[C4]] + ; MIPS32: [[AND3:%[0-9]+]]:_(s32) = G_AND [[OR2]], [[C4]] + ; MIPS32: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[AND3]], [[C3]](s32) + ; MIPS32: [[OR3:%[0-9]+]]:_(s32) = G_OR [[LSHR2]], [[AND2]] + ; MIPS32: [[C5:%[0-9]+]]:_(s32) = G_CONSTANT i32 2 + ; MIPS32: [[C6:%[0-9]+]]:_(s32) = G_CONSTANT i32 -858993460 + ; MIPS32: [[SHL3:%[0-9]+]]:_(s32) = G_SHL [[OR3]], [[C5]](s32) + ; MIPS32: [[AND4:%[0-9]+]]:_(s32) = G_AND [[SHL3]], [[C6]] + ; MIPS32: [[AND5:%[0-9]+]]:_(s32) = G_AND [[OR3]], [[C6]] + ; MIPS32: [[LSHR3:%[0-9]+]]:_(s32) = G_LSHR [[AND5]], [[C5]](s32) + ; MIPS32: [[OR4:%[0-9]+]]:_(s32) = G_OR [[LSHR3]], [[AND4]] + ; MIPS32: [[C7:%[0-9]+]]:_(s32) = G_CONSTANT i32 1 + ; MIPS32: [[C8:%[0-9]+]]:_(s32) = G_CONSTANT i32 -1431655766 + ; MIPS32: [[SHL4:%[0-9]+]]:_(s32) = G_SHL [[OR4]], [[C7]](s32) + ; MIPS32: [[AND6:%[0-9]+]]:_(s32) = G_AND [[SHL4]], [[C8]] + ; MIPS32: [[AND7:%[0-9]+]]:_(s32) = G_AND [[OR4]], [[C8]] + ; MIPS32: [[LSHR4:%[0-9]+]]:_(s32) = G_LSHR [[AND7]], [[C7]](s32) + ; MIPS32: [[OR5:%[0-9]+]]:_(s32) = G_OR [[LSHR4]], [[AND6]] + ; MIPS32: [[SHL5:%[0-9]+]]:_(s32) = G_SHL [[COPY]], [[C]](s32) + ; MIPS32: [[LSHR5:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C]](s32) + ; MIPS32: [[OR6:%[0-9]+]]:_(s32) = G_OR [[LSHR5]], [[SHL5]] + ; MIPS32: [[AND8:%[0-9]+]]:_(s32) = G_AND [[COPY]], [[C1]] + ; MIPS32: [[SHL6:%[0-9]+]]:_(s32) = G_SHL [[AND8]], [[C2]](s32) + ; MIPS32: [[OR7:%[0-9]+]]:_(s32) = G_OR [[OR6]], [[SHL6]] + ; MIPS32: [[LSHR6:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C2]](s32) + ; MIPS32: [[AND9:%[0-9]+]]:_(s32) = G_AND [[LSHR6]], [[C1]] + ; MIPS32: [[OR8:%[0-9]+]]:_(s32) = G_OR [[OR7]], [[AND9]] + ; MIPS32: [[SHL7:%[0-9]+]]:_(s32) = G_SHL [[OR8]], [[C3]](s32) + ; MIPS32: [[AND10:%[0-9]+]]:_(s32) = G_AND [[SHL7]], [[C4]] + ; MIPS32: [[AND11:%[0-9]+]]:_(s32) = G_AND [[OR8]], [[C4]] + ; MIPS32: [[LSHR7:%[0-9]+]]:_(s32) = G_LSHR [[AND11]], [[C3]](s32) + ; MIPS32: [[OR9:%[0-9]+]]:_(s32) = G_OR [[LSHR7]], [[AND10]] + ; MIPS32: [[SHL8:%[0-9]+]]:_(s32) = G_SHL [[OR9]], [[C5]](s32) + ; MIPS32: [[AND12:%[0-9]+]]:_(s32) = G_AND [[SHL8]], [[C6]] + ; MIPS32: [[AND13:%[0-9]+]]:_(s32) = G_AND [[OR9]], [[C6]] + ; MIPS32: [[LSHR8:%[0-9]+]]:_(s32) = G_LSHR [[AND13]], [[C5]](s32) + ; MIPS32: [[OR10:%[0-9]+]]:_(s32) = G_OR [[LSHR8]], [[AND12]] + ; MIPS32: [[SHL9:%[0-9]+]]:_(s32) = G_SHL [[OR10]], [[C7]](s32) + ; MIPS32: [[AND14:%[0-9]+]]:_(s32) = G_AND [[SHL9]], [[C8]] + ; MIPS32: [[AND15:%[0-9]+]]:_(s32) = G_AND [[OR10]], [[C8]] + ; MIPS32: [[LSHR9:%[0-9]+]]:_(s32) = G_LSHR [[AND15]], [[C7]](s32) + ; MIPS32: [[OR11:%[0-9]+]]:_(s32) = G_OR [[LSHR9]], [[AND14]] + ; MIPS32: $v0 = COPY [[OR5]](s32) + ; MIPS32: $v1 = COPY [[OR11]](s32) + ; MIPS32: RetRA implicit $v0, implicit $v1 + ; MIPS32R2-LABEL: name: bitreverse_i64 + ; MIPS32R2: liveins: $a0, $a1 + ; MIPS32R2: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32R2: [[COPY1:%[0-9]+]]:_(s32) = COPY $a1 + ; MIPS32R2: [[BSWAP:%[0-9]+]]:_(s32) = G_BSWAP [[COPY1]] + ; MIPS32R2: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 4 + ; MIPS32R2: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 -252645136 + ; MIPS32R2: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[BSWAP]], [[C]](s32) + ; MIPS32R2: [[AND:%[0-9]+]]:_(s32) = G_AND [[SHL]], [[C1]] + ; MIPS32R2: [[AND1:%[0-9]+]]:_(s32) = G_AND [[BSWAP]], [[C1]] + ; MIPS32R2: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[AND1]], [[C]](s32) + ; MIPS32R2: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[AND]] + ; MIPS32R2: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 2 + ; MIPS32R2: [[C3:%[0-9]+]]:_(s32) = G_CONSTANT i32 -858993460 + ; MIPS32R2: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[OR]], [[C2]](s32) + ; MIPS32R2: [[AND2:%[0-9]+]]:_(s32) = G_AND [[SHL1]], [[C3]] + ; MIPS32R2: [[AND3:%[0-9]+]]:_(s32) = G_AND [[OR]], [[C3]] + ; MIPS32R2: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[AND3]], [[C2]](s32) + ; MIPS32R2: [[OR1:%[0-9]+]]:_(s32) = G_OR [[LSHR1]], [[AND2]] + ; MIPS32R2: [[C4:%[0-9]+]]:_(s32) = G_CONSTANT i32 1 + ; MIPS32R2: [[C5:%[0-9]+]]:_(s32) = G_CONSTANT i32 -1431655766 + ; MIPS32R2: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[OR1]], [[C4]](s32) + ; MIPS32R2: [[AND4:%[0-9]+]]:_(s32) = G_AND [[SHL2]], [[C5]] + ; MIPS32R2: [[AND5:%[0-9]+]]:_(s32) = G_AND [[OR1]], [[C5]] + ; MIPS32R2: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[AND5]], [[C4]](s32) + ; MIPS32R2: [[OR2:%[0-9]+]]:_(s32) = G_OR [[LSHR2]], [[AND4]] + ; MIPS32R2: [[BSWAP1:%[0-9]+]]:_(s32) = G_BSWAP [[COPY]] + ; MIPS32R2: [[SHL3:%[0-9]+]]:_(s32) = G_SHL [[BSWAP1]], [[C]](s32) + ; MIPS32R2: [[AND6:%[0-9]+]]:_(s32) = G_AND [[SHL3]], [[C1]] + ; MIPS32R2: [[AND7:%[0-9]+]]:_(s32) = G_AND [[BSWAP1]], [[C1]] + ; MIPS32R2: [[LSHR3:%[0-9]+]]:_(s32) = G_LSHR [[AND7]], [[C]](s32) + ; MIPS32R2: [[OR3:%[0-9]+]]:_(s32) = G_OR [[LSHR3]], [[AND6]] + ; MIPS32R2: [[SHL4:%[0-9]+]]:_(s32) = G_SHL [[OR3]], [[C2]](s32) + ; MIPS32R2: [[AND8:%[0-9]+]]:_(s32) = G_AND [[SHL4]], [[C3]] + ; MIPS32R2: [[AND9:%[0-9]+]]:_(s32) = G_AND [[OR3]], [[C3]] + ; MIPS32R2: [[LSHR4:%[0-9]+]]:_(s32) = G_LSHR [[AND9]], [[C2]](s32) + ; MIPS32R2: [[OR4:%[0-9]+]]:_(s32) = G_OR [[LSHR4]], [[AND8]] + ; MIPS32R2: [[SHL5:%[0-9]+]]:_(s32) = G_SHL [[OR4]], [[C4]](s32) + ; MIPS32R2: [[AND10:%[0-9]+]]:_(s32) = G_AND [[SHL5]], [[C5]] + ; MIPS32R2: [[AND11:%[0-9]+]]:_(s32) = G_AND [[OR4]], [[C5]] + ; MIPS32R2: [[LSHR5:%[0-9]+]]:_(s32) = G_LSHR [[AND11]], [[C4]](s32) + ; MIPS32R2: [[OR5:%[0-9]+]]:_(s32) = G_OR [[LSHR5]], [[AND10]] + ; MIPS32R2: $v0 = COPY [[OR2]](s32) + ; MIPS32R2: $v1 = COPY [[OR5]](s32) + ; MIPS32R2: RetRA implicit $v0, implicit $v1 + %1:_(s32) = COPY $a0 + %2:_(s32) = COPY $a1 + %0:_(s64) = G_MERGE_VALUES %1(s32), %2(s32) + %3:_(s64) = G_BITREVERSE %0 + %4:_(s32), %5:_(s32) = G_UNMERGE_VALUES %3(s64) + $v0 = COPY %4(s32) + $v1 = COPY %5(s32) + RetRA implicit $v0, implicit $v1 + +... diff --git a/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bswap.mir b/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bswap.mir new file mode 100644 index 00000000000000..62a95b8c10a06b --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/legalizer/bswap.mir @@ -0,0 +1,101 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=legalizer -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32 +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=legalizer -mattr=+mips32r2 -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32R2 +--- | + + define void @bswap_i32() { entry: ret void } + define void @bswap_i64() { entry: ret void } + +... +--- +name: bswap_i32 +alignment: 4 +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0 + + ; MIPS32-LABEL: name: bswap_i32 + ; MIPS32: liveins: $a0 + ; MIPS32: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 24 + ; MIPS32: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[COPY]], [[C]](s32) + ; MIPS32: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C]](s32) + ; MIPS32: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[SHL]] + ; MIPS32: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 65280 + ; MIPS32: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 8 + ; MIPS32: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY]], [[C1]] + ; MIPS32: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[AND]], [[C2]](s32) + ; MIPS32: [[OR1:%[0-9]+]]:_(s32) = G_OR [[OR]], [[SHL1]] + ; MIPS32: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C2]](s32) + ; MIPS32: [[AND1:%[0-9]+]]:_(s32) = G_AND [[LSHR1]], [[C1]] + ; MIPS32: [[OR2:%[0-9]+]]:_(s32) = G_OR [[OR1]], [[AND1]] + ; MIPS32: $v0 = COPY [[OR2]](s32) + ; MIPS32: RetRA implicit $v0 + ; MIPS32R2-LABEL: name: bswap_i32 + ; MIPS32R2: liveins: $a0 + ; MIPS32R2: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32R2: [[BSWAP:%[0-9]+]]:_(s32) = G_BSWAP [[COPY]] + ; MIPS32R2: $v0 = COPY [[BSWAP]](s32) + ; MIPS32R2: RetRA implicit $v0 + %0:_(s32) = COPY $a0 + %1:_(s32) = G_BSWAP %0 + $v0 = COPY %1(s32) + RetRA implicit $v0 + +... +--- +name: bswap_i64 +alignment: 4 +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0, $a1 + + ; MIPS32-LABEL: name: bswap_i64 + ; MIPS32: liveins: $a0, $a1 + ; MIPS32: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32: [[COPY1:%[0-9]+]]:_(s32) = COPY $a1 + ; MIPS32: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 24 + ; MIPS32: [[SHL:%[0-9]+]]:_(s32) = G_SHL [[COPY1]], [[C]](s32) + ; MIPS32: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[COPY1]], [[C]](s32) + ; MIPS32: [[OR:%[0-9]+]]:_(s32) = G_OR [[LSHR]], [[SHL]] + ; MIPS32: [[C1:%[0-9]+]]:_(s32) = G_CONSTANT i32 65280 + ; MIPS32: [[C2:%[0-9]+]]:_(s32) = G_CONSTANT i32 8 + ; MIPS32: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C1]] + ; MIPS32: [[SHL1:%[0-9]+]]:_(s32) = G_SHL [[AND]], [[C2]](s32) + ; MIPS32: [[OR1:%[0-9]+]]:_(s32) = G_OR [[OR]], [[SHL1]] + ; MIPS32: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[COPY1]], [[C2]](s32) + ; MIPS32: [[AND1:%[0-9]+]]:_(s32) = G_AND [[LSHR1]], [[C1]] + ; MIPS32: [[OR2:%[0-9]+]]:_(s32) = G_OR [[OR1]], [[AND1]] + ; MIPS32: [[SHL2:%[0-9]+]]:_(s32) = G_SHL [[COPY]], [[C]](s32) + ; MIPS32: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C]](s32) + ; MIPS32: [[OR3:%[0-9]+]]:_(s32) = G_OR [[LSHR2]], [[SHL2]] + ; MIPS32: [[AND2:%[0-9]+]]:_(s32) = G_AND [[COPY]], [[C1]] + ; MIPS32: [[SHL3:%[0-9]+]]:_(s32) = G_SHL [[AND2]], [[C2]](s32) + ; MIPS32: [[OR4:%[0-9]+]]:_(s32) = G_OR [[OR3]], [[SHL3]] + ; MIPS32: [[LSHR3:%[0-9]+]]:_(s32) = G_LSHR [[COPY]], [[C2]](s32) + ; MIPS32: [[AND3:%[0-9]+]]:_(s32) = G_AND [[LSHR3]], [[C1]] + ; MIPS32: [[OR5:%[0-9]+]]:_(s32) = G_OR [[OR4]], [[AND3]] + ; MIPS32: $v0 = COPY [[OR2]](s32) + ; MIPS32: $v1 = COPY [[OR5]](s32) + ; MIPS32: RetRA implicit $v0, implicit $v1 + ; MIPS32R2-LABEL: name: bswap_i64 + ; MIPS32R2: liveins: $a0, $a1 + ; MIPS32R2: [[COPY:%[0-9]+]]:_(s32) = COPY $a0 + ; MIPS32R2: [[COPY1:%[0-9]+]]:_(s32) = COPY $a1 + ; MIPS32R2: [[BSWAP:%[0-9]+]]:_(s32) = G_BSWAP [[COPY1]] + ; MIPS32R2: [[BSWAP1:%[0-9]+]]:_(s32) = G_BSWAP [[COPY]] + ; MIPS32R2: $v0 = COPY [[BSWAP]](s32) + ; MIPS32R2: $v1 = COPY [[BSWAP1]](s32) + ; MIPS32R2: RetRA implicit $v0, implicit $v1 + %1:_(s32) = COPY $a0 + %2:_(s32) = COPY $a1 + %0:_(s64) = G_MERGE_VALUES %1(s32), %2(s32) + %3:_(s64) = G_BSWAP %0 + %4:_(s32), %5:_(s32) = G_UNMERGE_VALUES %3(s64) + $v0 = COPY %4(s32) + $v1 = COPY %5(s32) + RetRA implicit $v0, implicit $v1 + +... diff --git a/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bitreverse.ll b/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bitreverse.ll new file mode 100644 index 00000000000000..845d84d7551698 --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bitreverse.ll @@ -0,0 +1,184 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -O0 -mtriple=mipsel-linux-gnu -global-isel -verify-machineinstrs %s -o -| FileCheck %s -check-prefixes=MIPS32 +; RUN: llc -O0 -mtriple=mipsel-linux-gnu -global-isel -mattr=+mips32r2 -verify-machineinstrs %s -o -| FileCheck %s -check-prefixes=MIPS32R2 + +declare i32 @llvm.bitreverse.i32(i32) +define i32 @bitreverse_i32(i32 signext %a) { +; MIPS32-LABEL: bitreverse_i32: +; MIPS32: # %bb.0: # %entry +; MIPS32-NEXT: sll $1, $4, 24 +; MIPS32-NEXT: srl $2, $4, 24 +; MIPS32-NEXT: or $1, $2, $1 +; MIPS32-NEXT: andi $2, $4, 65280 +; MIPS32-NEXT: sll $2, $2, 8 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: srl $2, $4, 8 +; MIPS32-NEXT: andi $2, $2, 65280 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: lui $2, 61680 +; MIPS32-NEXT: ori $2, $2, 61680 +; MIPS32-NEXT: sll $3, $1, 4 +; MIPS32-NEXT: and $3, $3, $2 +; MIPS32-NEXT: and $1, $1, $2 +; MIPS32-NEXT: srl $1, $1, 4 +; MIPS32-NEXT: or $1, $1, $3 +; MIPS32-NEXT: lui $2, 52428 +; MIPS32-NEXT: ori $2, $2, 52428 +; MIPS32-NEXT: sll $3, $1, 2 +; MIPS32-NEXT: and $3, $3, $2 +; MIPS32-NEXT: and $1, $1, $2 +; MIPS32-NEXT: srl $1, $1, 2 +; MIPS32-NEXT: or $1, $1, $3 +; MIPS32-NEXT: lui $2, 43690 +; MIPS32-NEXT: ori $2, $2, 43690 +; MIPS32-NEXT: sll $3, $1, 1 +; MIPS32-NEXT: and $3, $3, $2 +; MIPS32-NEXT: and $1, $1, $2 +; MIPS32-NEXT: srl $1, $1, 1 +; MIPS32-NEXT: or $2, $1, $3 +; MIPS32-NEXT: jr $ra +; MIPS32-NEXT: nop +; +; MIPS32R2-LABEL: bitreverse_i32: +; MIPS32R2: # %bb.0: # %entry +; MIPS32R2-NEXT: wsbh $1, $4 +; MIPS32R2-NEXT: rotr $1, $1, 16 +; MIPS32R2-NEXT: lui $2, 61680 +; MIPS32R2-NEXT: ori $2, $2, 61680 +; MIPS32R2-NEXT: sll $3, $1, 4 +; MIPS32R2-NEXT: and $3, $3, $2 +; MIPS32R2-NEXT: and $1, $1, $2 +; MIPS32R2-NEXT: srl $1, $1, 4 +; MIPS32R2-NEXT: or $1, $1, $3 +; MIPS32R2-NEXT: lui $2, 52428 +; MIPS32R2-NEXT: ori $2, $2, 52428 +; MIPS32R2-NEXT: sll $3, $1, 2 +; MIPS32R2-NEXT: and $3, $3, $2 +; MIPS32R2-NEXT: and $1, $1, $2 +; MIPS32R2-NEXT: srl $1, $1, 2 +; MIPS32R2-NEXT: or $1, $1, $3 +; MIPS32R2-NEXT: lui $2, 43690 +; MIPS32R2-NEXT: ori $2, $2, 43690 +; MIPS32R2-NEXT: sll $3, $1, 1 +; MIPS32R2-NEXT: and $3, $3, $2 +; MIPS32R2-NEXT: and $1, $1, $2 +; MIPS32R2-NEXT: srl $1, $1, 1 +; MIPS32R2-NEXT: or $2, $1, $3 +; MIPS32R2-NEXT: jr $ra +; MIPS32R2-NEXT: nop +entry: + %0 = call i32 @llvm.bitreverse.i32(i32 %a) + ret i32 %0 +} + +declare i64 @llvm.bitreverse.i64(i64) +define i64 @bitreverse_i64(i64 signext %a) { +; MIPS32-LABEL: bitreverse_i64: +; MIPS32: # %bb.0: # %entry +; MIPS32-NEXT: sll $1, $5, 24 +; MIPS32-NEXT: srl $2, $5, 24 +; MIPS32-NEXT: or $1, $2, $1 +; MIPS32-NEXT: andi $2, $5, 65280 +; MIPS32-NEXT: sll $2, $2, 8 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: srl $2, $5, 8 +; MIPS32-NEXT: andi $2, $2, 65280 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: lui $2, 61680 +; MIPS32-NEXT: ori $2, $2, 61680 +; MIPS32-NEXT: sll $3, $1, 4 +; MIPS32-NEXT: and $3, $3, $2 +; MIPS32-NEXT: and $1, $1, $2 +; MIPS32-NEXT: srl $1, $1, 4 +; MIPS32-NEXT: or $1, $1, $3 +; MIPS32-NEXT: lui $3, 52428 +; MIPS32-NEXT: ori $3, $3, 52428 +; MIPS32-NEXT: sll $5, $1, 2 +; MIPS32-NEXT: and $5, $5, $3 +; MIPS32-NEXT: and $1, $1, $3 +; MIPS32-NEXT: srl $1, $1, 2 +; MIPS32-NEXT: or $1, $1, $5 +; MIPS32-NEXT: lui $5, 43690 +; MIPS32-NEXT: ori $5, $5, 43690 +; MIPS32-NEXT: sll $6, $1, 1 +; MIPS32-NEXT: and $6, $6, $5 +; MIPS32-NEXT: and $1, $1, $5 +; MIPS32-NEXT: srl $1, $1, 1 +; MIPS32-NEXT: or $1, $1, $6 +; MIPS32-NEXT: sll $6, $4, 24 +; MIPS32-NEXT: srl $7, $4, 24 +; MIPS32-NEXT: or $6, $7, $6 +; MIPS32-NEXT: andi $7, $4, 65280 +; MIPS32-NEXT: sll $7, $7, 8 +; MIPS32-NEXT: or $6, $6, $7 +; MIPS32-NEXT: srl $4, $4, 8 +; MIPS32-NEXT: andi $4, $4, 65280 +; MIPS32-NEXT: or $4, $6, $4 +; MIPS32-NEXT: sll $6, $4, 4 +; MIPS32-NEXT: and $6, $6, $2 +; MIPS32-NEXT: and $2, $4, $2 +; MIPS32-NEXT: srl $2, $2, 4 +; MIPS32-NEXT: or $2, $2, $6 +; MIPS32-NEXT: sll $4, $2, 2 +; MIPS32-NEXT: and $4, $4, $3 +; MIPS32-NEXT: and $2, $2, $3 +; MIPS32-NEXT: srl $2, $2, 2 +; MIPS32-NEXT: or $2, $2, $4 +; MIPS32-NEXT: sll $3, $2, 1 +; MIPS32-NEXT: and $3, $3, $5 +; MIPS32-NEXT: and $2, $2, $5 +; MIPS32-NEXT: srl $2, $2, 1 +; MIPS32-NEXT: or $3, $2, $3 +; MIPS32-NEXT: move $2, $1 +; MIPS32-NEXT: jr $ra +; MIPS32-NEXT: nop +; +; MIPS32R2-LABEL: bitreverse_i64: +; MIPS32R2: # %bb.0: # %entry +; MIPS32R2-NEXT: wsbh $1, $5 +; MIPS32R2-NEXT: rotr $1, $1, 16 +; MIPS32R2-NEXT: lui $2, 61680 +; MIPS32R2-NEXT: ori $2, $2, 61680 +; MIPS32R2-NEXT: sll $3, $1, 4 +; MIPS32R2-NEXT: and $3, $3, $2 +; MIPS32R2-NEXT: and $1, $1, $2 +; MIPS32R2-NEXT: srl $1, $1, 4 +; MIPS32R2-NEXT: or $1, $1, $3 +; MIPS32R2-NEXT: lui $3, 52428 +; MIPS32R2-NEXT: ori $3, $3, 52428 +; MIPS32R2-NEXT: sll $5, $1, 2 +; MIPS32R2-NEXT: and $5, $5, $3 +; MIPS32R2-NEXT: and $1, $1, $3 +; MIPS32R2-NEXT: srl $1, $1, 2 +; MIPS32R2-NEXT: or $1, $1, $5 +; MIPS32R2-NEXT: lui $5, 43690 +; MIPS32R2-NEXT: ori $5, $5, 43690 +; MIPS32R2-NEXT: sll $6, $1, 1 +; MIPS32R2-NEXT: and $6, $6, $5 +; MIPS32R2-NEXT: and $1, $1, $5 +; MIPS32R2-NEXT: srl $1, $1, 1 +; MIPS32R2-NEXT: or $1, $1, $6 +; MIPS32R2-NEXT: wsbh $4, $4 +; MIPS32R2-NEXT: rotr $4, $4, 16 +; MIPS32R2-NEXT: sll $6, $4, 4 +; MIPS32R2-NEXT: and $6, $6, $2 +; MIPS32R2-NEXT: and $2, $4, $2 +; MIPS32R2-NEXT: srl $2, $2, 4 +; MIPS32R2-NEXT: or $2, $2, $6 +; MIPS32R2-NEXT: sll $4, $2, 2 +; MIPS32R2-NEXT: and $4, $4, $3 +; MIPS32R2-NEXT: and $2, $2, $3 +; MIPS32R2-NEXT: srl $2, $2, 2 +; MIPS32R2-NEXT: or $2, $2, $4 +; MIPS32R2-NEXT: sll $3, $2, 1 +; MIPS32R2-NEXT: and $3, $3, $5 +; MIPS32R2-NEXT: and $2, $2, $5 +; MIPS32R2-NEXT: srl $2, $2, 1 +; MIPS32R2-NEXT: or $3, $2, $3 +; MIPS32R2-NEXT: move $2, $1 +; MIPS32R2-NEXT: jr $ra +; MIPS32R2-NEXT: nop +entry: + %0 = call i64 @llvm.bitreverse.i64(i64 %a) + ret i64 %0 +} diff --git a/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bswap.ll b/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bswap.ll new file mode 100644 index 00000000000000..3b371cca6fe90f --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/llvm-ir/bswap.ll @@ -0,0 +1,68 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -O0 -mtriple=mipsel-linux-gnu -global-isel -verify-machineinstrs %s -o -| FileCheck %s -check-prefixes=MIPS32 +; RUN: llc -O0 -mtriple=mipsel-linux-gnu -global-isel -mattr=+mips32r2 -verify-machineinstrs %s -o -| FileCheck %s -check-prefixes=MIPS32R2 + +declare i32 @llvm.bswap.i32(i32) +define i32 @bswap_i32(i32 %x) { +; MIPS32-LABEL: bswap_i32: +; MIPS32: # %bb.0: # %entry +; MIPS32-NEXT: sll $1, $4, 24 +; MIPS32-NEXT: srl $2, $4, 24 +; MIPS32-NEXT: or $1, $2, $1 +; MIPS32-NEXT: andi $2, $4, 65280 +; MIPS32-NEXT: sll $2, $2, 8 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: srl $2, $4, 8 +; MIPS32-NEXT: andi $2, $2, 65280 +; MIPS32-NEXT: or $2, $1, $2 +; MIPS32-NEXT: jr $ra +; MIPS32-NEXT: nop +; +; MIPS32R2-LABEL: bswap_i32: +; MIPS32R2: # %bb.0: # %entry +; MIPS32R2-NEXT: wsbh $1, $4 +; MIPS32R2-NEXT: rotr $2, $1, 16 +; MIPS32R2-NEXT: jr $ra +; MIPS32R2-NEXT: nop +entry: + %0 = tail call i32 @llvm.bswap.i32(i32 %x) + ret i32 %0 +} + +declare i64 @llvm.bswap.i64(i64) +define i64 @bswap_i64(i64 %x) { +; MIPS32-LABEL: bswap_i64: +; MIPS32: # %bb.0: # %entry +; MIPS32-NEXT: sll $1, $5, 24 +; MIPS32-NEXT: srl $2, $5, 24 +; MIPS32-NEXT: or $1, $2, $1 +; MIPS32-NEXT: andi $2, $5, 65280 +; MIPS32-NEXT: sll $2, $2, 8 +; MIPS32-NEXT: or $1, $1, $2 +; MIPS32-NEXT: srl $2, $5, 8 +; MIPS32-NEXT: andi $2, $2, 65280 +; MIPS32-NEXT: or $2, $1, $2 +; MIPS32-NEXT: sll $1, $4, 24 +; MIPS32-NEXT: srl $3, $4, 24 +; MIPS32-NEXT: or $1, $3, $1 +; MIPS32-NEXT: andi $3, $4, 65280 +; MIPS32-NEXT: sll $3, $3, 8 +; MIPS32-NEXT: or $1, $1, $3 +; MIPS32-NEXT: srl $3, $4, 8 +; MIPS32-NEXT: andi $3, $3, 65280 +; MIPS32-NEXT: or $3, $1, $3 +; MIPS32-NEXT: jr $ra +; MIPS32-NEXT: nop +; +; MIPS32R2-LABEL: bswap_i64: +; MIPS32R2: # %bb.0: # %entry +; MIPS32R2-NEXT: wsbh $1, $5 +; MIPS32R2-NEXT: rotr $2, $1, 16 +; MIPS32R2-NEXT: wsbh $1, $4 +; MIPS32R2-NEXT: rotr $3, $1, 16 +; MIPS32R2-NEXT: jr $ra +; MIPS32R2-NEXT: nop +entry: + %0 = tail call i64 @llvm.bswap.i64(i64 %x) + ret i64 %0 +} diff --git a/llvm/test/CodeGen/Mips/GlobalISel/regbankselect/bswap.mir b/llvm/test/CodeGen/Mips/GlobalISel/regbankselect/bswap.mir new file mode 100644 index 00000000000000..c50e81eae0c935 --- /dev/null +++ b/llvm/test/CodeGen/Mips/GlobalISel/regbankselect/bswap.mir @@ -0,0 +1,28 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -mtriple=mipsel-linux-gnu -run-pass=regbankselect -mattr=+mips32r2 -verify-machineinstrs %s -o - | FileCheck %s -check-prefixes=MIPS32R2 +--- | + + define void @bswap_i32() { entry: ret void } + +... +--- +name: bswap_i32 +alignment: 4 +legalized: true +tracksRegLiveness: true +body: | + bb.1.entry: + liveins: $a0 + + ; MIPS32R2-LABEL: name: bswap_i32 + ; MIPS32R2: liveins: $a0 + ; MIPS32R2: [[COPY:%[0-9]+]]:gprb(s32) = COPY $a0 + ; MIPS32R2: [[BSWAP:%[0-9]+]]:gprb(s32) = G_BSWAP [[COPY]] + ; MIPS32R2: $v0 = COPY [[BSWAP]](s32) + ; MIPS32R2: RetRA implicit $v0 + %0:_(s32) = COPY $a0 + %1:_(s32) = G_BSWAP %0 + $v0 = COPY %1(s32) + RetRA implicit $v0 + +...