10b57cec5SDimitry Andric// WebAssemblyInstrSIMD.td - WebAssembly SIMD codegen support -*- tablegen -*-// 20b57cec5SDimitry Andric// 30b57cec5SDimitry Andric// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric// See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric// 70b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric/// 90b57cec5SDimitry Andric/// \file 100b57cec5SDimitry Andric/// WebAssembly SIMD operand code-gen constructs. 110b57cec5SDimitry Andric/// 120b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 130b57cec5SDimitry Andric 140b57cec5SDimitry Andric// Instructions requiring HasSIMD128 and the simd128 prefix byte 150b57cec5SDimitry Andricmulticlass SIMD_I<dag oops_r, dag iops_r, dag oops_s, dag iops_s, 160b57cec5SDimitry Andric list<dag> pattern_r, string asmstr_r = "", 170b57cec5SDimitry Andric string asmstr_s = "", bits<32> simdop = -1> { 180b57cec5SDimitry Andric defm "" : I<oops_r, iops_r, oops_s, iops_s, pattern_r, asmstr_r, asmstr_s, 190b57cec5SDimitry Andric !or(0xfd00, !and(0xff, simdop))>, 200b57cec5SDimitry Andric Requires<[HasSIMD128]>; 210b57cec5SDimitry Andric} 220b57cec5SDimitry Andric 230b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v16i8>; 240b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v8i16>; 250b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v4i32>; 260b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v2i64>; 270b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v4f32>; 280b57cec5SDimitry Andricdefm "" : ARGUMENT<V128, v2f64>; 290b57cec5SDimitry Andric 300b57cec5SDimitry Andric// Constrained immediate argument types 310b57cec5SDimitry Andricforeach SIZE = [8, 16] in 320b57cec5SDimitry Andricdef ImmI#SIZE : ImmLeaf<i32, 330b57cec5SDimitry Andric "return -(1 << ("#SIZE#" - 1)) <= Imm && Imm < (1 << ("#SIZE#" - 1));" 340b57cec5SDimitry Andric>; 350b57cec5SDimitry Andricforeach SIZE = [2, 4, 8, 16, 32] in 360b57cec5SDimitry Andricdef LaneIdx#SIZE : ImmLeaf<i32, "return 0 <= Imm && Imm < "#SIZE#";">; 370b57cec5SDimitry Andric 380b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 390b57cec5SDimitry Andric// Load and store 400b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 410b57cec5SDimitry Andric 420b57cec5SDimitry Andric// Load: v128.load 43*5ffd83dbSDimitry Andriclet mayLoad = 1, UseNamedOperandTable = 1 in { 44*5ffd83dbSDimitry Andricdefm LOAD_V128_A32 : 450b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), (ins P2Align:$p2align, offset32_op:$off, I32:$addr), 460b57cec5SDimitry Andric (outs), (ins P2Align:$p2align, offset32_op:$off), [], 470b57cec5SDimitry Andric "v128.load\t$dst, ${off}(${addr})$p2align", 480b57cec5SDimitry Andric "v128.load\t$off$p2align", 0>; 49*5ffd83dbSDimitry Andricdefm LOAD_V128_A64 : 50*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), (ins P2Align:$p2align, offset64_op:$off, I64:$addr), 51*5ffd83dbSDimitry Andric (outs), (ins P2Align:$p2align, offset64_op:$off), [], 52*5ffd83dbSDimitry Andric "v128.load\t$dst, ${off}(${addr})$p2align", 53*5ffd83dbSDimitry Andric "v128.load\t$off$p2align", 0>; 54*5ffd83dbSDimitry Andric} 550b57cec5SDimitry Andric 560b57cec5SDimitry Andric// Def load and store patterns from WebAssemblyInstrMemory.td for vector types 578bcb0991SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64] in { 58*5ffd83dbSDimitry Andricdefm : LoadPatNoOffset<vec_t, load, "LOAD_V128">; 59*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<vec_t, load, regPlusImm, "LOAD_V128">; 60*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<vec_t, load, or_is_add, "LOAD_V128">; 61*5ffd83dbSDimitry Andricdefm : LoadPatOffsetOnly<vec_t, load, "LOAD_V128">; 62*5ffd83dbSDimitry Andricdefm : LoadPatGlobalAddrOffOnly<vec_t, load, "LOAD_V128">; 630b57cec5SDimitry Andric} 640b57cec5SDimitry Andric 658bcb0991SDimitry Andric// vNxM.load_splat 668bcb0991SDimitry Andricmulticlass SIMDLoadSplat<string vec, bits<32> simdop> { 67*5ffd83dbSDimitry Andric let mayLoad = 1, UseNamedOperandTable = 1 in { 68*5ffd83dbSDimitry Andric defm LOAD_SPLAT_#vec#_A32 : 69*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 70*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset32_op:$off, I32:$addr), 71*5ffd83dbSDimitry Andric (outs), 72*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset32_op:$off), [], 73*5ffd83dbSDimitry Andric vec#".load_splat\t$dst, ${off}(${addr})$p2align", 74*5ffd83dbSDimitry Andric vec#".load_splat\t$off$p2align", simdop>; 75*5ffd83dbSDimitry Andric defm LOAD_SPLAT_#vec#_A64 : 76*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 77*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset64_op:$off, I64:$addr), 78*5ffd83dbSDimitry Andric (outs), 79*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset64_op:$off), [], 808bcb0991SDimitry Andric vec#".load_splat\t$dst, ${off}(${addr})$p2align", 818bcb0991SDimitry Andric vec#".load_splat\t$off$p2align", simdop>; 828bcb0991SDimitry Andric } 83*5ffd83dbSDimitry Andric} 848bcb0991SDimitry Andric 85*5ffd83dbSDimitry Andricdefm "" : SIMDLoadSplat<"v8x16", 7>; 86*5ffd83dbSDimitry Andricdefm "" : SIMDLoadSplat<"v16x8", 8>; 87*5ffd83dbSDimitry Andricdefm "" : SIMDLoadSplat<"v32x4", 9>; 88*5ffd83dbSDimitry Andricdefm "" : SIMDLoadSplat<"v64x2", 10>; 898bcb0991SDimitry Andric 90480093f4SDimitry Andricdef wasm_load_splat_t : SDTypeProfile<1, 1, [SDTCisPtrTy<1>]>; 91480093f4SDimitry Andricdef wasm_load_splat : SDNode<"WebAssemblyISD::LOAD_SPLAT", wasm_load_splat_t, 92480093f4SDimitry Andric [SDNPHasChain, SDNPMayLoad, SDNPMemOperand]>; 93480093f4SDimitry Andricdef load_splat : PatFrag<(ops node:$addr), (wasm_load_splat node:$addr)>; 948bcb0991SDimitry Andric 958bcb0991SDimitry Andricforeach args = [["v16i8", "v8x16"], ["v8i16", "v16x8"], ["v4i32", "v32x4"], 968bcb0991SDimitry Andric ["v2i64", "v64x2"], ["v4f32", "v32x4"], ["v2f64", "v64x2"]] in { 97*5ffd83dbSDimitry Andricdefm : LoadPatNoOffset<!cast<ValueType>(args[0]), 98480093f4SDimitry Andric load_splat, 99*5ffd83dbSDimitry Andric "LOAD_SPLAT_"#args[1]>; 100*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<!cast<ValueType>(args[0]), 101480093f4SDimitry Andric load_splat, 1028bcb0991SDimitry Andric regPlusImm, 103*5ffd83dbSDimitry Andric "LOAD_SPLAT_"#args[1]>; 104*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<!cast<ValueType>(args[0]), 105480093f4SDimitry Andric load_splat, 1068bcb0991SDimitry Andric or_is_add, 107*5ffd83dbSDimitry Andric "LOAD_SPLAT_"#args[1]>; 108*5ffd83dbSDimitry Andricdefm : LoadPatOffsetOnly<!cast<ValueType>(args[0]), 109480093f4SDimitry Andric load_splat, 110*5ffd83dbSDimitry Andric "LOAD_SPLAT_"#args[1]>; 111*5ffd83dbSDimitry Andricdefm : LoadPatGlobalAddrOffOnly<!cast<ValueType>(args[0]), 112480093f4SDimitry Andric load_splat, 113*5ffd83dbSDimitry Andric "LOAD_SPLAT_"#args[1]>; 1148bcb0991SDimitry Andric} 1158bcb0991SDimitry Andric 1168bcb0991SDimitry Andric// Load and extend 1178bcb0991SDimitry Andricmulticlass SIMDLoadExtend<ValueType vec_t, string name, bits<32> simdop> { 118*5ffd83dbSDimitry Andric let mayLoad = 1, UseNamedOperandTable = 1 in { 119*5ffd83dbSDimitry Andric defm LOAD_EXTEND_S_#vec_t#_A32 : 120*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 121*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset32_op:$off, I32:$addr), 1228bcb0991SDimitry Andric (outs), (ins P2Align:$p2align, offset32_op:$off), [], 1238bcb0991SDimitry Andric name#"_s\t$dst, ${off}(${addr})$p2align", 1248bcb0991SDimitry Andric name#"_s\t$off$p2align", simdop>; 125*5ffd83dbSDimitry Andric defm LOAD_EXTEND_U_#vec_t#_A32 : 126*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 127*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset32_op:$off, I32:$addr), 1288bcb0991SDimitry Andric (outs), (ins P2Align:$p2align, offset32_op:$off), [], 1298bcb0991SDimitry Andric name#"_u\t$dst, ${off}(${addr})$p2align", 1308bcb0991SDimitry Andric name#"_u\t$off$p2align", !add(simdop, 1)>; 131*5ffd83dbSDimitry Andric defm LOAD_EXTEND_S_#vec_t#_A64 : 132*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 133*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset64_op:$off, I64:$addr), 134*5ffd83dbSDimitry Andric (outs), (ins P2Align:$p2align, offset64_op:$off), [], 135*5ffd83dbSDimitry Andric name#"_s\t$dst, ${off}(${addr})$p2align", 136*5ffd83dbSDimitry Andric name#"_s\t$off$p2align", simdop>; 137*5ffd83dbSDimitry Andric defm LOAD_EXTEND_U_#vec_t#_A64 : 138*5ffd83dbSDimitry Andric SIMD_I<(outs V128:$dst), 139*5ffd83dbSDimitry Andric (ins P2Align:$p2align, offset64_op:$off, I64:$addr), 140*5ffd83dbSDimitry Andric (outs), (ins P2Align:$p2align, offset64_op:$off), [], 141*5ffd83dbSDimitry Andric name#"_u\t$dst, ${off}(${addr})$p2align", 142*5ffd83dbSDimitry Andric name#"_u\t$off$p2align", !add(simdop, 1)>; 1438bcb0991SDimitry Andric } 1448bcb0991SDimitry Andric} 1458bcb0991SDimitry Andric 146*5ffd83dbSDimitry Andricdefm "" : SIMDLoadExtend<v8i16, "i16x8.load8x8", 1>; 147*5ffd83dbSDimitry Andricdefm "" : SIMDLoadExtend<v4i32, "i32x4.load16x4", 3>; 148*5ffd83dbSDimitry Andricdefm "" : SIMDLoadExtend<v2i64, "i64x2.load32x2", 5>; 1498bcb0991SDimitry Andric 1508bcb0991SDimitry Andricforeach types = [[v8i16, i8], [v4i32, i16], [v2i64, i32]] in 1518bcb0991SDimitry Andricforeach exts = [["sextloadv", "_S"], 1528bcb0991SDimitry Andric ["zextloadv", "_U"], 1538bcb0991SDimitry Andric ["extloadv", "_U"]] in { 154*5ffd83dbSDimitry Andricdefm : LoadPatNoOffset<types[0], !cast<PatFrag>(exts[0]#types[1]), 155*5ffd83dbSDimitry Andric "LOAD_EXTEND"#exts[1]#"_"#types[0]>; 156*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<types[0], !cast<PatFrag>(exts[0]#types[1]), regPlusImm, 157*5ffd83dbSDimitry Andric "LOAD_EXTEND"#exts[1]#"_"#types[0]>; 158*5ffd83dbSDimitry Andricdefm : LoadPatImmOff<types[0], !cast<PatFrag>(exts[0]#types[1]), or_is_add, 159*5ffd83dbSDimitry Andric "LOAD_EXTEND"#exts[1]#"_"#types[0]>; 160*5ffd83dbSDimitry Andricdefm : LoadPatOffsetOnly<types[0], !cast<PatFrag>(exts[0]#types[1]), 161*5ffd83dbSDimitry Andric "LOAD_EXTEND"#exts[1]#"_"#types[0]>; 162*5ffd83dbSDimitry Andricdefm : LoadPatGlobalAddrOffOnly<types[0], !cast<PatFrag>(exts[0]#types[1]), 163*5ffd83dbSDimitry Andric "LOAD_EXTEND"#exts[1]#"_"#types[0]>; 1648bcb0991SDimitry Andric} 1658bcb0991SDimitry Andric 1668bcb0991SDimitry Andric 1670b57cec5SDimitry Andric// Store: v128.store 168*5ffd83dbSDimitry Andriclet mayStore = 1, UseNamedOperandTable = 1 in { 169*5ffd83dbSDimitry Andricdefm STORE_V128_A32 : 1700b57cec5SDimitry Andric SIMD_I<(outs), (ins P2Align:$p2align, offset32_op:$off, I32:$addr, V128:$vec), 1710b57cec5SDimitry Andric (outs), (ins P2Align:$p2align, offset32_op:$off), [], 1720b57cec5SDimitry Andric "v128.store\t${off}(${addr})$p2align, $vec", 173*5ffd83dbSDimitry Andric "v128.store\t$off$p2align", 11>; 174*5ffd83dbSDimitry Andricdefm STORE_V128_A64 : 175*5ffd83dbSDimitry Andric SIMD_I<(outs), (ins P2Align:$p2align, offset64_op:$off, I64:$addr, V128:$vec), 176*5ffd83dbSDimitry Andric (outs), (ins P2Align:$p2align, offset64_op:$off), [], 177*5ffd83dbSDimitry Andric "v128.store\t${off}(${addr})$p2align, $vec", 178*5ffd83dbSDimitry Andric "v128.store\t$off$p2align", 11>; 179*5ffd83dbSDimitry Andric} 1800b57cec5SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64] in { 1810b57cec5SDimitry Andric// Def load and store patterns from WebAssemblyInstrMemory.td for vector types 182*5ffd83dbSDimitry Andricdefm : StorePatNoOffset<vec_t, store, "STORE_V128">; 183*5ffd83dbSDimitry Andricdefm : StorePatImmOff<vec_t, store, regPlusImm, "STORE_V128">; 184*5ffd83dbSDimitry Andricdefm : StorePatImmOff<vec_t, store, or_is_add, "STORE_V128">; 185*5ffd83dbSDimitry Andricdefm : StorePatOffsetOnly<vec_t, store, "STORE_V128">; 186*5ffd83dbSDimitry Andricdefm : StorePatGlobalAddrOffOnly<vec_t, store, "STORE_V128">; 1870b57cec5SDimitry Andric} 1880b57cec5SDimitry Andric 1890b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 1900b57cec5SDimitry Andric// Constructing SIMD values 1910b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 1920b57cec5SDimitry Andric 1930b57cec5SDimitry Andric// Constant: v128.const 1940b57cec5SDimitry Andricmulticlass ConstVec<ValueType vec_t, dag ops, dag pat, string args> { 1950b57cec5SDimitry Andric let isMoveImm = 1, isReMaterializable = 1, 1968bcb0991SDimitry Andric Predicates = [HasUnimplementedSIMD128] in 1970b57cec5SDimitry Andric defm CONST_V128_#vec_t : SIMD_I<(outs V128:$dst), ops, (outs), ops, 1980b57cec5SDimitry Andric [(set V128:$dst, (vec_t pat))], 1990b57cec5SDimitry Andric "v128.const\t$dst, "#args, 200*5ffd83dbSDimitry Andric "v128.const\t"#args, 12>; 2010b57cec5SDimitry Andric} 2020b57cec5SDimitry Andric 2030b57cec5SDimitry Andricdefm "" : ConstVec<v16i8, 2040b57cec5SDimitry Andric (ins vec_i8imm_op:$i0, vec_i8imm_op:$i1, 2050b57cec5SDimitry Andric vec_i8imm_op:$i2, vec_i8imm_op:$i3, 2060b57cec5SDimitry Andric vec_i8imm_op:$i4, vec_i8imm_op:$i5, 2070b57cec5SDimitry Andric vec_i8imm_op:$i6, vec_i8imm_op:$i7, 2080b57cec5SDimitry Andric vec_i8imm_op:$i8, vec_i8imm_op:$i9, 2090b57cec5SDimitry Andric vec_i8imm_op:$iA, vec_i8imm_op:$iB, 2100b57cec5SDimitry Andric vec_i8imm_op:$iC, vec_i8imm_op:$iD, 2110b57cec5SDimitry Andric vec_i8imm_op:$iE, vec_i8imm_op:$iF), 2120b57cec5SDimitry Andric (build_vector ImmI8:$i0, ImmI8:$i1, ImmI8:$i2, ImmI8:$i3, 2130b57cec5SDimitry Andric ImmI8:$i4, ImmI8:$i5, ImmI8:$i6, ImmI8:$i7, 2140b57cec5SDimitry Andric ImmI8:$i8, ImmI8:$i9, ImmI8:$iA, ImmI8:$iB, 2150b57cec5SDimitry Andric ImmI8:$iC, ImmI8:$iD, ImmI8:$iE, ImmI8:$iF), 2160b57cec5SDimitry Andric !strconcat("$i0, $i1, $i2, $i3, $i4, $i5, $i6, $i7, ", 2170b57cec5SDimitry Andric "$i8, $i9, $iA, $iB, $iC, $iD, $iE, $iF")>; 2180b57cec5SDimitry Andricdefm "" : ConstVec<v8i16, 2190b57cec5SDimitry Andric (ins vec_i16imm_op:$i0, vec_i16imm_op:$i1, 2200b57cec5SDimitry Andric vec_i16imm_op:$i2, vec_i16imm_op:$i3, 2210b57cec5SDimitry Andric vec_i16imm_op:$i4, vec_i16imm_op:$i5, 2220b57cec5SDimitry Andric vec_i16imm_op:$i6, vec_i16imm_op:$i7), 2230b57cec5SDimitry Andric (build_vector 2240b57cec5SDimitry Andric ImmI16:$i0, ImmI16:$i1, ImmI16:$i2, ImmI16:$i3, 2250b57cec5SDimitry Andric ImmI16:$i4, ImmI16:$i5, ImmI16:$i6, ImmI16:$i7), 2260b57cec5SDimitry Andric "$i0, $i1, $i2, $i3, $i4, $i5, $i6, $i7">; 2270b57cec5SDimitry Andriclet IsCanonical = 1 in 2280b57cec5SDimitry Andricdefm "" : ConstVec<v4i32, 2290b57cec5SDimitry Andric (ins vec_i32imm_op:$i0, vec_i32imm_op:$i1, 2300b57cec5SDimitry Andric vec_i32imm_op:$i2, vec_i32imm_op:$i3), 2310b57cec5SDimitry Andric (build_vector (i32 imm:$i0), (i32 imm:$i1), 2320b57cec5SDimitry Andric (i32 imm:$i2), (i32 imm:$i3)), 2330b57cec5SDimitry Andric "$i0, $i1, $i2, $i3">; 2340b57cec5SDimitry Andricdefm "" : ConstVec<v2i64, 2350b57cec5SDimitry Andric (ins vec_i64imm_op:$i0, vec_i64imm_op:$i1), 2360b57cec5SDimitry Andric (build_vector (i64 imm:$i0), (i64 imm:$i1)), 2370b57cec5SDimitry Andric "$i0, $i1">; 2380b57cec5SDimitry Andricdefm "" : ConstVec<v4f32, 2390b57cec5SDimitry Andric (ins f32imm_op:$i0, f32imm_op:$i1, 2400b57cec5SDimitry Andric f32imm_op:$i2, f32imm_op:$i3), 2410b57cec5SDimitry Andric (build_vector (f32 fpimm:$i0), (f32 fpimm:$i1), 2420b57cec5SDimitry Andric (f32 fpimm:$i2), (f32 fpimm:$i3)), 2430b57cec5SDimitry Andric "$i0, $i1, $i2, $i3">; 2440b57cec5SDimitry Andricdefm "" : ConstVec<v2f64, 2450b57cec5SDimitry Andric (ins f64imm_op:$i0, f64imm_op:$i1), 2460b57cec5SDimitry Andric (build_vector (f64 fpimm:$i0), (f64 fpimm:$i1)), 2470b57cec5SDimitry Andric "$i0, $i1">; 2480b57cec5SDimitry Andric 2490b57cec5SDimitry Andric// Shuffle lanes: shuffle 2500b57cec5SDimitry Andricdefm SHUFFLE : 2510b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), 2520b57cec5SDimitry Andric (ins V128:$x, V128:$y, 2530b57cec5SDimitry Andric vec_i8imm_op:$m0, vec_i8imm_op:$m1, 2540b57cec5SDimitry Andric vec_i8imm_op:$m2, vec_i8imm_op:$m3, 2550b57cec5SDimitry Andric vec_i8imm_op:$m4, vec_i8imm_op:$m5, 2560b57cec5SDimitry Andric vec_i8imm_op:$m6, vec_i8imm_op:$m7, 2570b57cec5SDimitry Andric vec_i8imm_op:$m8, vec_i8imm_op:$m9, 2580b57cec5SDimitry Andric vec_i8imm_op:$mA, vec_i8imm_op:$mB, 2590b57cec5SDimitry Andric vec_i8imm_op:$mC, vec_i8imm_op:$mD, 2600b57cec5SDimitry Andric vec_i8imm_op:$mE, vec_i8imm_op:$mF), 2610b57cec5SDimitry Andric (outs), 2620b57cec5SDimitry Andric (ins 2630b57cec5SDimitry Andric vec_i8imm_op:$m0, vec_i8imm_op:$m1, 2640b57cec5SDimitry Andric vec_i8imm_op:$m2, vec_i8imm_op:$m3, 2650b57cec5SDimitry Andric vec_i8imm_op:$m4, vec_i8imm_op:$m5, 2660b57cec5SDimitry Andric vec_i8imm_op:$m6, vec_i8imm_op:$m7, 2670b57cec5SDimitry Andric vec_i8imm_op:$m8, vec_i8imm_op:$m9, 2680b57cec5SDimitry Andric vec_i8imm_op:$mA, vec_i8imm_op:$mB, 2690b57cec5SDimitry Andric vec_i8imm_op:$mC, vec_i8imm_op:$mD, 2700b57cec5SDimitry Andric vec_i8imm_op:$mE, vec_i8imm_op:$mF), 2710b57cec5SDimitry Andric [], 2720b57cec5SDimitry Andric "v8x16.shuffle\t$dst, $x, $y, "# 2730b57cec5SDimitry Andric "$m0, $m1, $m2, $m3, $m4, $m5, $m6, $m7, "# 2740b57cec5SDimitry Andric "$m8, $m9, $mA, $mB, $mC, $mD, $mE, $mF", 2750b57cec5SDimitry Andric "v8x16.shuffle\t"# 2760b57cec5SDimitry Andric "$m0, $m1, $m2, $m3, $m4, $m5, $m6, $m7, "# 2770b57cec5SDimitry Andric "$m8, $m9, $mA, $mB, $mC, $mD, $mE, $mF", 278*5ffd83dbSDimitry Andric 13>; 2790b57cec5SDimitry Andric 2800b57cec5SDimitry Andric// Shuffles after custom lowering 2810b57cec5SDimitry Andricdef wasm_shuffle_t : SDTypeProfile<1, 18, []>; 2820b57cec5SDimitry Andricdef wasm_shuffle : SDNode<"WebAssemblyISD::SHUFFLE", wasm_shuffle_t>; 2830b57cec5SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64] in { 2840b57cec5SDimitry Andricdef : Pat<(vec_t (wasm_shuffle (vec_t V128:$x), (vec_t V128:$y), 2850b57cec5SDimitry Andric (i32 LaneIdx32:$m0), (i32 LaneIdx32:$m1), 2860b57cec5SDimitry Andric (i32 LaneIdx32:$m2), (i32 LaneIdx32:$m3), 2870b57cec5SDimitry Andric (i32 LaneIdx32:$m4), (i32 LaneIdx32:$m5), 2880b57cec5SDimitry Andric (i32 LaneIdx32:$m6), (i32 LaneIdx32:$m7), 2890b57cec5SDimitry Andric (i32 LaneIdx32:$m8), (i32 LaneIdx32:$m9), 2900b57cec5SDimitry Andric (i32 LaneIdx32:$mA), (i32 LaneIdx32:$mB), 2910b57cec5SDimitry Andric (i32 LaneIdx32:$mC), (i32 LaneIdx32:$mD), 2920b57cec5SDimitry Andric (i32 LaneIdx32:$mE), (i32 LaneIdx32:$mF))), 2930b57cec5SDimitry Andric (vec_t (SHUFFLE (vec_t V128:$x), (vec_t V128:$y), 2940b57cec5SDimitry Andric (i32 LaneIdx32:$m0), (i32 LaneIdx32:$m1), 2950b57cec5SDimitry Andric (i32 LaneIdx32:$m2), (i32 LaneIdx32:$m3), 2960b57cec5SDimitry Andric (i32 LaneIdx32:$m4), (i32 LaneIdx32:$m5), 2970b57cec5SDimitry Andric (i32 LaneIdx32:$m6), (i32 LaneIdx32:$m7), 2980b57cec5SDimitry Andric (i32 LaneIdx32:$m8), (i32 LaneIdx32:$m9), 2990b57cec5SDimitry Andric (i32 LaneIdx32:$mA), (i32 LaneIdx32:$mB), 3000b57cec5SDimitry Andric (i32 LaneIdx32:$mC), (i32 LaneIdx32:$mD), 3010b57cec5SDimitry Andric (i32 LaneIdx32:$mE), (i32 LaneIdx32:$mF)))>; 3020b57cec5SDimitry Andric} 3030b57cec5SDimitry Andric 3048bcb0991SDimitry Andric// Swizzle lanes: v8x16.swizzle 3058bcb0991SDimitry Andricdef wasm_swizzle_t : SDTypeProfile<1, 2, []>; 3068bcb0991SDimitry Andricdef wasm_swizzle : SDNode<"WebAssemblyISD::SWIZZLE", wasm_swizzle_t>; 3078bcb0991SDimitry Andricdefm SWIZZLE : 3088bcb0991SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$src, V128:$mask), (outs), (ins), 3098bcb0991SDimitry Andric [(set (v16i8 V128:$dst), 3108bcb0991SDimitry Andric (wasm_swizzle (v16i8 V128:$src), (v16i8 V128:$mask)))], 311*5ffd83dbSDimitry Andric "v8x16.swizzle\t$dst, $src, $mask", "v8x16.swizzle", 14>; 3128bcb0991SDimitry Andric 3138bcb0991SDimitry Andricdef : Pat<(int_wasm_swizzle (v16i8 V128:$src), (v16i8 V128:$mask)), 3148bcb0991SDimitry Andric (SWIZZLE V128:$src, V128:$mask)>; 3158bcb0991SDimitry Andric 3160b57cec5SDimitry Andric// Create vector with identical lanes: splat 3170b57cec5SDimitry Andricdef splat2 : PatFrag<(ops node:$x), (build_vector node:$x, node:$x)>; 3180b57cec5SDimitry Andricdef splat4 : PatFrag<(ops node:$x), (build_vector 3190b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x)>; 3200b57cec5SDimitry Andricdef splat8 : PatFrag<(ops node:$x), (build_vector 3210b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x, 3220b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x)>; 3230b57cec5SDimitry Andricdef splat16 : PatFrag<(ops node:$x), (build_vector 3240b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x, 3250b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x, 3260b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x, 3270b57cec5SDimitry Andric node:$x, node:$x, node:$x, node:$x)>; 3280b57cec5SDimitry Andric 3290b57cec5SDimitry Andricmulticlass Splat<ValueType vec_t, string vec, WebAssemblyRegClass reg_t, 3300b57cec5SDimitry Andric PatFrag splat_pat, bits<32> simdop> { 3310b57cec5SDimitry Andric defm SPLAT_#vec_t : SIMD_I<(outs V128:$dst), (ins reg_t:$x), (outs), (ins), 3320b57cec5SDimitry Andric [(set (vec_t V128:$dst), (splat_pat reg_t:$x))], 3330b57cec5SDimitry Andric vec#".splat\t$dst, $x", vec#".splat", simdop>; 3340b57cec5SDimitry Andric} 3350b57cec5SDimitry Andric 336*5ffd83dbSDimitry Andricdefm "" : Splat<v16i8, "i8x16", I32, splat16, 15>; 337*5ffd83dbSDimitry Andricdefm "" : Splat<v8i16, "i16x8", I32, splat8, 16>; 338*5ffd83dbSDimitry Andricdefm "" : Splat<v4i32, "i32x4", I32, splat4, 17>; 339*5ffd83dbSDimitry Andricdefm "" : Splat<v2i64, "i64x2", I64, splat2, 18>; 340*5ffd83dbSDimitry Andricdefm "" : Splat<v4f32, "f32x4", F32, splat4, 19>; 341*5ffd83dbSDimitry Andricdefm "" : Splat<v2f64, "f64x2", F64, splat2, 20>; 3420b57cec5SDimitry Andric 3430b57cec5SDimitry Andric// scalar_to_vector leaves high lanes undefined, so can be a splat 3440b57cec5SDimitry Andricclass ScalarSplatPat<ValueType vec_t, ValueType lane_t, 3450b57cec5SDimitry Andric WebAssemblyRegClass reg_t> : 3460b57cec5SDimitry Andric Pat<(vec_t (scalar_to_vector (lane_t reg_t:$x))), 3470b57cec5SDimitry Andric (!cast<Instruction>("SPLAT_"#vec_t) reg_t:$x)>; 3480b57cec5SDimitry Andric 3490b57cec5SDimitry Andricdef : ScalarSplatPat<v16i8, i32, I32>; 3500b57cec5SDimitry Andricdef : ScalarSplatPat<v8i16, i32, I32>; 3510b57cec5SDimitry Andricdef : ScalarSplatPat<v4i32, i32, I32>; 3520b57cec5SDimitry Andricdef : ScalarSplatPat<v2i64, i64, I64>; 3530b57cec5SDimitry Andricdef : ScalarSplatPat<v4f32, f32, F32>; 3540b57cec5SDimitry Andricdef : ScalarSplatPat<v2f64, f64, F64>; 3550b57cec5SDimitry Andric 3560b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3570b57cec5SDimitry Andric// Accessing lanes 3580b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3590b57cec5SDimitry Andric 3600b57cec5SDimitry Andric// Extract lane as a scalar: extract_lane / extract_lane_s / extract_lane_u 361*5ffd83dbSDimitry Andricmulticlass ExtractLane<ValueType vec_t, string vec, WebAssemblyRegClass reg_t, 362*5ffd83dbSDimitry Andric bits<32> simdop, string suffix = ""> { 3630b57cec5SDimitry Andric defm EXTRACT_LANE_#vec_t#suffix : 3640b57cec5SDimitry Andric SIMD_I<(outs reg_t:$dst), (ins V128:$vec, vec_i8imm_op:$idx), 365*5ffd83dbSDimitry Andric (outs), (ins vec_i8imm_op:$idx), [], 3660b57cec5SDimitry Andric vec#".extract_lane"#suffix#"\t$dst, $vec, $idx", 3670b57cec5SDimitry Andric vec#".extract_lane"#suffix#"\t$idx", simdop>; 3680b57cec5SDimitry Andric} 3690b57cec5SDimitry Andric 370*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v16i8, "i8x16", I32, 21, "_s">; 371*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v16i8, "i8x16", I32, 22, "_u">; 372*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v8i16, "i16x8", I32, 24, "_s">; 373*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v8i16, "i16x8", I32, 25, "_u">; 374*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v4i32, "i32x4", I32, 27>; 375*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v2i64, "i64x2", I64, 29>; 376*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v4f32, "f32x4", F32, 31>; 377*5ffd83dbSDimitry Andricdefm "" : ExtractLane<v2f64, "f64x2", F64, 33>; 3780b57cec5SDimitry Andric 379*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v16i8 V128:$vec), (i32 LaneIdx16:$idx)), 380*5ffd83dbSDimitry Andric (EXTRACT_LANE_v16i8_u V128:$vec, imm:$idx)>; 381*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v8i16 V128:$vec), (i32 LaneIdx8:$idx)), 382*5ffd83dbSDimitry Andric (EXTRACT_LANE_v8i16_u V128:$vec, imm:$idx)>; 383*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v4i32 V128:$vec), (i32 LaneIdx4:$idx)), 384*5ffd83dbSDimitry Andric (EXTRACT_LANE_v4i32 V128:$vec, imm:$idx)>; 385*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v4f32 V128:$vec), (i32 LaneIdx4:$idx)), 386*5ffd83dbSDimitry Andric (EXTRACT_LANE_v4f32 V128:$vec, imm:$idx)>; 387*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v2i64 V128:$vec), (i32 LaneIdx2:$idx)), 388*5ffd83dbSDimitry Andric (EXTRACT_LANE_v2i64 V128:$vec, imm:$idx)>; 389*5ffd83dbSDimitry Andricdef : Pat<(vector_extract (v2f64 V128:$vec), (i32 LaneIdx2:$idx)), 390*5ffd83dbSDimitry Andric (EXTRACT_LANE_v2f64 V128:$vec, imm:$idx)>; 3910b57cec5SDimitry Andric 392*5ffd83dbSDimitry Andricdef : Pat< 393*5ffd83dbSDimitry Andric (sext_inreg (vector_extract (v16i8 V128:$vec), (i32 LaneIdx16:$idx)), i8), 394*5ffd83dbSDimitry Andric (EXTRACT_LANE_v16i8_s V128:$vec, imm:$idx)>; 395*5ffd83dbSDimitry Andricdef : Pat< 396*5ffd83dbSDimitry Andric (and (vector_extract (v16i8 V128:$vec), (i32 LaneIdx16:$idx)), (i32 0xff)), 397*5ffd83dbSDimitry Andric (EXTRACT_LANE_v16i8_u V128:$vec, imm:$idx)>; 398*5ffd83dbSDimitry Andricdef : Pat< 399*5ffd83dbSDimitry Andric (sext_inreg (vector_extract (v8i16 V128:$vec), (i32 LaneIdx8:$idx)), i16), 400*5ffd83dbSDimitry Andric (EXTRACT_LANE_v8i16_s V128:$vec, imm:$idx)>; 401*5ffd83dbSDimitry Andricdef : Pat< 402*5ffd83dbSDimitry Andric (and (vector_extract (v8i16 V128:$vec), (i32 LaneIdx8:$idx)), (i32 0xffff)), 403*5ffd83dbSDimitry Andric (EXTRACT_LANE_v8i16_u V128:$vec, imm:$idx)>; 4040b57cec5SDimitry Andric 4050b57cec5SDimitry Andric// Replace lane value: replace_lane 4060b57cec5SDimitry Andricmulticlass ReplaceLane<ValueType vec_t, string vec, ImmLeaf imm_t, 4070b57cec5SDimitry Andric WebAssemblyRegClass reg_t, ValueType lane_t, 4080b57cec5SDimitry Andric bits<32> simdop> { 4090b57cec5SDimitry Andric defm REPLACE_LANE_#vec_t : 4100b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$vec, vec_i8imm_op:$idx, reg_t:$x), 4110b57cec5SDimitry Andric (outs), (ins vec_i8imm_op:$idx), 4120b57cec5SDimitry Andric [(set V128:$dst, (vector_insert 4130b57cec5SDimitry Andric (vec_t V128:$vec), (lane_t reg_t:$x), (i32 imm_t:$idx)))], 4140b57cec5SDimitry Andric vec#".replace_lane\t$dst, $vec, $idx, $x", 4150b57cec5SDimitry Andric vec#".replace_lane\t$idx", simdop>; 4160b57cec5SDimitry Andric} 4170b57cec5SDimitry Andric 418*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v16i8, "i8x16", LaneIdx16, I32, i32, 23>; 419*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v8i16, "i16x8", LaneIdx8, I32, i32, 26>; 420*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v4i32, "i32x4", LaneIdx4, I32, i32, 28>; 421*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v2i64, "i64x2", LaneIdx2, I64, i64, 30>; 422*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v4f32, "f32x4", LaneIdx4, F32, f32, 32>; 423*5ffd83dbSDimitry Andricdefm "" : ReplaceLane<v2f64, "f64x2", LaneIdx2, F64, f64, 34>; 4240b57cec5SDimitry Andric 4250b57cec5SDimitry Andric// Lower undef lane indices to zero 4260b57cec5SDimitry Andricdef : Pat<(vector_insert (v16i8 V128:$vec), I32:$x, undef), 4270b57cec5SDimitry Andric (REPLACE_LANE_v16i8 V128:$vec, 0, I32:$x)>; 4280b57cec5SDimitry Andricdef : Pat<(vector_insert (v8i16 V128:$vec), I32:$x, undef), 4290b57cec5SDimitry Andric (REPLACE_LANE_v8i16 V128:$vec, 0, I32:$x)>; 4300b57cec5SDimitry Andricdef : Pat<(vector_insert (v4i32 V128:$vec), I32:$x, undef), 4310b57cec5SDimitry Andric (REPLACE_LANE_v4i32 V128:$vec, 0, I32:$x)>; 4320b57cec5SDimitry Andricdef : Pat<(vector_insert (v2i64 V128:$vec), I64:$x, undef), 4330b57cec5SDimitry Andric (REPLACE_LANE_v2i64 V128:$vec, 0, I64:$x)>; 4340b57cec5SDimitry Andricdef : Pat<(vector_insert (v4f32 V128:$vec), F32:$x, undef), 4350b57cec5SDimitry Andric (REPLACE_LANE_v4f32 V128:$vec, 0, F32:$x)>; 4360b57cec5SDimitry Andricdef : Pat<(vector_insert (v2f64 V128:$vec), F64:$x, undef), 4370b57cec5SDimitry Andric (REPLACE_LANE_v2f64 V128:$vec, 0, F64:$x)>; 4380b57cec5SDimitry Andric 4390b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 4400b57cec5SDimitry Andric// Comparisons 4410b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 4420b57cec5SDimitry Andric 4430b57cec5SDimitry Andricmulticlass SIMDCondition<ValueType vec_t, ValueType out_t, string vec, 4440b57cec5SDimitry Andric string name, CondCode cond, bits<32> simdop> { 4450b57cec5SDimitry Andric defm _#vec_t : 4460b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$lhs, V128:$rhs), (outs), (ins), 4470b57cec5SDimitry Andric [(set (out_t V128:$dst), 4480b57cec5SDimitry Andric (setcc (vec_t V128:$lhs), (vec_t V128:$rhs), cond) 4490b57cec5SDimitry Andric )], 4500b57cec5SDimitry Andric vec#"."#name#"\t$dst, $lhs, $rhs", vec#"."#name, simdop>; 4510b57cec5SDimitry Andric} 4520b57cec5SDimitry Andric 4530b57cec5SDimitry Andricmulticlass SIMDConditionInt<string name, CondCode cond, bits<32> baseInst> { 4540b57cec5SDimitry Andric defm "" : SIMDCondition<v16i8, v16i8, "i8x16", name, cond, baseInst>; 4550b57cec5SDimitry Andric defm "" : SIMDCondition<v8i16, v8i16, "i16x8", name, cond, 4560b57cec5SDimitry Andric !add(baseInst, 10)>; 4570b57cec5SDimitry Andric defm "" : SIMDCondition<v4i32, v4i32, "i32x4", name, cond, 4580b57cec5SDimitry Andric !add(baseInst, 20)>; 4590b57cec5SDimitry Andric} 4600b57cec5SDimitry Andric 4610b57cec5SDimitry Andricmulticlass SIMDConditionFP<string name, CondCode cond, bits<32> baseInst> { 4620b57cec5SDimitry Andric defm "" : SIMDCondition<v4f32, v4i32, "f32x4", name, cond, baseInst>; 4630b57cec5SDimitry Andric defm "" : SIMDCondition<v2f64, v2i64, "f64x2", name, cond, 4640b57cec5SDimitry Andric !add(baseInst, 6)>; 4650b57cec5SDimitry Andric} 4660b57cec5SDimitry Andric 4670b57cec5SDimitry Andric// Equality: eq 4680b57cec5SDimitry Andriclet isCommutable = 1 in { 469*5ffd83dbSDimitry Andricdefm EQ : SIMDConditionInt<"eq", SETEQ, 35>; 470*5ffd83dbSDimitry Andricdefm EQ : SIMDConditionFP<"eq", SETOEQ, 65>; 4710b57cec5SDimitry Andric} // isCommutable = 1 4720b57cec5SDimitry Andric 4730b57cec5SDimitry Andric// Non-equality: ne 4740b57cec5SDimitry Andriclet isCommutable = 1 in { 475*5ffd83dbSDimitry Andricdefm NE : SIMDConditionInt<"ne", SETNE, 36>; 476*5ffd83dbSDimitry Andricdefm NE : SIMDConditionFP<"ne", SETUNE, 66>; 4770b57cec5SDimitry Andric} // isCommutable = 1 4780b57cec5SDimitry Andric 4790b57cec5SDimitry Andric// Less than: lt_s / lt_u / lt 480*5ffd83dbSDimitry Andricdefm LT_S : SIMDConditionInt<"lt_s", SETLT, 37>; 481*5ffd83dbSDimitry Andricdefm LT_U : SIMDConditionInt<"lt_u", SETULT, 38>; 482*5ffd83dbSDimitry Andricdefm LT : SIMDConditionFP<"lt", SETOLT, 67>; 4830b57cec5SDimitry Andric 4840b57cec5SDimitry Andric// Greater than: gt_s / gt_u / gt 485*5ffd83dbSDimitry Andricdefm GT_S : SIMDConditionInt<"gt_s", SETGT, 39>; 486*5ffd83dbSDimitry Andricdefm GT_U : SIMDConditionInt<"gt_u", SETUGT, 40>; 487*5ffd83dbSDimitry Andricdefm GT : SIMDConditionFP<"gt", SETOGT, 68>; 4880b57cec5SDimitry Andric 4890b57cec5SDimitry Andric// Less than or equal: le_s / le_u / le 490*5ffd83dbSDimitry Andricdefm LE_S : SIMDConditionInt<"le_s", SETLE, 41>; 491*5ffd83dbSDimitry Andricdefm LE_U : SIMDConditionInt<"le_u", SETULE, 42>; 492*5ffd83dbSDimitry Andricdefm LE : SIMDConditionFP<"le", SETOLE, 69>; 4930b57cec5SDimitry Andric 4940b57cec5SDimitry Andric// Greater than or equal: ge_s / ge_u / ge 495*5ffd83dbSDimitry Andricdefm GE_S : SIMDConditionInt<"ge_s", SETGE, 43>; 496*5ffd83dbSDimitry Andricdefm GE_U : SIMDConditionInt<"ge_u", SETUGE, 44>; 497*5ffd83dbSDimitry Andricdefm GE : SIMDConditionFP<"ge", SETOGE, 70>; 4980b57cec5SDimitry Andric 4990b57cec5SDimitry Andric// Lower float comparisons that don't care about NaN to standard WebAssembly 5000b57cec5SDimitry Andric// float comparisons. These instructions are generated with nnan and in the 5010b57cec5SDimitry Andric// target-independent expansion of unordered comparisons and ordered ne. 5020b57cec5SDimitry Andricforeach nodes = [[seteq, EQ_v4f32], [setne, NE_v4f32], [setlt, LT_v4f32], 5030b57cec5SDimitry Andric [setgt, GT_v4f32], [setle, LE_v4f32], [setge, GE_v4f32]] in 5040b57cec5SDimitry Andricdef : Pat<(v4i32 (nodes[0] (v4f32 V128:$lhs), (v4f32 V128:$rhs))), 5050b57cec5SDimitry Andric (v4i32 (nodes[1] (v4f32 V128:$lhs), (v4f32 V128:$rhs)))>; 5060b57cec5SDimitry Andric 5070b57cec5SDimitry Andricforeach nodes = [[seteq, EQ_v2f64], [setne, NE_v2f64], [setlt, LT_v2f64], 5080b57cec5SDimitry Andric [setgt, GT_v2f64], [setle, LE_v2f64], [setge, GE_v2f64]] in 5090b57cec5SDimitry Andricdef : Pat<(v2i64 (nodes[0] (v2f64 V128:$lhs), (v2f64 V128:$rhs))), 5100b57cec5SDimitry Andric (v2i64 (nodes[1] (v2f64 V128:$lhs), (v2f64 V128:$rhs)))>; 5110b57cec5SDimitry Andric 5120b57cec5SDimitry Andric 5130b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 5140b57cec5SDimitry Andric// Bitwise operations 5150b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 5160b57cec5SDimitry Andric 5170b57cec5SDimitry Andricmulticlass SIMDBinary<ValueType vec_t, string vec, SDNode node, string name, 5180b57cec5SDimitry Andric bits<32> simdop> { 5190b57cec5SDimitry Andric defm _#vec_t : SIMD_I<(outs V128:$dst), (ins V128:$lhs, V128:$rhs), 5200b57cec5SDimitry Andric (outs), (ins), 5210b57cec5SDimitry Andric [(set (vec_t V128:$dst), 5220b57cec5SDimitry Andric (node (vec_t V128:$lhs), (vec_t V128:$rhs)) 5230b57cec5SDimitry Andric )], 5240b57cec5SDimitry Andric vec#"."#name#"\t$dst, $lhs, $rhs", vec#"."#name, 5250b57cec5SDimitry Andric simdop>; 5260b57cec5SDimitry Andric} 5270b57cec5SDimitry Andric 5280b57cec5SDimitry Andricmulticlass SIMDBitwise<SDNode node, string name, bits<32> simdop> { 5290b57cec5SDimitry Andric defm "" : SIMDBinary<v16i8, "v128", node, name, simdop>; 5300b57cec5SDimitry Andric defm "" : SIMDBinary<v8i16, "v128", node, name, simdop>; 5310b57cec5SDimitry Andric defm "" : SIMDBinary<v4i32, "v128", node, name, simdop>; 5320b57cec5SDimitry Andric defm "" : SIMDBinary<v2i64, "v128", node, name, simdop>; 5330b57cec5SDimitry Andric} 5340b57cec5SDimitry Andric 5350b57cec5SDimitry Andricmulticlass SIMDUnary<ValueType vec_t, string vec, SDNode node, string name, 5360b57cec5SDimitry Andric bits<32> simdop> { 5370b57cec5SDimitry Andric defm _#vec_t : SIMD_I<(outs V128:$dst), (ins V128:$vec), (outs), (ins), 5380b57cec5SDimitry Andric [(set (vec_t V128:$dst), 5390b57cec5SDimitry Andric (vec_t (node (vec_t V128:$vec))) 5400b57cec5SDimitry Andric )], 5410b57cec5SDimitry Andric vec#"."#name#"\t$dst, $vec", vec#"."#name, simdop>; 5420b57cec5SDimitry Andric} 5430b57cec5SDimitry Andric 5440b57cec5SDimitry Andric// Bitwise logic: v128.not 5450b57cec5SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64] in 546*5ffd83dbSDimitry Andricdefm NOT: SIMDUnary<vec_t, "v128", vnot, "not", 77>; 5470b57cec5SDimitry Andric 5480b57cec5SDimitry Andric// Bitwise logic: v128.and / v128.or / v128.xor 5490b57cec5SDimitry Andriclet isCommutable = 1 in { 550*5ffd83dbSDimitry Andricdefm AND : SIMDBitwise<and, "and", 78>; 551*5ffd83dbSDimitry Andricdefm OR : SIMDBitwise<or, "or", 80>; 552*5ffd83dbSDimitry Andricdefm XOR : SIMDBitwise<xor, "xor", 81>; 5530b57cec5SDimitry Andric} // isCommutable = 1 5540b57cec5SDimitry Andric 5558bcb0991SDimitry Andric// Bitwise logic: v128.andnot 5568bcb0991SDimitry Andricdef andnot : PatFrag<(ops node:$left, node:$right), (and $left, (vnot $right))>; 557*5ffd83dbSDimitry Andricdefm ANDNOT : SIMDBitwise<andnot, "andnot", 79>; 5588bcb0991SDimitry Andric 5590b57cec5SDimitry Andric// Bitwise select: v128.bitselect 5600b57cec5SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64] in 5610b57cec5SDimitry Andric defm BITSELECT_#vec_t : 5620b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$v1, V128:$v2, V128:$c), (outs), (ins), 5630b57cec5SDimitry Andric [(set (vec_t V128:$dst), 5640b57cec5SDimitry Andric (vec_t (int_wasm_bitselect 5650b57cec5SDimitry Andric (vec_t V128:$v1), (vec_t V128:$v2), (vec_t V128:$c) 5660b57cec5SDimitry Andric )) 5670b57cec5SDimitry Andric )], 568*5ffd83dbSDimitry Andric "v128.bitselect\t$dst, $v1, $v2, $c", "v128.bitselect", 82>; 5690b57cec5SDimitry Andric 5700b57cec5SDimitry Andric// Bitselect is equivalent to (c & v1) | (~c & v2) 5710b57cec5SDimitry Andricforeach vec_t = [v16i8, v8i16, v4i32, v2i64] in 5720b57cec5SDimitry Andric def : Pat<(vec_t (or (and (vec_t V128:$c), (vec_t V128:$v1)), 5730b57cec5SDimitry Andric (and (vnot V128:$c), (vec_t V128:$v2)))), 5740b57cec5SDimitry Andric (!cast<Instruction>("BITSELECT_"#vec_t) 5750b57cec5SDimitry Andric V128:$v1, V128:$v2, V128:$c)>; 5760b57cec5SDimitry Andric 5770b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 5780b57cec5SDimitry Andric// Integer unary arithmetic 5790b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 5800b57cec5SDimitry Andric 5810b57cec5SDimitry Andricmulticlass SIMDUnaryInt<SDNode node, string name, bits<32> baseInst> { 5820b57cec5SDimitry Andric defm "" : SIMDUnary<v16i8, "i8x16", node, name, baseInst>; 583*5ffd83dbSDimitry Andric defm "" : SIMDUnary<v8i16, "i16x8", node, name, !add(baseInst, 32)>; 584*5ffd83dbSDimitry Andric defm "" : SIMDUnary<v4i32, "i32x4", node, name, !add(baseInst, 64)>; 585*5ffd83dbSDimitry Andric defm "" : SIMDUnary<v2i64, "i64x2", node, name, !add(baseInst, 96)>; 5860b57cec5SDimitry Andric} 5870b57cec5SDimitry Andric 5880b57cec5SDimitry Andricmulticlass SIMDReduceVec<ValueType vec_t, string vec, SDNode op, string name, 5890b57cec5SDimitry Andric bits<32> simdop> { 5900b57cec5SDimitry Andric defm _#vec_t : SIMD_I<(outs I32:$dst), (ins V128:$vec), (outs), (ins), 5910b57cec5SDimitry Andric [(set I32:$dst, (i32 (op (vec_t V128:$vec))))], 5920b57cec5SDimitry Andric vec#"."#name#"\t$dst, $vec", vec#"."#name, simdop>; 5930b57cec5SDimitry Andric} 5940b57cec5SDimitry Andric 5950b57cec5SDimitry Andricmulticlass SIMDReduce<SDNode op, string name, bits<32> baseInst> { 5960b57cec5SDimitry Andric defm "" : SIMDReduceVec<v16i8, "i8x16", op, name, baseInst>; 597*5ffd83dbSDimitry Andric defm "" : SIMDReduceVec<v8i16, "i16x8", op, name, !add(baseInst, 32)>; 598*5ffd83dbSDimitry Andric defm "" : SIMDReduceVec<v4i32, "i32x4", op, name, !add(baseInst, 64)>; 599*5ffd83dbSDimitry Andric defm "" : SIMDReduceVec<v2i64, "i64x2", op, name, !add(baseInst, 96)>; 6000b57cec5SDimitry Andric} 6010b57cec5SDimitry Andric 6020b57cec5SDimitry Andric// Integer vector negation 6030b57cec5SDimitry Andricdef ivneg : PatFrag<(ops node:$in), (sub immAllZerosV, node:$in)>; 6040b57cec5SDimitry Andric 605*5ffd83dbSDimitry Andric// Integer absolute value: abs 606*5ffd83dbSDimitry Andricdefm ABS : SIMDUnaryInt<abs, "abs", 96>; 607*5ffd83dbSDimitry Andric 6080b57cec5SDimitry Andric// Integer negation: neg 609*5ffd83dbSDimitry Andricdefm NEG : SIMDUnaryInt<ivneg, "neg", 97>; 6100b57cec5SDimitry Andric 6110b57cec5SDimitry Andric// Any lane true: any_true 612*5ffd83dbSDimitry Andricdefm ANYTRUE : SIMDReduce<int_wasm_anytrue, "any_true", 98>; 6130b57cec5SDimitry Andric 6140b57cec5SDimitry Andric// All lanes true: all_true 615*5ffd83dbSDimitry Andricdefm ALLTRUE : SIMDReduce<int_wasm_alltrue, "all_true", 99>; 6160b57cec5SDimitry Andric 6170b57cec5SDimitry Andric// Reductions already return 0 or 1, so and 1, setne 0, and seteq 1 6180b57cec5SDimitry Andric// can be folded out 6190b57cec5SDimitry Andricforeach reduction = 6200b57cec5SDimitry Andric [["int_wasm_anytrue", "ANYTRUE"], ["int_wasm_alltrue", "ALLTRUE"]] in 6210b57cec5SDimitry Andricforeach ty = [v16i8, v8i16, v4i32, v2i64] in { 6220b57cec5SDimitry Andricdef : Pat<(i32 (and 6230b57cec5SDimitry Andric (i32 (!cast<Intrinsic>(reduction[0]) (ty V128:$x))), 6240b57cec5SDimitry Andric (i32 1) 6250b57cec5SDimitry Andric )), 6260b57cec5SDimitry Andric (i32 (!cast<NI>(reduction[1]#"_"#ty) (ty V128:$x)))>; 6270b57cec5SDimitry Andricdef : Pat<(i32 (setne 6280b57cec5SDimitry Andric (i32 (!cast<Intrinsic>(reduction[0]) (ty V128:$x))), 6290b57cec5SDimitry Andric (i32 0) 6300b57cec5SDimitry Andric )), 6310b57cec5SDimitry Andric (i32 (!cast<NI>(reduction[1]#"_"#ty) (ty V128:$x)))>; 6320b57cec5SDimitry Andricdef : Pat<(i32 (seteq 6330b57cec5SDimitry Andric (i32 (!cast<Intrinsic>(reduction[0]) (ty V128:$x))), 6340b57cec5SDimitry Andric (i32 1) 6350b57cec5SDimitry Andric )), 6360b57cec5SDimitry Andric (i32 (!cast<NI>(reduction[1]#"_"#ty) (ty V128:$x)))>; 6370b57cec5SDimitry Andric} 6380b57cec5SDimitry Andric 639*5ffd83dbSDimitry Andricmulticlass SIMDBitmask<ValueType vec_t, string vec, bits<32> simdop> { 640*5ffd83dbSDimitry Andric defm _#vec_t : SIMD_I<(outs I32:$dst), (ins V128:$vec), (outs), (ins), 641*5ffd83dbSDimitry Andric [(set I32:$dst, 642*5ffd83dbSDimitry Andric (i32 (int_wasm_bitmask (vec_t V128:$vec))) 643*5ffd83dbSDimitry Andric )], 644*5ffd83dbSDimitry Andric vec#".bitmask\t$dst, $vec", vec#".bitmask", simdop>; 645*5ffd83dbSDimitry Andric} 646*5ffd83dbSDimitry Andric 647*5ffd83dbSDimitry Andricdefm BITMASK : SIMDBitmask<v16i8, "i8x16", 100>; 648*5ffd83dbSDimitry Andricdefm BITMASK : SIMDBitmask<v8i16, "i16x8", 132>; 649*5ffd83dbSDimitry Andricdefm BITMASK : SIMDBitmask<v4i32, "i32x4", 164>; 650*5ffd83dbSDimitry Andric 6510b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 6520b57cec5SDimitry Andric// Bit shifts 6530b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 6540b57cec5SDimitry Andric 655*5ffd83dbSDimitry Andricmulticlass SIMDShift<ValueType vec_t, string vec, SDNode node, string name, 656*5ffd83dbSDimitry Andric bits<32> simdop> { 6570b57cec5SDimitry Andric defm _#vec_t : SIMD_I<(outs V128:$dst), (ins V128:$vec, I32:$x), 6580b57cec5SDimitry Andric (outs), (ins), 659*5ffd83dbSDimitry Andric [(set (vec_t V128:$dst), (node V128:$vec, I32:$x))], 6600b57cec5SDimitry Andric vec#"."#name#"\t$dst, $vec, $x", vec#"."#name, simdop>; 6610b57cec5SDimitry Andric} 6620b57cec5SDimitry Andric 6630b57cec5SDimitry Andricmulticlass SIMDShiftInt<SDNode node, string name, bits<32> baseInst> { 664*5ffd83dbSDimitry Andric defm "" : SIMDShift<v16i8, "i8x16", node, name, baseInst>; 665*5ffd83dbSDimitry Andric defm "" : SIMDShift<v8i16, "i16x8", node, name, !add(baseInst, 32)>; 666*5ffd83dbSDimitry Andric defm "" : SIMDShift<v4i32, "i32x4", node, name, !add(baseInst, 64)>; 667*5ffd83dbSDimitry Andric defm "" : SIMDShift<v2i64, "i64x2", node, name, !add(baseInst, 96)>; 6680b57cec5SDimitry Andric} 6690b57cec5SDimitry Andric 670*5ffd83dbSDimitry Andric// WebAssembly SIMD shifts are nonstandard in that the shift amount is 671*5ffd83dbSDimitry Andric// an i32 rather than a vector, so they need custom nodes. 6720b57cec5SDimitry Andricdef wasm_shift_t : SDTypeProfile<1, 2, 6730b57cec5SDimitry Andric [SDTCisVec<0>, SDTCisSameAs<0, 1>, SDTCisVT<2, i32>] 6740b57cec5SDimitry Andric>; 6750b57cec5SDimitry Andricdef wasm_shl : SDNode<"WebAssemblyISD::VEC_SHL", wasm_shift_t>; 6760b57cec5SDimitry Andricdef wasm_shr_s : SDNode<"WebAssemblyISD::VEC_SHR_S", wasm_shift_t>; 6770b57cec5SDimitry Andricdef wasm_shr_u : SDNode<"WebAssemblyISD::VEC_SHR_U", wasm_shift_t>; 678*5ffd83dbSDimitry Andric 679*5ffd83dbSDimitry Andric// Left shift by scalar: shl 680*5ffd83dbSDimitry Andricdefm SHL : SIMDShiftInt<wasm_shl, "shl", 107>; 681*5ffd83dbSDimitry Andric 682*5ffd83dbSDimitry Andric// Right shift by scalar: shr_s / shr_u 683*5ffd83dbSDimitry Andricdefm SHR_S : SIMDShiftInt<wasm_shr_s, "shr_s", 108>; 684*5ffd83dbSDimitry Andricdefm SHR_U : SIMDShiftInt<wasm_shr_u, "shr_u", 109>; 6850b57cec5SDimitry Andric 6860b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 6870b57cec5SDimitry Andric// Integer binary arithmetic 6880b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 6890b57cec5SDimitry Andric 690*5ffd83dbSDimitry Andricmulticlass SIMDBinaryIntNoI8x16<SDNode node, string name, bits<32> baseInst> { 691*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v8i16, "i16x8", node, name, !add(baseInst, 32)>; 692*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v4i32, "i32x4", node, name, !add(baseInst, 64)>; 693*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v2i64, "i64x2", node, name, !add(baseInst, 96)>; 694*5ffd83dbSDimitry Andric} 695*5ffd83dbSDimitry Andric 6960b57cec5SDimitry Andricmulticlass SIMDBinaryIntSmall<SDNode node, string name, bits<32> baseInst> { 6970b57cec5SDimitry Andric defm "" : SIMDBinary<v16i8, "i8x16", node, name, baseInst>; 698*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v8i16, "i16x8", node, name, !add(baseInst, 32)>; 6990b57cec5SDimitry Andric} 7000b57cec5SDimitry Andric 7010b57cec5SDimitry Andricmulticlass SIMDBinaryIntNoI64x2<SDNode node, string name, bits<32> baseInst> { 7020b57cec5SDimitry Andric defm "" : SIMDBinaryIntSmall<node, name, baseInst>; 703*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v4i32, "i32x4", node, name, !add(baseInst, 64)>; 7040b57cec5SDimitry Andric} 7050b57cec5SDimitry Andric 7060b57cec5SDimitry Andricmulticlass SIMDBinaryInt<SDNode node, string name, bits<32> baseInst> { 7070b57cec5SDimitry Andric defm "" : SIMDBinaryIntNoI64x2<node, name, baseInst>; 708*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v2i64, "i64x2", node, name, !add(baseInst, 96)>; 7090b57cec5SDimitry Andric} 7100b57cec5SDimitry Andric 7110b57cec5SDimitry Andric// Integer addition: add / add_saturate_s / add_saturate_u 7120b57cec5SDimitry Andriclet isCommutable = 1 in { 713*5ffd83dbSDimitry Andricdefm ADD : SIMDBinaryInt<add, "add", 110>; 714*5ffd83dbSDimitry Andricdefm ADD_SAT_S : SIMDBinaryIntSmall<saddsat, "add_saturate_s", 111>; 715*5ffd83dbSDimitry Andricdefm ADD_SAT_U : SIMDBinaryIntSmall<uaddsat, "add_saturate_u", 112>; 7160b57cec5SDimitry Andric} // isCommutable = 1 7170b57cec5SDimitry Andric 7180b57cec5SDimitry Andric// Integer subtraction: sub / sub_saturate_s / sub_saturate_u 719*5ffd83dbSDimitry Andricdefm SUB : SIMDBinaryInt<sub, "sub", 113>; 7200b57cec5SDimitry Andricdefm SUB_SAT_S : 721*5ffd83dbSDimitry Andric SIMDBinaryIntSmall<int_wasm_sub_saturate_signed, "sub_saturate_s", 114>; 7220b57cec5SDimitry Andricdefm SUB_SAT_U : 723*5ffd83dbSDimitry Andric SIMDBinaryIntSmall<int_wasm_sub_saturate_unsigned, "sub_saturate_u", 115>; 7240b57cec5SDimitry Andric 7250b57cec5SDimitry Andric// Integer multiplication: mul 726480093f4SDimitry Andriclet isCommutable = 1 in 727*5ffd83dbSDimitry Andricdefm MUL : SIMDBinaryIntNoI8x16<mul, "mul", 117>; 7280b57cec5SDimitry Andric 729480093f4SDimitry Andric// Integer min_s / min_u / max_s / max_u 730480093f4SDimitry Andriclet isCommutable = 1 in { 731*5ffd83dbSDimitry Andricdefm MIN_S : SIMDBinaryIntNoI64x2<smin, "min_s", 118>; 732*5ffd83dbSDimitry Andricdefm MIN_U : SIMDBinaryIntNoI64x2<umin, "min_u", 119>; 733*5ffd83dbSDimitry Andricdefm MAX_S : SIMDBinaryIntNoI64x2<smax, "max_s", 120>; 734*5ffd83dbSDimitry Andricdefm MAX_U : SIMDBinaryIntNoI64x2<umax, "max_u", 121>; 735480093f4SDimitry Andric} // isCommutable = 1 736480093f4SDimitry Andric 737480093f4SDimitry Andric// Integer unsigned rounding average: avgr_u 738*5ffd83dbSDimitry Andriclet isCommutable = 1 in { 739*5ffd83dbSDimitry Andricdefm AVGR_U : SIMDBinary<v16i8, "i8x16", int_wasm_avgr_unsigned, "avgr_u", 123>; 740*5ffd83dbSDimitry Andricdefm AVGR_U : SIMDBinary<v8i16, "i16x8", int_wasm_avgr_unsigned, "avgr_u", 155>; 741480093f4SDimitry Andric} 742480093f4SDimitry Andric 743480093f4SDimitry Andricdef add_nuw : PatFrag<(ops node:$lhs, node:$rhs), 744480093f4SDimitry Andric (add node:$lhs, node:$rhs), 745480093f4SDimitry Andric "return N->getFlags().hasNoUnsignedWrap();">; 746480093f4SDimitry Andric 747480093f4SDimitry Andricforeach nodes = [[v16i8, splat16], [v8i16, splat8]] in 748*5ffd83dbSDimitry Andricdef : Pat<(wasm_shr_u 749480093f4SDimitry Andric (add_nuw 750480093f4SDimitry Andric (add_nuw (nodes[0] V128:$lhs), (nodes[0] V128:$rhs)), 751480093f4SDimitry Andric (nodes[1] (i32 1)) 752480093f4SDimitry Andric ), 753*5ffd83dbSDimitry Andric (i32 1) 754480093f4SDimitry Andric ), 755480093f4SDimitry Andric (!cast<NI>("AVGR_U_"#nodes[0]) V128:$lhs, V128:$rhs)>; 756480093f4SDimitry Andric 757480093f4SDimitry Andric// Widening dot product: i32x4.dot_i16x8_s 758480093f4SDimitry Andriclet isCommutable = 1 in 759480093f4SDimitry Andricdefm DOT : SIMD_I<(outs V128:$dst), (ins V128:$lhs, V128:$rhs), (outs), (ins), 760480093f4SDimitry Andric [(set V128:$dst, (int_wasm_dot V128:$lhs, V128:$rhs))], 761480093f4SDimitry Andric "i32x4.dot_i16x8_s\t$dst, $lhs, $rhs", "i32x4.dot_i16x8_s", 762*5ffd83dbSDimitry Andric 180>; 763480093f4SDimitry Andric 7640b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7650b57cec5SDimitry Andric// Floating-point unary arithmetic 7660b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7670b57cec5SDimitry Andric 7680b57cec5SDimitry Andricmulticlass SIMDUnaryFP<SDNode node, string name, bits<32> baseInst> { 7690b57cec5SDimitry Andric defm "" : SIMDUnary<v4f32, "f32x4", node, name, baseInst>; 770*5ffd83dbSDimitry Andric defm "" : SIMDUnary<v2f64, "f64x2", node, name, !add(baseInst, 12)>; 7710b57cec5SDimitry Andric} 7720b57cec5SDimitry Andric 7730b57cec5SDimitry Andric// Absolute value: abs 774*5ffd83dbSDimitry Andricdefm ABS : SIMDUnaryFP<fabs, "abs", 224>; 7750b57cec5SDimitry Andric 7760b57cec5SDimitry Andric// Negation: neg 777*5ffd83dbSDimitry Andricdefm NEG : SIMDUnaryFP<fneg, "neg", 225>; 7780b57cec5SDimitry Andric 7790b57cec5SDimitry Andric// Square root: sqrt 780*5ffd83dbSDimitry Andricdefm SQRT : SIMDUnaryFP<fsqrt, "sqrt", 227>; 781*5ffd83dbSDimitry Andric 782*5ffd83dbSDimitry Andric// Rounding: ceil, floor, trunc, nearest 783*5ffd83dbSDimitry Andricdefm CEIL : SIMDUnary<v4f32, "f32x4", int_wasm_ceil, "ceil", 216>; 784*5ffd83dbSDimitry Andricdefm FLOOR : SIMDUnary<v4f32, "f32x4", int_wasm_floor, "floor", 217>; 785*5ffd83dbSDimitry Andricdefm TRUNC: SIMDUnary<v4f32, "f32x4", int_wasm_trunc, "trunc", 218>; 786*5ffd83dbSDimitry Andricdefm NEAREST: SIMDUnary<v4f32, "f32x4", int_wasm_nearest, "nearest", 219>; 787*5ffd83dbSDimitry Andricdefm CEIL : SIMDUnary<v2f64, "f64x2", int_wasm_ceil, "ceil", 220>; 788*5ffd83dbSDimitry Andricdefm FLOOR : SIMDUnary<v2f64, "f64x2", int_wasm_floor, "floor", 221>; 789*5ffd83dbSDimitry Andricdefm TRUNC: SIMDUnary<v2f64, "f64x2", int_wasm_trunc, "trunc", 222>; 790*5ffd83dbSDimitry Andricdefm NEAREST: SIMDUnary<v2f64, "f64x2", int_wasm_nearest, "nearest", 223>; 7910b57cec5SDimitry Andric 7920b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7930b57cec5SDimitry Andric// Floating-point binary arithmetic 7940b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7950b57cec5SDimitry Andric 7960b57cec5SDimitry Andricmulticlass SIMDBinaryFP<SDNode node, string name, bits<32> baseInst> { 7970b57cec5SDimitry Andric defm "" : SIMDBinary<v4f32, "f32x4", node, name, baseInst>; 798*5ffd83dbSDimitry Andric defm "" : SIMDBinary<v2f64, "f64x2", node, name, !add(baseInst, 12)>; 7990b57cec5SDimitry Andric} 8000b57cec5SDimitry Andric 8010b57cec5SDimitry Andric// Addition: add 8020b57cec5SDimitry Andriclet isCommutable = 1 in 803*5ffd83dbSDimitry Andricdefm ADD : SIMDBinaryFP<fadd, "add", 228>; 8040b57cec5SDimitry Andric 8050b57cec5SDimitry Andric// Subtraction: sub 806*5ffd83dbSDimitry Andricdefm SUB : SIMDBinaryFP<fsub, "sub", 229>; 8070b57cec5SDimitry Andric 8080b57cec5SDimitry Andric// Multiplication: mul 8090b57cec5SDimitry Andriclet isCommutable = 1 in 810*5ffd83dbSDimitry Andricdefm MUL : SIMDBinaryFP<fmul, "mul", 230>; 8110b57cec5SDimitry Andric 8120b57cec5SDimitry Andric// Division: div 813*5ffd83dbSDimitry Andricdefm DIV : SIMDBinaryFP<fdiv, "div", 231>; 8140b57cec5SDimitry Andric 8150b57cec5SDimitry Andric// NaN-propagating minimum: min 816*5ffd83dbSDimitry Andricdefm MIN : SIMDBinaryFP<fminimum, "min", 232>; 8170b57cec5SDimitry Andric 8180b57cec5SDimitry Andric// NaN-propagating maximum: max 819*5ffd83dbSDimitry Andricdefm MAX : SIMDBinaryFP<fmaximum, "max", 233>; 820*5ffd83dbSDimitry Andric 821*5ffd83dbSDimitry Andric// Pseudo-minimum: pmin 822*5ffd83dbSDimitry Andricdefm PMIN : SIMDBinaryFP<int_wasm_pmin, "pmin", 234>; 823*5ffd83dbSDimitry Andric 824*5ffd83dbSDimitry Andric// Pseudo-maximum: pmax 825*5ffd83dbSDimitry Andricdefm PMAX : SIMDBinaryFP<int_wasm_pmax, "pmax", 235>; 8260b57cec5SDimitry Andric 8270b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 8280b57cec5SDimitry Andric// Conversions 8290b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 8300b57cec5SDimitry Andric 8310b57cec5SDimitry Andricmulticlass SIMDConvert<ValueType vec_t, ValueType arg_t, SDNode op, 8320b57cec5SDimitry Andric string name, bits<32> simdop> { 8330b57cec5SDimitry Andric defm op#_#vec_t#_#arg_t : 8340b57cec5SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$vec), (outs), (ins), 8350b57cec5SDimitry Andric [(set (vec_t V128:$dst), (vec_t (op (arg_t V128:$vec))))], 8360b57cec5SDimitry Andric name#"\t$dst, $vec", name, simdop>; 8370b57cec5SDimitry Andric} 8380b57cec5SDimitry Andric 8390b57cec5SDimitry Andric// Floating point to integer with saturation: trunc_sat 840*5ffd83dbSDimitry Andricdefm "" : SIMDConvert<v4i32, v4f32, fp_to_sint, "i32x4.trunc_sat_f32x4_s", 248>; 841*5ffd83dbSDimitry Andricdefm "" : SIMDConvert<v4i32, v4f32, fp_to_uint, "i32x4.trunc_sat_f32x4_u", 249>; 842*5ffd83dbSDimitry Andric 843*5ffd83dbSDimitry Andric// Integer to floating point: convert 844*5ffd83dbSDimitry Andricdefm "" : SIMDConvert<v4f32, v4i32, sint_to_fp, "f32x4.convert_i32x4_s", 250>; 845*5ffd83dbSDimitry Andricdefm "" : SIMDConvert<v4f32, v4i32, uint_to_fp, "f32x4.convert_i32x4_u", 251>; 8460b57cec5SDimitry Andric 8478bcb0991SDimitry Andric// Widening operations 8488bcb0991SDimitry Andricmulticlass SIMDWiden<ValueType vec_t, string vec, ValueType arg_t, string arg, 8498bcb0991SDimitry Andric bits<32> baseInst> { 8508bcb0991SDimitry Andric defm "" : SIMDConvert<vec_t, arg_t, int_wasm_widen_low_signed, 8518bcb0991SDimitry Andric vec#".widen_low_"#arg#"_s", baseInst>; 8528bcb0991SDimitry Andric defm "" : SIMDConvert<vec_t, arg_t, int_wasm_widen_high_signed, 8538bcb0991SDimitry Andric vec#".widen_high_"#arg#"_s", !add(baseInst, 1)>; 8548bcb0991SDimitry Andric defm "" : SIMDConvert<vec_t, arg_t, int_wasm_widen_low_unsigned, 8558bcb0991SDimitry Andric vec#".widen_low_"#arg#"_u", !add(baseInst, 2)>; 8568bcb0991SDimitry Andric defm "" : SIMDConvert<vec_t, arg_t, int_wasm_widen_high_unsigned, 8578bcb0991SDimitry Andric vec#".widen_high_"#arg#"_u", !add(baseInst, 3)>; 8588bcb0991SDimitry Andric} 8598bcb0991SDimitry Andric 860*5ffd83dbSDimitry Andricdefm "" : SIMDWiden<v8i16, "i16x8", v16i8, "i8x16", 135>; 861*5ffd83dbSDimitry Andricdefm "" : SIMDWiden<v4i32, "i32x4", v8i16, "i16x8", 167>; 8628bcb0991SDimitry Andric 8638bcb0991SDimitry Andric// Narrowing operations 8648bcb0991SDimitry Andricmulticlass SIMDNarrow<ValueType vec_t, string vec, ValueType arg_t, string arg, 8658bcb0991SDimitry Andric bits<32> baseInst> { 8668bcb0991SDimitry Andric defm NARROW_S_#vec_t : 8678bcb0991SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$low, V128:$high), (outs), (ins), 8688bcb0991SDimitry Andric [(set (vec_t V128:$dst), (vec_t (int_wasm_narrow_signed 8698bcb0991SDimitry Andric (arg_t V128:$low), (arg_t V128:$high))))], 8708bcb0991SDimitry Andric vec#".narrow_"#arg#"_s\t$dst, $low, $high", vec#".narrow_"#arg#"_s", 8718bcb0991SDimitry Andric baseInst>; 8728bcb0991SDimitry Andric defm NARROW_U_#vec_t : 8738bcb0991SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$low, V128:$high), (outs), (ins), 8748bcb0991SDimitry Andric [(set (vec_t V128:$dst), (vec_t (int_wasm_narrow_unsigned 8758bcb0991SDimitry Andric (arg_t V128:$low), (arg_t V128:$high))))], 8768bcb0991SDimitry Andric vec#".narrow_"#arg#"_u\t$dst, $low, $high", vec#".narrow_"#arg#"_u", 8778bcb0991SDimitry Andric !add(baseInst, 1)>; 8788bcb0991SDimitry Andric} 8798bcb0991SDimitry Andric 880*5ffd83dbSDimitry Andricdefm "" : SIMDNarrow<v16i8, "i8x16", v8i16, "i16x8", 101>; 881*5ffd83dbSDimitry Andricdefm "" : SIMDNarrow<v8i16, "i16x8", v4i32, "i32x4", 133>; 8828bcb0991SDimitry Andric 8830b57cec5SDimitry Andric// Lower llvm.wasm.trunc.saturate.* to saturating instructions 8840b57cec5SDimitry Andricdef : Pat<(v4i32 (int_wasm_trunc_saturate_signed (v4f32 V128:$src))), 8850b57cec5SDimitry Andric (fp_to_sint_v4i32_v4f32 (v4f32 V128:$src))>; 8860b57cec5SDimitry Andricdef : Pat<(v4i32 (int_wasm_trunc_saturate_unsigned (v4f32 V128:$src))), 8870b57cec5SDimitry Andric (fp_to_uint_v4i32_v4f32 (v4f32 V128:$src))>; 8880b57cec5SDimitry Andric 8890b57cec5SDimitry Andric// Bitcasts are nops 8900b57cec5SDimitry Andric// Matching bitcast t1 to t1 causes strange errors, so avoid repeating types 8910b57cec5SDimitry Andricforeach t1 = [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64] in 8920b57cec5SDimitry Andricforeach t2 = !foldl( 8930b57cec5SDimitry Andric []<ValueType>, [v16i8, v8i16, v4i32, v2i64, v4f32, v2f64], 8940b57cec5SDimitry Andric acc, cur, !if(!eq(!cast<string>(t1), !cast<string>(cur)), 8950b57cec5SDimitry Andric acc, !listconcat(acc, [cur]) 8960b57cec5SDimitry Andric ) 8970b57cec5SDimitry Andric) in 8980b57cec5SDimitry Andricdef : Pat<(t1 (bitconvert (t2 V128:$v))), (t1 V128:$v)>; 8998bcb0991SDimitry Andric 9008bcb0991SDimitry Andric//===----------------------------------------------------------------------===// 9018bcb0991SDimitry Andric// Quasi-Fused Multiply- Add and Subtract (QFMA/QFMS) 9028bcb0991SDimitry Andric//===----------------------------------------------------------------------===// 9038bcb0991SDimitry Andric 9048bcb0991SDimitry Andricmulticlass SIMDQFM<ValueType vec_t, string vec, bits<32> baseInst> { 9058bcb0991SDimitry Andric defm QFMA_#vec_t : 9068bcb0991SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$a, V128:$b, V128:$c), 9078bcb0991SDimitry Andric (outs), (ins), 9088bcb0991SDimitry Andric [(set (vec_t V128:$dst), 9098bcb0991SDimitry Andric (int_wasm_qfma (vec_t V128:$a), (vec_t V128:$b), (vec_t V128:$c)))], 9108bcb0991SDimitry Andric vec#".qfma\t$dst, $a, $b, $c", vec#".qfma", baseInst>; 9118bcb0991SDimitry Andric defm QFMS_#vec_t : 9128bcb0991SDimitry Andric SIMD_I<(outs V128:$dst), (ins V128:$a, V128:$b, V128:$c), 9138bcb0991SDimitry Andric (outs), (ins), 9148bcb0991SDimitry Andric [(set (vec_t V128:$dst), 9158bcb0991SDimitry Andric (int_wasm_qfms (vec_t V128:$a), (vec_t V128:$b), (vec_t V128:$c)))], 9168bcb0991SDimitry Andric vec#".qfms\t$dst, $a, $b, $c", vec#".qfms", !add(baseInst, 1)>; 9178bcb0991SDimitry Andric} 9188bcb0991SDimitry Andric 919*5ffd83dbSDimitry Andricdefm "" : SIMDQFM<v4f32, "f32x4", 252>; 920*5ffd83dbSDimitry Andricdefm "" : SIMDQFM<v2f64, "f64x2", 254>; 921