|  | ; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=+simd128,+relaxed-simd | FileCheck %s --check-prefixes=CHECK,SLOW | 
|  | ; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=+simd128,+relaxed-simd -fast-isel | FileCheck %s | 
|  |  | 
|  | ; Test that SIMD128 intrinsics lower as expected. These intrinsics are | 
|  | ; only expected to lower successfully if the simd128 attribute is | 
|  | ; enabled and legal types are used. | 
|  |  | 
|  | target triple = "wasm32-unknown-unknown" | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 16 x i8 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: swizzle_v16i8: | 
|  | ; CHECK-NEXT: .functype swizzle_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.swizzle $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.swizzle(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @swizzle_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.wasm.swizzle(<16 x i8> %x, <16 x i8> %y) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: add_sat_s_v16i8: | 
|  | ; CHECK-NEXT: .functype add_sat_s_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.add_sat_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.sadd.sat.v16i8(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @add_sat_s_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.sadd.sat.v16i8(<16 x i8> %x, <16 x i8> %y) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: add_sat_u_v16i8: | 
|  | ; CHECK-NEXT: .functype add_sat_u_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.add_sat_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.uadd.sat.v16i8(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @add_sat_u_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.uadd.sat.v16i8(<16 x i8> %x, <16 x i8> %y) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: sub_sat_s_v16i8: | 
|  | ; CHECK-NEXT: .functype sub_sat_s_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.sub_sat_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.sub.sat.signed.v16i8(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @sub_sat_s_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.wasm.sub.sat.signed.v16i8( | 
|  | <16 x i8> %x, <16 x i8> %y | 
|  | ) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: sub_sat_u_v16i8: | 
|  | ; CHECK-NEXT: .functype sub_sat_u_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.sub_sat_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.sub.sat.unsigned.v16i8(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @sub_sat_u_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.wasm.sub.sat.unsigned.v16i8( | 
|  | <16 x i8> %x, <16 x i8> %y | 
|  | ) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: avgr_u_v16i8: | 
|  | ; CHECK-NEXT: .functype avgr_u_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.avgr_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.avgr.unsigned.v16i8(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @avgr_u_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.wasm.avgr.unsigned.v16i8(<16 x i8> %x, <16 x i8> %y) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: popcnt_v16i8: | 
|  | ; CHECK-NEXT: .functype popcnt_v16i8 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.popcnt $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.ctpop.v16i8(<16 x i8>) | 
|  | define <16 x i8> @popcnt_v16i8(<16 x i8> %x) { | 
|  | %a = call <16 x i8> @llvm.ctpop.v16i8(<16 x i8> %x) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: any_v16i8: | 
|  | ; CHECK-NEXT: .functype any_v16i8 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: v128.any_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.anytrue.v16i8(<16 x i8>) | 
|  | define i32 @any_v16i8(<16 x i8> %x) { | 
|  | %a = call i32 @llvm.wasm.anytrue.v16i8(<16 x i8> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: all_v16i8: | 
|  | ; CHECK-NEXT: .functype all_v16i8 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i8x16.all_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.alltrue.v16i8(<16 x i8>) | 
|  | define i32 @all_v16i8(<16 x i8> %x) { | 
|  | %a = call i32 @llvm.wasm.alltrue.v16i8(<16 x i8> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitmask_v16i8: | 
|  | ; CHECK-NEXT: .functype bitmask_v16i8 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i8x16.bitmask $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.bitmask.v16i8(<16 x i8>) | 
|  | define i32 @bitmask_v16i8(<16 x i8> %x) { | 
|  | %a = call i32 @llvm.wasm.bitmask.v16i8(<16 x i8> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitselect_v16i8: | 
|  | ; CHECK-NEXT: .functype bitselect_v16i8 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.bitselect.v16i8(<16 x i8>, <16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @bitselect_v16i8(<16 x i8> %v1, <16 x i8> %v2, <16 x i8> %c) { | 
|  | %a = call <16 x i8> @llvm.wasm.bitselect.v16i8( | 
|  | <16 x i8> %v1, <16 x i8> %v2, <16 x i8> %c | 
|  | ) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: narrow_signed_v16i8: | 
|  | ; CHECK-NEXT: .functype narrow_signed_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.narrow_i16x8_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.narrow.signed.v16i8.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <16 x i8> @narrow_signed_v16i8(<8 x i16> %low, <8 x i16> %high) { | 
|  | %a = call <16 x i8> @llvm.wasm.narrow.signed.v16i8.v8i16( | 
|  | <8 x i16> %low, <8 x i16> %high | 
|  | ) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: narrow_unsigned_v16i8: | 
|  | ; CHECK-NEXT: .functype narrow_unsigned_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.narrow_i16x8_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.narrow.unsigned.v16i8.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <16 x i8> @narrow_unsigned_v16i8(<8 x i16> %low, <8 x i16> %high) { | 
|  | %a = call <16 x i8> @llvm.wasm.narrow.unsigned.v16i8.v8i16( | 
|  | <8 x i16> %low, <8 x i16> %high | 
|  | ) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: shuffle_v16i8: | 
|  | ; NO-CHECK-NOT: i8x16 | 
|  | ; CHECK-NEXT: .functype shuffle_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.shuffle $push[[R:[0-9]+]]=, $0, $1, | 
|  | ; CHECK-SAME: 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.shuffle( | 
|  | <16 x i8>, <16 x i8>, i32 immarg, i32 immarg, i32 immarg, i32 immarg, | 
|  | i32 immarg, i32 immarg, i32 immarg, i32 immarg, i32 immarg, i32 immarg, | 
|  | i32 immarg, i32 immarg, i32 immarg, i32 immarg, i32 immarg, i32 immarg) | 
|  | define <16 x i8> @shuffle_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %res = call <16 x i8> @llvm.wasm.shuffle(<16 x i8> %x, <16 x i8> %y, | 
|  | i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, | 
|  | i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 35) | 
|  | ret <16 x i8> %res | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: laneselect_v16i8: | 
|  | ; CHECK-NEXT: .functype laneselect_v16i8 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.relaxed_laneselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.relaxed.laneselect.v16i8(<16 x i8>, <16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @laneselect_v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c) { | 
|  | %v = call <16 x i8> @llvm.wasm.relaxed.laneselect.v16i8( | 
|  | <16 x i8> %a, <16 x i8> %b, <16 x i8> %c | 
|  | ) | 
|  | ret <16 x i8> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_swizzle_v16i8: | 
|  | ; CHECK-NEXT: .functype relaxed_swizzle_v16i8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i8x16.relaxed_swizzle $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <16 x i8> @llvm.wasm.relaxed.swizzle(<16 x i8>, <16 x i8>) | 
|  | define <16 x i8> @relaxed_swizzle_v16i8(<16 x i8> %x, <16 x i8> %y) { | 
|  | %a = call <16 x i8> @llvm.wasm.relaxed.swizzle(<16 x i8> %x, <16 x i8> %y) | 
|  | ret <16 x i8> %a | 
|  | } | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 8 x i16 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: add_sat_s_v8i16: | 
|  | ; CHECK-NEXT: .functype add_sat_s_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.add_sat_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.sadd.sat.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @add_sat_s_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.sadd.sat.v8i16(<8 x i16> %x, <8 x i16> %y) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: add_sat_u_v8i16: | 
|  | ; CHECK-NEXT: .functype add_sat_u_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.add_sat_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.uadd.sat.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @add_sat_u_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.uadd.sat.v8i16(<8 x i16> %x, <8 x i16> %y) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: sub_sat_s_v8i16: | 
|  | ; CHECK-NEXT: .functype sub_sat_s_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.sub_sat_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.sub.sat.signed.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @sub_sat_s_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.wasm.sub.sat.signed.v8i16( | 
|  | <8 x i16> %x, <8 x i16> %y | 
|  | ) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: sub_sat_u_v8i16: | 
|  | ; CHECK-NEXT: .functype sub_sat_u_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.sub_sat_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.sub.sat.unsigned.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @sub_sat_u_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.wasm.sub.sat.unsigned.v8i16( | 
|  | <8 x i16> %x, <8 x i16> %y | 
|  | ) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: avgr_u_v8i16: | 
|  | ; CHECK-NEXT: .functype avgr_u_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.avgr_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.avgr.unsigned.v8i16(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @avgr_u_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.wasm.avgr.unsigned.v8i16(<8 x i16> %x, <8 x i16> %y) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: q15mulr_sat_s_v8i16: | 
|  | ; CHECK-NEXT: .functype q15mulr_sat_s_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.q15mulr_sat_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.q15mulr.sat.signed(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @q15mulr_sat_s_v8i16(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <8 x i16> @llvm.wasm.q15mulr.sat.signed(<8 x i16> %x, | 
|  | <8 x i16> %y) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: extadd_pairwise_s_v8i16: | 
|  | ; CHECK-NEXT: .functype extadd_pairwise_s_v8i16 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.extadd_pairwise_i8x16_s $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.extadd.pairwise.signed.v8i16(<16 x i8>) | 
|  | define <8 x i16> @extadd_pairwise_s_v8i16(<16 x i8> %x) { | 
|  | %a = call <8 x i16> @llvm.wasm.extadd.pairwise.signed.v8i16(<16 x i8> %x) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: extadd_pairwise_u_v8i16: | 
|  | ; CHECK-NEXT: .functype extadd_pairwise_u_v8i16 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.extadd_pairwise_i8x16_u $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.extadd.pairwise.unsigned.v8i16(<16 x i8>) | 
|  | define <8 x i16> @extadd_pairwise_u_v8i16(<16 x i8> %x) { | 
|  | %a = call <8 x i16> @llvm.wasm.extadd.pairwise.unsigned.v8i16(<16 x i8> %x) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: any_v8i16: | 
|  | ; CHECK-NEXT: .functype any_v8i16 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: v128.any_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.anytrue.v8i16(<8 x i16>) | 
|  | define i32 @any_v8i16(<8 x i16> %x) { | 
|  | %a = call i32 @llvm.wasm.anytrue.v8i16(<8 x i16> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: all_v8i16: | 
|  | ; CHECK-NEXT: .functype all_v8i16 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i16x8.all_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.alltrue.v8i16(<8 x i16>) | 
|  | define i32 @all_v8i16(<8 x i16> %x) { | 
|  | %a = call i32 @llvm.wasm.alltrue.v8i16(<8 x i16> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitmask_v8i16: | 
|  | ; CHECK-NEXT: .functype bitmask_v8i16 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i16x8.bitmask $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.bitmask.v8i16(<8 x i16>) | 
|  | define i32 @bitmask_v8i16(<8 x i16> %x) { | 
|  | %a = call i32 @llvm.wasm.bitmask.v8i16(<8 x i16> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitselect_v8i16: | 
|  | ; CHECK-NEXT: .functype bitselect_v8i16 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.bitselect.v8i16(<8 x i16>, <8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @bitselect_v8i16(<8 x i16> %v1, <8 x i16> %v2, <8 x i16> %c) { | 
|  | %a = call <8 x i16> @llvm.wasm.bitselect.v8i16( | 
|  | <8 x i16> %v1, <8 x i16> %v2, <8 x i16> %c | 
|  | ) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: narrow_signed_v8i16: | 
|  | ; CHECK-NEXT: .functype narrow_signed_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.narrow_i32x4_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.narrow.signed.v8i16.v4i32(<4 x i32>, <4 x i32>) | 
|  | define <8 x i16> @narrow_signed_v8i16(<4 x i32> %low, <4 x i32> %high) { | 
|  | %a = call <8 x i16> @llvm.wasm.narrow.signed.v8i16.v4i32( | 
|  | <4 x i32> %low, <4 x i32> %high | 
|  | ) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: narrow_unsigned_v8i16: | 
|  | ; CHECK-NEXT: .functype narrow_unsigned_v8i16 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.narrow_i32x4_u $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.narrow.unsigned.v8i16.v4i32(<4 x i32>, <4 x i32>) | 
|  | define <8 x i16> @narrow_unsigned_v8i16(<4 x i32> %low, <4 x i32> %high) { | 
|  | %a = call <8 x i16> @llvm.wasm.narrow.unsigned.v8i16.v4i32( | 
|  | <4 x i32> %low, <4 x i32> %high | 
|  | ) | 
|  | ret <8 x i16> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: laneselect_v8i16: | 
|  | ; CHECK-NEXT: .functype laneselect_v8i16 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.relaxed_laneselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.relaxed.laneselect.v8i16(<8 x i16>, <8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @laneselect_v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c) { | 
|  | %v = call <8 x i16> @llvm.wasm.relaxed.laneselect.v8i16( | 
|  | <8 x i16> %a, <8 x i16> %b, <8 x i16> %c | 
|  | ) | 
|  | ret <8 x i16> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_q15mulr_s_i16x8: | 
|  | ; CHECK-NEXT: .functype relaxed_q15mulr_s_i16x8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.relaxed_q15mulr_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.relaxed.q15mulr.signed(<8 x i16>, <8 x i16>) | 
|  | define <8 x i16> @relaxed_q15mulr_s_i16x8(<8 x i16> %a, <8 x i16> %b) { | 
|  | %v = call <8 x i16> @llvm.wasm.relaxed.q15mulr.signed( | 
|  | <8 x i16> %a, <8 x i16> %b | 
|  | ) | 
|  | ret <8 x i16> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: dot_i8x16_i7x16_s_i16x8: | 
|  | ; CHECK-NEXT: .functype dot_i8x16_i7x16_s_i16x8 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i16x8.relaxed_dot_i8x16_i7x16_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <8 x i16> @llvm.wasm.relaxed.dot.i8x16.i7x16.signed(<16 x i8>, <16 x i8>) | 
|  | define <8 x i16> @dot_i8x16_i7x16_s_i16x8(<16 x i8> %a, <16 x i8> %b) { | 
|  | %v = call <8 x i16> @llvm.wasm.relaxed.dot.i8x16.i7x16.signed( | 
|  | <16 x i8> %a, <16 x i8> %b | 
|  | ) | 
|  | ret <8 x i16> %v | 
|  | } | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 4 x i32 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: dot: | 
|  | ; CHECK-NEXT: .functype dot (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.dot_i16x8_s $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.dot(<8 x i16>, <8 x i16>) | 
|  | define <4 x i32> @dot(<8 x i16> %x, <8 x i16> %y) { | 
|  | %a = call <4 x i32> @llvm.wasm.dot(<8 x i16> %x, <8 x i16> %y) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: extadd_pairwise_s_v4i32: | 
|  | ; CHECK-NEXT: .functype extadd_pairwise_s_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.extadd_pairwise_i16x8_s $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.extadd.pairwise.signed.v4i32(<8 x i16>) | 
|  | define <4 x i32> @extadd_pairwise_s_v4i32(<8 x i16> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.extadd.pairwise.signed.v4i32(<8 x i16> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: extadd_pairwise_u_v4i32: | 
|  | ; CHECK-NEXT: .functype extadd_pairwise_u_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.extadd_pairwise_i16x8_u $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.extadd.pairwise.unsigned.v4i32(<8 x i16>) | 
|  | define <4 x i32> @extadd_pairwise_u_v4i32(<8 x i16> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.extadd.pairwise.unsigned.v4i32(<8 x i16> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  |  | 
|  | ; CHECK-LABEL: any_v4i32: | 
|  | ; CHECK-NEXT: .functype any_v4i32 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: v128.any_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.anytrue.v4i32(<4 x i32>) | 
|  | define i32 @any_v4i32(<4 x i32> %x) { | 
|  | %a = call i32 @llvm.wasm.anytrue.v4i32(<4 x i32> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: all_v4i32: | 
|  | ; CHECK-NEXT: .functype all_v4i32 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i32x4.all_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.alltrue.v4i32(<4 x i32>) | 
|  | define i32 @all_v4i32(<4 x i32> %x) { | 
|  | %a = call i32 @llvm.wasm.alltrue.v4i32(<4 x i32> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitmask_v4i32: | 
|  | ; CHECK-NEXT: .functype bitmask_v4i32 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i32x4.bitmask $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.bitmask.v4i32(<4 x i32>) | 
|  | define i32 @bitmask_v4i32(<4 x i32> %x) { | 
|  | %a = call i32 @llvm.wasm.bitmask.v4i32(<4 x i32> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitselect_v4i32: | 
|  | ; CHECK-NEXT: .functype bitselect_v4i32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.bitselect.v4i32(<4 x i32>, <4 x i32>, <4 x i32>) | 
|  | define <4 x i32> @bitselect_v4i32(<4 x i32> %v1, <4 x i32> %v2, <4 x i32> %c) { | 
|  | %a = call <4 x i32> @llvm.wasm.bitselect.v4i32( | 
|  | <4 x i32> %v1, <4 x i32> %v2, <4 x i32> %c | 
|  | ) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_s_v4i32: | 
|  | ; NO-CHECK-NOT: f32x4 | 
|  | ; CHECK-NEXT: .functype trunc_sat_s_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.trunc_sat_f32x4_s $push[[R:[0-9]+]]=, $0 | 
|  | ; CHECK-NEXT: return $pop[[R]] | 
|  | declare <4 x i32> @llvm.fptosi.sat.v4i32.v4f32(<4 x float>) | 
|  | define <4 x i32> @trunc_sat_s_v4i32(<4 x float> %x) { | 
|  | %a = call <4 x i32> @llvm.fptosi.sat.v4i32.v4f32(<4 x float> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_u_v4i32: | 
|  | ; NO-CHECK-NOT: f32x4 | 
|  | ; CHECK-NEXT: .functype trunc_sat_u_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.trunc_sat_f32x4_u $push[[R:[0-9]+]]=, $0 | 
|  | ; CHECK-NEXT: return $pop[[R]] | 
|  | declare <4 x i32> @llvm.fptoui.sat.v4i32.v4f32(<4 x float>) | 
|  | define <4 x i32> @trunc_sat_u_v4i32(<4 x float> %x) { | 
|  | %a = call <4 x i32> @llvm.fptoui.sat.v4i32.v4f32(<4 x float> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_s_zero_v4i32: | 
|  | ; CHECK-NEXT: .functype trunc_sat_s_zero_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.trunc_sat_f64x2_s_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x i32> @llvm.fptosi.sat.v2i32.v2f64(<2 x double>) | 
|  | define <4 x i32> @trunc_sat_s_zero_v4i32(<2 x double> %x) { | 
|  | %v = call <2 x i32> @llvm.fptosi.sat.v2i32.v2f64(<2 x double> %x) | 
|  | %a = shufflevector <2 x i32> %v, <2 x i32> <i32 0, i32 0>, | 
|  | <4 x i32> <i32 0, i32 1, i32 2, i32 3> | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_s_zero_v4i32_2: | 
|  | ; CHECK-NEXT: .functype trunc_sat_s_zero_v4i32_2 (v128) -> (v128){{$}} | 
|  | ; SLOW-NEXT: i32x4.trunc_sat_f64x2_s_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; SLOW-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.fptosi.sat.v4i32.v4f64(<4 x double>) | 
|  | define <4 x i32> @trunc_sat_s_zero_v4i32_2(<2 x double> %x) { | 
|  | %v = shufflevector <2 x double> %x, <2 x double> zeroinitializer, | 
|  | <4 x i32> <i32 0, i32 1, i32 2, i32 3> | 
|  | %a = call <4 x i32> @llvm.fptosi.sat.v4i32.v4f64(<4 x double> %v) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_u_zero_v4i32: | 
|  | ; CHECK-NEXT: .functype trunc_sat_u_zero_v4i32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.trunc_sat_f64x2_u_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x i32> @llvm.fptoui.sat.v2i32.v2f64(<2 x double>) | 
|  | define <4 x i32> @trunc_sat_u_zero_v4i32(<2 x double> %x) { | 
|  | %v = call <2 x i32> @llvm.fptoui.sat.v2i32.v2f64(<2 x double> %x) | 
|  | %a = shufflevector <2 x i32> %v, <2 x i32> <i32 0, i32 0>, | 
|  | <4 x i32> <i32 0, i32 1, i32 2, i32 3> | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_sat_u_zero_v4i32_2: | 
|  | ; CHECK-NEXT: .functype trunc_sat_u_zero_v4i32_2 (v128) -> (v128){{$}} | 
|  | ; SLOW-NEXT: i32x4.trunc_sat_f64x2_u_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; SLOW-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.fptoui.sat.v4i32.v4f64(<4 x double>) | 
|  | define <4 x i32> @trunc_sat_u_zero_v4i32_2(<2 x double> %x) { | 
|  | %v = shufflevector <2 x double> %x, <2 x double> zeroinitializer, | 
|  | <4 x i32> <i32 0, i32 1, i32 2, i32 3> | 
|  | %a = call <4 x i32> @llvm.fptoui.sat.v4i32.v4f64(<4 x double> %v) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: laneselect_v4i32: | 
|  | ; CHECK-NEXT: .functype laneselect_v4i32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_laneselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.relaxed.laneselect.v4i32(<4 x i32>, <4 x i32>, <4 x i32>) | 
|  | define <4 x i32> @laneselect_v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c) { | 
|  | %v = call <4 x i32> @llvm.wasm.relaxed.laneselect.v4i32( | 
|  | <4 x i32> %a, <4 x i32> %b, <4 x i32> %c | 
|  | ) | 
|  | ret <4 x i32> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_trunc_s: | 
|  | ; NO-CHECK-NOT: f32x4 | 
|  | ; CHECK-NEXT: .functype relaxed_trunc_s (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_trunc_f32x4_s $push[[R:[0-9]+]]=, $0 | 
|  | ; CHECK-NEXT: return $pop[[R]] | 
|  | declare <4 x i32> @llvm.wasm.relaxed.trunc.signed(<4 x float>) | 
|  | define <4 x i32> @relaxed_trunc_s(<4 x float> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.relaxed.trunc.signed(<4 x float> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_trunc_u: | 
|  | ; NO-CHECK-NOT: f32x4 | 
|  | ; CHECK-NEXT: .functype relaxed_trunc_u (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_trunc_f32x4_u $push[[R:[0-9]+]]=, $0 | 
|  | ; CHECK-NEXT: return $pop[[R]] | 
|  | declare <4 x i32> @llvm.wasm.relaxed.trunc.unsigned(<4 x float>) | 
|  | define <4 x i32> @relaxed_trunc_u(<4 x float> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.relaxed.trunc.unsigned(<4 x float> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_trunc_s_zero: | 
|  | ; CHECK-NEXT: .functype relaxed_trunc_s_zero (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_trunc_f64x2_s_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.relaxed.trunc.signed.zero(<2 x double>) | 
|  | define <4 x i32> @relaxed_trunc_s_zero(<2 x double> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.relaxed.trunc.signed.zero(<2 x double> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_trunc_u_zero: | 
|  | ; CHECK-NEXT: .functype relaxed_trunc_u_zero (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_trunc_f64x2_u_zero $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.relaxed.trunc.unsigned.zero(<2 x double>) | 
|  | define <4 x i32> @relaxed_trunc_u_zero(<2 x double> %x) { | 
|  | %a = call <4 x i32> @llvm.wasm.relaxed.trunc.unsigned.zero(<2 x double> %x) | 
|  | ret <4 x i32> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: dot_i8x16_i7x16_add_s_i32x4: | 
|  | ; CHECK-NEXT: .functype dot_i8x16_i7x16_add_s_i32x4 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i32x4.relaxed_dot_i8x16_i7x16_add_s $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x i32> @llvm.wasm.relaxed.dot.i8x16.i7x16.add.signed( | 
|  | <16 x i8>, <16 x i8>, <4 x i32>) | 
|  | define <4 x i32> @dot_i8x16_i7x16_add_s_i32x4(<16 x i8> %a, <16 x i8> %b, | 
|  | <4 x i32> %c) { | 
|  | %v = call <4 x i32> @llvm.wasm.relaxed.dot.i8x16.i7x16.add.signed( | 
|  | <16 x i8> %a, <16 x i8> %b, <4 x i32> %c | 
|  | ) | 
|  | ret <4 x i32> %v | 
|  | } | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 2 x i64 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: any_v2i64: | 
|  | ; CHECK-NEXT: .functype any_v2i64 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: v128.any_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.anytrue.v2i64(<2 x i64>) | 
|  | define i32 @any_v2i64(<2 x i64> %x) { | 
|  | %a = call i32 @llvm.wasm.anytrue.v2i64(<2 x i64> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: all_v2i64: | 
|  | ; CHECK-NEXT: .functype all_v2i64 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i64x2.all_true $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.alltrue.v2i64(<2 x i64>) | 
|  | define i32 @all_v2i64(<2 x i64> %x) { | 
|  | %a = call i32 @llvm.wasm.alltrue.v2i64(<2 x i64> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitmask_v2i64: | 
|  | ; CHECK-NEXT: .functype bitmask_v2i64 (v128) -> (i32){{$}} | 
|  | ; CHECK-NEXT: i64x2.bitmask $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare i32 @llvm.wasm.bitmask.v2i64(<2 x i64>) | 
|  | define i32 @bitmask_v2i64(<2 x i64> %x) { | 
|  | %a = call i32 @llvm.wasm.bitmask.v2i64(<2 x i64> %x) | 
|  | ret i32 %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: bitselect_v2i64: | 
|  | ; CHECK-NEXT: .functype bitselect_v2i64 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x i64> @llvm.wasm.bitselect.v2i64(<2 x i64>, <2 x i64>, <2 x i64>) | 
|  | define <2 x i64> @bitselect_v2i64(<2 x i64> %v1, <2 x i64> %v2, <2 x i64> %c) { | 
|  | %a = call <2 x i64> @llvm.wasm.bitselect.v2i64( | 
|  | <2 x i64> %v1, <2 x i64> %v2, <2 x i64> %c | 
|  | ) | 
|  | ret <2 x i64> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: laneselect_v2i64: | 
|  | ; CHECK-NEXT: .functype laneselect_v2i64 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: i64x2.relaxed_laneselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x i64> @llvm.wasm.relaxed.laneselect.v2i64(<2 x i64>, <2 x i64>, <2 x i64>) | 
|  | define <2 x i64> @laneselect_v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> %c) { | 
|  | %v = call <2 x i64> @llvm.wasm.relaxed.laneselect.v2i64( | 
|  | <2 x i64> %a, <2 x i64> %b, <2 x i64> %c | 
|  | ) | 
|  | ret <2 x i64> %v | 
|  | } | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 4 x f32 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: bitselect_v4f32: | 
|  | ; CHECK-NEXT: .functype bitselect_v4f32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.bitselect.v4f32(<4 x float>, <4 x float>, <4 x float>) | 
|  | define <4 x float> @bitselect_v4f32(<4 x float> %v1, <4 x float> %v2, <4 x float> %c) { | 
|  | %a = call <4 x float> @llvm.wasm.bitselect.v4f32( | 
|  | <4 x float> %v1, <4 x float> %v2, <4 x float> %c | 
|  | ) | 
|  | ret <4 x float> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: pmin_v4f32: | 
|  | ; CHECK-NEXT: .functype pmin_v4f32 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.pmin $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.pmin.v4f32(<4 x float>, <4 x float>) | 
|  | define <4 x float> @pmin_v4f32(<4 x float> %a, <4 x float> %b) { | 
|  | %v = call <4 x float> @llvm.wasm.pmin.v4f32(<4 x float> %a, <4 x float> %b) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: pmax_v4f32: | 
|  | ; CHECK-NEXT: .functype pmax_v4f32 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.pmax $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.pmax.v4f32(<4 x float>, <4 x float>) | 
|  | define <4 x float> @pmax_v4f32(<4 x float> %a, <4 x float> %b) { | 
|  | %v = call <4 x float> @llvm.wasm.pmax.v4f32(<4 x float> %a, <4 x float> %b) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: ceil_v4f32: | 
|  | ; CHECK-NEXT: .functype ceil_v4f32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.ceil $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.ceil.v4f32(<4 x float>) | 
|  | define <4 x float> @ceil_v4f32(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.ceil.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: floor_v4f32: | 
|  | ; CHECK-NEXT: .functype floor_v4f32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.floor $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.floor.v4f32(<4 x float>) | 
|  | define <4 x float> @floor_v4f32(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.floor.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_v4f32: | 
|  | ; CHECK-NEXT: .functype trunc_v4f32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.trunc $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.trunc.v4f32(<4 x float>) | 
|  | define <4 x float> @trunc_v4f32(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.trunc.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v4f32: | 
|  | ; CHECK-NEXT: .functype nearest_v4f32 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.nearbyint.v4f32(<4 x float>) | 
|  | define <4 x float> @nearest_v4f32(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.nearbyint.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v4f32_via_rint: | 
|  | ; CHECK-NEXT: .functype nearest_v4f32_via_rint (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.rint.v4f32(<4 x float>) | 
|  | define <4 x float> @nearest_v4f32_via_rint(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.rint.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v4f32_via_roundeven: | 
|  | ; CHECK-NEXT: .functype nearest_v4f32_via_roundeven (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.roundeven.v4f32(<4 x float>) | 
|  | define <4 x float> @nearest_v4f32_via_roundeven(<4 x float> %a) { | 
|  | %v = call <4 x float> @llvm.roundeven.v4f32(<4 x float> %a) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: madd_v4f32: | 
|  | ; CHECK-NEXT: .functype madd_v4f32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.relaxed_madd $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.relaxed.madd.v4f32(<4 x float>, <4 x float>, <4 x float>) | 
|  | define <4 x float> @madd_v4f32(<4 x float> %a, <4 x float> %b, <4 x float> %c) { | 
|  | %v = call <4 x float> @llvm.wasm.relaxed.madd.v4f32( | 
|  | <4 x float> %a, <4 x float> %b, <4 x float> %c | 
|  | ) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nmadd_v4f32: | 
|  | ; CHECK-NEXT: .functype nmadd_v4f32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.relaxed_nmadd $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.relaxed.nmadd.v4f32(<4 x float>, <4 x float>, <4 x float>) | 
|  | define <4 x float> @nmadd_v4f32(<4 x float> %a, <4 x float> %b, <4 x float> %c) { | 
|  | %v = call <4 x float> @llvm.wasm.relaxed.nmadd.v4f32( | 
|  | <4 x float> %a, <4 x float> %b, <4 x float> %c | 
|  | ) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_min_v4f32: | 
|  | ; CHECK-NEXT: .functype relaxed_min_v4f32 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.relaxed_min $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.relaxed.min.v4f32(<4 x float>, <4 x float>) | 
|  | define <4 x float> @relaxed_min_v4f32(<4 x float> %a, <4 x float> %b) { | 
|  | %v = call <4 x float> @llvm.wasm.relaxed.min.v4f32( | 
|  | <4 x float> %a, <4 x float> %b | 
|  | ) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_max_v4f32: | 
|  | ; CHECK-NEXT: .functype relaxed_max_v4f32 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.relaxed_max $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.relaxed.max.v4f32(<4 x float>, <4 x float>) | 
|  | define <4 x float> @relaxed_max_v4f32(<4 x float> %a, <4 x float> %b) { | 
|  | %v = call <4 x float> @llvm.wasm.relaxed.max.v4f32( | 
|  | <4 x float> %a, <4 x float> %b | 
|  | ) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_dot_bf16x8_add_f32: | 
|  | ; CHECK-NEXT: .functype relaxed_dot_bf16x8_add_f32 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f32x4.relaxed_dot_bf16x8_add_f32 $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <4 x float> @llvm.wasm.relaxed.dot.bf16x8.add.f32(<8 x i16>, <8 x i16>, | 
|  | <4 x float>) | 
|  | define <4 x float> @relaxed_dot_bf16x8_add_f32(<8 x i16> %a, <8 x i16> %b, | 
|  | <4 x float> %c) { | 
|  | %v = call <4 x float> @llvm.wasm.relaxed.dot.bf16x8.add.f32( | 
|  | <8 x i16> %a, <8 x i16> %b, <4 x float> %c | 
|  | ) | 
|  | ret <4 x float> %v | 
|  | } | 
|  |  | 
|  | ; ============================================================================== | 
|  | ; 2 x f64 | 
|  | ; ============================================================================== | 
|  | ; CHECK-LABEL: bitselect_v2f64: | 
|  | ; CHECK-NEXT: .functype bitselect_v2f64 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: v128.bitselect $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.bitselect.v2f64(<2 x double>, <2 x double>, <2 x double>) | 
|  | define <2 x double> @bitselect_v2f64(<2 x double> %v1, <2 x double> %v2, <2 x double> %c) { | 
|  | %a = call <2 x double> @llvm.wasm.bitselect.v2f64( | 
|  | <2 x double> %v1, <2 x double> %v2, <2 x double> %c | 
|  | ) | 
|  | ret <2 x double> %a | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: pmin_v2f64: | 
|  | ; CHECK-NEXT: .functype pmin_v2f64 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.pmin $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.pmin.v2f64(<2 x double>, <2 x double>) | 
|  | define <2 x double> @pmin_v2f64(<2 x double> %a, <2 x double> %b) { | 
|  | %v = call <2 x double> @llvm.wasm.pmin.v2f64(<2 x double> %a, <2 x double> %b) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: pmax_v2f64: | 
|  | ; CHECK-NEXT: .functype pmax_v2f64 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.pmax $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.pmax.v2f64(<2 x double>, <2 x double>) | 
|  | define <2 x double> @pmax_v2f64(<2 x double> %a, <2 x double> %b) { | 
|  | %v = call <2 x double> @llvm.wasm.pmax.v2f64(<2 x double> %a, <2 x double> %b) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: ceil_v2f64: | 
|  | ; CHECK-NEXT: .functype ceil_v2f64 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.ceil $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.ceil.v2f64(<2 x double>) | 
|  | define <2 x double> @ceil_v2f64(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.ceil.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: floor_v2f64: | 
|  | ; CHECK-NEXT: .functype floor_v2f64 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.floor $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.floor.v2f64(<2 x double>) | 
|  | define <2 x double> @floor_v2f64(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.floor.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: trunc_v2f64: | 
|  | ; CHECK-NEXT: .functype trunc_v2f64 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.trunc $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.trunc.v2f64(<2 x double>) | 
|  | define <2 x double> @trunc_v2f64(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.trunc.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v2f64: | 
|  | ; CHECK-NEXT: .functype nearest_v2f64 (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.nearbyint.v2f64(<2 x double>) | 
|  | define <2 x double> @nearest_v2f64(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.nearbyint.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v2f64_via_rint: | 
|  | ; CHECK-NEXT: .functype nearest_v2f64_via_rint (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.rint.v2f64(<2 x double>) | 
|  | define <2 x double> @nearest_v2f64_via_rint(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.rint.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nearest_v2f64_via_roundeven: | 
|  | ; CHECK-NEXT: .functype nearest_v2f64_via_roundeven (v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.nearest $push[[R:[0-9]+]]=, $0{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.roundeven.v2f64(<2 x double>) | 
|  | define <2 x double> @nearest_v2f64_via_roundeven(<2 x double> %a) { | 
|  | %v = call <2 x double> @llvm.roundeven.v2f64(<2 x double> %a) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: madd_v2f64: | 
|  | ; CHECK-NEXT: .functype madd_v2f64 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.relaxed_madd $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.relaxed.madd.v2f64( | 
|  | <2 x double>, <2 x double>, <2 x double>) | 
|  | define <2 x double> @madd_v2f64(<2 x double> %a, <2 x double> %b, <2 x double> %c) { | 
|  | %v = call <2 x double> @llvm.wasm.relaxed.madd.v2f64( | 
|  | <2 x double> %a, <2 x double> %b, <2 x double> %c | 
|  | ) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: nmadd_v2f64: | 
|  | ; CHECK-NEXT: .functype nmadd_v2f64 (v128, v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.relaxed_nmadd $push[[R:[0-9]+]]=, $0, $1, $2{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.relaxed.nmadd.v2f64( | 
|  | <2 x double>, <2 x double>, <2 x double>) | 
|  | define <2 x double> @nmadd_v2f64(<2 x double> %a, <2 x double> %b, <2 x double> %c) { | 
|  | %v = call <2 x double> @llvm.wasm.relaxed.nmadd.v2f64( | 
|  | <2 x double> %a, <2 x double> %b, <2 x double> %c | 
|  | ) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_min_v2f64: | 
|  | ; CHECK-NEXT: .functype relaxed_min_v2f64 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.relaxed_min $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.relaxed.min.v2f64(<2 x double>, <2 x double>) | 
|  | define <2 x double> @relaxed_min_v2f64(<2 x double> %a, <2 x double> %b) { | 
|  | %v = call <2 x double> @llvm.wasm.relaxed.min.v2f64( | 
|  | <2 x double> %a, <2 x double> %b | 
|  | ) | 
|  | ret <2 x double> %v | 
|  | } | 
|  |  | 
|  | ; CHECK-LABEL: relaxed_max_v2f64: | 
|  | ; CHECK-NEXT: .functype relaxed_max_v2f64 (v128, v128) -> (v128){{$}} | 
|  | ; CHECK-NEXT: f64x2.relaxed_max $push[[R:[0-9]+]]=, $0, $1{{$}} | 
|  | ; CHECK-NEXT: return $pop[[R]]{{$}} | 
|  | declare <2 x double> @llvm.wasm.relaxed.max.v2f64(<2 x double>, <2 x double>) | 
|  | define <2 x double> @relaxed_max_v2f64(<2 x double> %a, <2 x double> %b) { | 
|  | %v = call <2 x double> @llvm.wasm.relaxed.max.v2f64( | 
|  | <2 x double> %a, <2 x double> %b | 
|  | ) | 
|  | ret <2 x double> %v | 
|  | } |