; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=+unimplemented-simd128 | FileCheck %s

; Test that the logic to choose between v128.const vector
; initialization and splat vector initialization and to optimize the
; choice of splat value works correctly.

target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
target triple = "wasm32-unknown-unknown"

; Every constant lane holds 42 and only lane 5 is overwritten with the
; argument, so the expected lowering is a splat of 42 followed by a single
; replace_lane.
; NOTE: despite the "i8x16" suffix in its name, this function operates on
; <8 x i16>; the name is kept unchanged.
; CHECK-LABEL: same_const_one_replaced_i8x16:
; CHECK-NEXT:  .functype       same_const_one_replaced_i8x16 (i32) -> (v128)
; CHECK-NEXT:  i32.const       $push[[L0:[0-9]+]]=, 42
; CHECK-NEXT:  i16x8.splat     $push[[L1:[0-9]+]]=, $pop[[L0]]
; CHECK-NEXT:  i16x8.replace_lane      $push[[L2:[0-9]+]]=, $pop[[L1]], 5, $0
; CHECK-NEXT:  return          $pop[[L2]]
define <8 x i16> @same_const_one_replaced_i8x16(i16 %x) {
  %v = insertelement
    <8 x i16> <i16 42, i16 42, i16 42, i16 42, i16 42, i16 42, i16 42, i16 42>,
    i16 %x,
    i32 5
  ret <8 x i16> %v
}

; The constant lanes all differ, so the expected lowering is a v128.const
; followed by a replace_lane for lane 5. The overwritten lane is expected to
; appear as 0 in the constant rather than the original -6.
; NOTE: despite the "i8x16" suffix in its name, this function operates on
; <8 x i16>; the name is kept unchanged.
; CHECK-LABEL: different_const_one_replaced_i8x16:
; CHECK-NEXT:  .functype       different_const_one_replaced_i8x16 (i32) -> (v128)
; CHECK-NEXT:  v128.const      $push[[L0:[0-9]+]]=, 1, -2, 3, -4, 5, 0, 7, -8
; CHECK-NEXT:  i16x8.replace_lane      $push[[L1:[0-9]+]]=, $pop[[L0]], 5, $0
; CHECK-NEXT:  return          $pop[[L1]]
define <8 x i16> @different_const_one_replaced_i8x16(i16 %x) {
  %v = insertelement
    <8 x i16> <i16 1, i16 -2, i16 3, i16 -4, i16 5, i16 -6, i16 7, i16 -8>,
    i16 %x,
    i32 5
  ret <8 x i16> %v
}

; Floating-point variant of the uniform-constant case: all constant lanes are
; 42.0 and lane 2 is overwritten with the argument, so a splat of 42.0 plus
; one replace_lane is expected.
; CHECK-LABEL: same_const_one_replaced_f32x4:
; CHECK-NEXT:  .functype       same_const_one_replaced_f32x4 (f32) -> (v128)
; CHECK-NEXT:  f32.const       $push[[L0:[0-9]+]]=, 0x1.5p5
; CHECK-NEXT:  f32x4.splat     $push[[L1:[0-9]+]]=, $pop[[L0]]
; CHECK-NEXT:  f32x4.replace_lane      $push[[L2:[0-9]+]]=, $pop[[L1]], 2, $0
; CHECK-NEXT:  return          $pop[[L2]]
define <4 x float> @same_const_one_replaced_f32x4(float %x) {
  %v = insertelement
    <4 x float> <float 42., float 42., float 42., float 42.>,
    float %x,
    i32 2
  ret <4 x float> %v
}

; Floating-point variant of the distinct-constants case: a v128.const is
; expected, with the overwritten lane 2 appearing as 0.0 in the constant
; rather than the original 3.0, followed by one replace_lane.
; CHECK-LABEL: different_const_one_replaced_f32x4:
; CHECK-NEXT:  .functype       different_const_one_replaced_f32x4 (f32) -> (v128)
; CHECK-NEXT:  v128.const      $push[[L0:[0-9]+]]=, 0x1p0, 0x1p1, 0x0p0, 0x1p2
; CHECK-NEXT:  f32x4.replace_lane      $push[[L1:[0-9]+]]=, $pop[[L0]], 2, $0
; CHECK-NEXT:  return          $pop[[L1]]
define <4 x float> @different_const_one_replaced_f32x4(float %x) {
  %v = insertelement
    <4 x float> <float 1., float 2., float 3., float 4.>,
    float %x,
    i32 2
  ret <4 x float> %v
}

; The vector is <undef, 3, 3, 1>: the most frequent constant (3) is expected
; to be splatted, lane 3 is then replaced with 1, and no instruction is
; expected for the undef lane 0.
; CHECK-LABEL: splat_common_const_i32x4:
; CHECK-NEXT:  .functype       splat_common_const_i32x4 () -> (v128)
; CHECK-NEXT:  i32.const       $push[[L0:[0-9]+]]=, 3
; CHECK-NEXT:  i32x4.splat     $push[[L1:[0-9]+]]=, $pop[[L0]]
; CHECK-NEXT:  i32.const       $push[[L2:[0-9]+]]=, 1
; CHECK-NEXT:  i32x4.replace_lane      $push[[L3:[0-9]+]]=, $pop[[L1]], 3, $pop[[L2]]
; CHECK-NEXT:  return          $pop[[L3]]
define <4 x i32> @splat_common_const_i32x4() {
  ret <4 x i32> <i32 undef, i32 3, i32 3, i32 1>
}

; Lanes are filled from three arguments: %c in lanes 1, 3, 5 and 6 (four
; lanes), %b in lanes 0, 4 and 7 (three lanes), and %a in lane 2. The most
; frequent value (%c, i.e. $2) is expected to be splatted, with the four
; remaining lanes patched by replace_lane.
; CHECK-LABEL: splat_common_arg_i16x8:
; CHECK-NEXT:  .functype       splat_common_arg_i16x8 (i32, i32, i32) -> (v128)
; CHECK-NEXT:  i16x8.splat     $push[[L0:[0-9]+]]=, $2
; CHECK-NEXT:  i16x8.replace_lane      $push[[L1:[0-9]+]]=, $pop[[L0]], 0, $1
; CHECK-NEXT:  i16x8.replace_lane      $push[[L2:[0-9]+]]=, $pop[[L1]], 2, $0
; CHECK-NEXT:  i16x8.replace_lane      $push[[L3:[0-9]+]]=, $pop[[L2]], 4, $1
; CHECK-NEXT:  i16x8.replace_lane      $push[[L4:[0-9]+]]=, $pop[[L3]], 7, $1
; CHECK-NEXT:  return          $pop[[L4]]
define <8 x i16> @splat_common_arg_i16x8(i16 %a, i16 %b, i16 %c) {
  %v0 = insertelement <8 x i16> undef, i16 %b, i32 0
  %v1 = insertelement <8 x i16> %v0, i16 %c, i32 1
  %v2 = insertelement <8 x i16> %v1, i16 %a, i32 2
  %v3 = insertelement <8 x i16> %v2, i16 %c, i32 3
  %v4 = insertelement <8 x i16> %v3, i16 %b, i32 4
  %v5 = insertelement <8 x i16> %v4, i16 %c, i32 5
  %v6 = insertelement <8 x i16> %v5, i16 %c, i32 6
  %v7 = insertelement <8 x i16> %v6, i16 %b, i32 7
  ret <8 x i16> %v7
}

; Only lane 1 is defined (constant 42.0) and the other lanes are undef, so a
; plain splat of 42.0 with no replace_lane is expected.
; CHECK-LABEL: undef_const_insert_f32x4:
; CHECK-NEXT:  .functype       undef_const_insert_f32x4 () -> (v128)
; CHECK-NEXT:  f32.const       $push[[L0:[0-9]+]]=, 0x1.5p5
; CHECK-NEXT:  f32x4.splat     $push[[L1:[0-9]+]]=, $pop[[L0]]
; CHECK-NEXT:  return          $pop[[L1]]
define <4 x float> @undef_const_insert_f32x4() {
  %v = insertelement <4 x float> undef, float 42., i32 1
  ret <4 x float> %v
}

; Only lane 3 is defined (the argument) and the other lanes are undef, so a
; plain splat of the argument with no replace_lane is expected.
; CHECK-LABEL: undef_arg_insert_i32x4:
; CHECK-NEXT:  .functype       undef_arg_insert_i32x4 (i32) -> (v128)
; CHECK-NEXT:  i32x4.splat     $push[[L0:[0-9]+]]=, $0
; CHECK-NEXT:  return          $pop[[L0]]
define <4 x i32> @undef_arg_insert_i32x4(i32 %x) {
  %v = insertelement <4 x i32> undef, i32 %x, i32 3
  ret <4 x i32> %v
}

; Inserting an undef element into an undef vector leaves every lane undef;
; the expected output is a bare return with no vector-building instructions.
; CHECK-LABEL: all_undef_i8x16:
; CHECK-NEXT:  .functype       all_undef_i8x16 () -> (v128)
; CHECK-NEXT:  return          $0
define <16 x i8> @all_undef_i8x16() {
  %v = insertelement <16 x i8> undef, i8 undef, i32 4
  ret <16 x i8> %v
}

; Returning a fully undef vector directly; the expected output is a bare
; return with no vector-building instructions.
; CHECK-LABEL: all_undef_f64x2:
; CHECK-NEXT:  .functype       all_undef_f64x2 () -> (v128)
; CHECK-NEXT:  return          $0
define <2 x double> @all_undef_f64x2() {
  ret <2 x double> undef
}
