1; RUN: llc -mtriple=s390x-linux-gnu -mcpu=z13 < %s | FileCheck %s 2 3; Store a <4 x i31> vector. 4define void @fun0(<4 x i31> %src, <4 x i31>* %p) 5; CHECK-LABEL: fun0: 6; CHECK: # %bb.0: 7; CHECK-NEXT: vlgvf %r1, %v24, 0 8; CHECK-NEXT: vlgvf %r0, %v24, 1 9; CHECK-NEXT: sllg %r1, %r1, 29 10; CHECK-NEXT: rosbg %r1, %r0, 35, 63, 62 11; CHECK-NEXT: nihh %r1, 4095 12; CHECK-NEXT: stg %r1, 0(%r2) 13; CHECK-NEXT: vlgvf %r1, %v24, 2 14; CHECK-NEXT: risbgn %r0, %r0, 0, 129, 62 15; CHECK-NEXT: rosbg %r0, %r1, 2, 32, 31 16; CHECK-NEXT: vlgvf %r1, %v24, 3 17; CHECK-NEXT: rosbg %r0, %r1, 33, 63, 0 18; CHECK-NEXT: stg %r0, 8(%r2) 19; CHECK-NEXT: br %r14 20{ 21 store <4 x i31> %src, <4 x i31>* %p 22 ret void 23} 24 25; Store a <16 x i1> vector. 26define i16 @fun1(<16 x i1> %src) 27; CHECK-LABEL: fun1: 28; CHECK: # %bb.0: 29; CHECK-NEXT: aghi %r15, -168 30; CHECK-NEXT: .cfi_def_cfa_offset 328 31; CHECK-NEXT: vlgvb %r0, %v24, 0 32; CHECK-NEXT: vlgvb %r1, %v24, 1 33; CHECK-NEXT: risblg %r0, %r0, 16, 144, 15 34; CHECK-NEXT: rosbg %r0, %r1, 49, 49, 14 35; CHECK-NEXT: vlgvb %r1, %v24, 2 36; CHECK-NEXT: rosbg %r0, %r1, 50, 50, 13 37; CHECK-NEXT: vlgvb %r1, %v24, 3 38; CHECK-NEXT: rosbg %r0, %r1, 51, 51, 12 39; CHECK-NEXT: vlgvb %r1, %v24, 4 40; CHECK-NEXT: rosbg %r0, %r1, 52, 52, 11 41; CHECK-NEXT: vlgvb %r1, %v24, 5 42; CHECK-NEXT: rosbg %r0, %r1, 53, 53, 10 43; CHECK-NEXT: vlgvb %r1, %v24, 6 44; CHECK-NEXT: rosbg %r0, %r1, 54, 54, 9 45; CHECK-NEXT: vlgvb %r1, %v24, 7 46; CHECK-NEXT: rosbg %r0, %r1, 55, 55, 8 47; CHECK-NEXT: vlgvb %r1, %v24, 8 48; CHECK-NEXT: rosbg %r0, %r1, 56, 56, 7 49; CHECK-NEXT: vlgvb %r1, %v24, 9 50; CHECK-NEXT: rosbg %r0, %r1, 57, 57, 6 51; CHECK-NEXT: vlgvb %r1, %v24, 10 52; CHECK-NEXT: rosbg %r0, %r1, 58, 58, 5 53; CHECK-NEXT: vlgvb %r1, %v24, 11 54; CHECK-NEXT: rosbg %r0, %r1, 59, 59, 4 55; CHECK-NEXT: vlgvb %r1, %v24, 12 56; CHECK-NEXT: rosbg %r0, %r1, 60, 60, 3 57; CHECK-NEXT: vlgvb %r1, %v24, 13 58; CHECK-NEXT: rosbg %r0, %r1, 61, 61, 2 59; CHECK-NEXT: vlgvb %r1, %v24, 14 60; CHECK-NEXT: rosbg %r0, %r1, 62, 62, 1 61; CHECK-NEXT: vlgvb %r1, %v24, 15 62; CHECK-NEXT: rosbg %r0, %r1, 63, 63, 0 63; CHECK-NEXT: llhr %r2, %r0 64; CHECK-NEXT: aghi %r15, 168 65; CHECK-NEXT: br %r14 66{ 67 %res = bitcast <16 x i1> %src to i16 68 ret i16 %res 69} 70 71; Truncate a <8 x i32> vector to <8 x i31> and store it (test splitting). 72define void @fun2(<8 x i32> %src, <8 x i31>* %p) 73; CHECK-LABEL: fun2: 74; CHECK: # %bb.0: 75; CHECK-NEXT: stmg %r14, %r15, 112(%r15) 76; CHECK-NEXT: .cfi_offset %r14, -48 77; CHECK-NEXT: .cfi_offset %r15, -40 78; CHECK-NEXT: vlgvf %r3, %v26, 1 79; CHECK-NEXT: vlgvf %r1, %v26, 2 80; CHECK-NEXT: risbgn %r4, %r3, 0, 129, 62 81; CHECK-NEXT: rosbg %r4, %r1, 2, 32, 31 82; CHECK-DAG: vlgvf %r0, %v26, 3 83; CHECK-DAG: rosbg %r4, %r0, 33, 63, 0 84; CHECK-DAG: stc %r0, 30(%r2) 85; CHECK-DAG: srl %r0, 8 86; CHECK-DAG: vlgvf [[REG0:%r[0-9]+]], %v24, 1 87; CHECK-DAG: vlgvf [[REG1:%r[0-9]+]], %v24, 0 88; CHECK-DAG: sth %r0, 28(%r2) 89; CHECK-DAG: vlgvf [[REG2:%r[0-9]+]], %v24, 2 90; CHECK-DAG: risbgn [[REG3:%r[0-9]+]], [[REG0]], 0, 133, 58 91; CHECK-DAG: rosbg [[REG3]], [[REG2]], 6, 36, 27 92; CHECK-DAG: sllg [[REG4:%r[0-9]+]], [[REG1]], 25 93; CHECK-DAG: rosbg [[REG4]], [[REG0]], 39, 63, 58 94; CHECK-DAG: vlgvf [[REG5:%r[0-9]+]], %v24, 3 95; CHECK-DAG: rosbg [[REG3]], [[REG5]], 37, 63, 60 96; CHECK-DAG: sllg [[REG6:%r[0-9]+]], [[REG4]], 8 97; CHECK-DAG: rosbg [[REG6]], [[REG3]], 56, 63, 8 98; CHECK-NEXT: stg [[REG6]], 0(%r2) 99; CHECK-NEXT: srlg [[REG7:%r[0-9]+]], %r4, 24 100; CHECK-NEXT: st [[REG7]], 24(%r2) 101; CHECK-NEXT: vlgvf [[REG8:%r[0-9]+]], %v26, 0 102; CHECK-NEXT: risbgn [[REG10:%r[0-9]+]], [[REG5]], 0, 131, 60 103; CHECK-NEXT: rosbg [[REG10]], [[REG8]], 4, 34, 29 104; CHECK-NEXT: sllg [[REG9:%r[0-9]+]], [[REG3]], 8 105; CHECK-NEXT: rosbg [[REG10]], %r3, 35, 63, 62 106; CHECK-NEXT: rosbg [[REG9]], [[REG10]], 56, 63, 8 107; CHECK-NEXT: stg [[REG9]], 8(%r2) 108; CHECK-NEXT: sllg %r0, [[REG10]], 8 109; CHECK-NEXT: rosbg %r0, %r4, 56, 63, 8 110; CHECK-NEXT: stg %r0, 16(%r2) 111; CHECK-NEXT: lmg %r14, %r15, 112(%r15) 112; CHECK-NEXT: br %r14 113{ 114 %tmp = trunc <8 x i32> %src to <8 x i31> 115 store <8 x i31> %tmp, <8 x i31>* %p 116 ret void 117} 118 119; Load and store a <3 x i31> vector (test widening). 120define void @fun3(<3 x i31>* %src, <3 x i31>* %p) 121; CHECK-LABEL: fun3: 122; CHECK: # %bb.0: 123; CHECK-NEXT: llgf %r1, 0(%r2) 124; CHECK-NEXT: llgf %r0, 3(%r2) 125; CHECK-NEXT: sllg %r4, %r1, 62 126; CHECK-NEXT: rosbg %r4, %r0, 0, 32, 31 127; CHECK-NEXT: llgf %r0, 6(%r2) 128; CHECK-NEXT: ogr %r0, %r4 129; CHECK-NEXT: st %r0, 8(%r3) 130; CHECK-NEXT: srlg %r0, %r4, 32 131; CHECK-NEXT: sllg %r1, %r1, 30 132; CHECK-NEXT: lr %r1, %r0 133; CHECK-NEXT: nihh %r1, 8191 134; CHECK-NEXT: stg %r1, 0(%r3) 135; CHECK-NEXT: br %r14 136{ 137 %tmp = load <3 x i31>, <3 x i31>* %src 138 store <3 x i31> %tmp, <3 x i31>* %p 139 ret void 140} 141