1; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py 2; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse2 | FileCheck %s 3 4declare <2 x i64> @llvm.cttz.v2i64(<2 x i64>, i1) 5declare <2 x i64> @llvm.ctlz.v2i64(<2 x i64>, i1) 6declare <2 x i64> @llvm.ctpop.v2i64(<2 x i64>) 7 8define <2 x i64> @footz(<2 x i64> %a) nounwind { 9; CHECK-LABEL: footz: 10; CHECK: # BB#0: 11; CHECK-NEXT: pxor %xmm1, %xmm1 12; CHECK-NEXT: pxor %xmm2, %xmm2 13; CHECK-NEXT: psubq %xmm0, %xmm2 14; CHECK-NEXT: pand %xmm0, %xmm2 15; CHECK-NEXT: psubq {{.*}}(%rip), %xmm2 16; CHECK-NEXT: movdqa %xmm2, %xmm0 17; CHECK-NEXT: psrlq $1, %xmm0 18; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 19; CHECK-NEXT: psubq %xmm0, %xmm2 20; CHECK-NEXT: movdqa {{.*#+}} xmm0 = [3689348814741910323,3689348814741910323] 21; CHECK-NEXT: movdqa %xmm2, %xmm3 22; CHECK-NEXT: pand %xmm0, %xmm3 23; CHECK-NEXT: psrlq $2, %xmm2 24; CHECK-NEXT: pand %xmm0, %xmm2 25; CHECK-NEXT: paddq %xmm3, %xmm2 26; CHECK-NEXT: movdqa %xmm2, %xmm0 27; CHECK-NEXT: psrlq $4, %xmm0 28; CHECK-NEXT: paddq %xmm2, %xmm0 29; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 30; CHECK-NEXT: psadbw %xmm1, %xmm0 31; CHECK-NEXT: retq 32 %c = call <2 x i64> @llvm.cttz.v2i64(<2 x i64> %a, i1 true) 33 ret <2 x i64> %c 34 35} 36define <2 x i64> @foolz(<2 x i64> %a) nounwind { 37; CHECK-LABEL: foolz: 38; CHECK: # BB#0: 39; CHECK-NEXT: movdqa %xmm0, %xmm1 40; CHECK-NEXT: psrlq $1, %xmm1 41; CHECK-NEXT: por %xmm0, %xmm1 42; CHECK-NEXT: movdqa %xmm1, %xmm0 43; CHECK-NEXT: psrlq $2, %xmm0 44; CHECK-NEXT: por %xmm1, %xmm0 45; CHECK-NEXT: movdqa %xmm0, %xmm1 46; CHECK-NEXT: psrlq $4, %xmm1 47; CHECK-NEXT: por %xmm0, %xmm1 48; CHECK-NEXT: movdqa %xmm1, %xmm0 49; CHECK-NEXT: psrlq $8, %xmm0 50; CHECK-NEXT: por %xmm1, %xmm0 51; CHECK-NEXT: movdqa %xmm0, %xmm1 52; CHECK-NEXT: psrlq $16, %xmm1 53; CHECK-NEXT: por %xmm0, %xmm1 54; CHECK-NEXT: movdqa %xmm1, %xmm0 55; CHECK-NEXT: psrlq $32, %xmm0 56; CHECK-NEXT: por %xmm1, %xmm0 57; CHECK-NEXT: pcmpeqd %xmm1, %xmm1 58; CHECK-NEXT: pxor %xmm0, %xmm1 59; CHECK-NEXT: movdqa %xmm1, %xmm0 60; CHECK-NEXT: psrlq $1, %xmm0 61; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 62; CHECK-NEXT: psubq %xmm0, %xmm1 63; CHECK-NEXT: movdqa {{.*#+}} xmm0 = [3689348814741910323,3689348814741910323] 64; CHECK-NEXT: movdqa %xmm1, %xmm2 65; CHECK-NEXT: pand %xmm0, %xmm2 66; CHECK-NEXT: psrlq $2, %xmm1 67; CHECK-NEXT: pand %xmm0, %xmm1 68; CHECK-NEXT: paddq %xmm2, %xmm1 69; CHECK-NEXT: movdqa %xmm1, %xmm2 70; CHECK-NEXT: psrlq $4, %xmm2 71; CHECK-NEXT: paddq %xmm1, %xmm2 72; CHECK-NEXT: pand {{.*}}(%rip), %xmm2 73; CHECK-NEXT: pxor %xmm0, %xmm0 74; CHECK-NEXT: psadbw %xmm2, %xmm0 75; CHECK-NEXT: retq 76 %c = call <2 x i64> @llvm.ctlz.v2i64(<2 x i64> %a, i1 true) 77 ret <2 x i64> %c 78 79} 80 81define <2 x i64> @foopop(<2 x i64> %a) nounwind { 82; CHECK-LABEL: foopop: 83; CHECK: # BB#0: 84; CHECK-NEXT: movdqa %xmm0, %xmm1 85; CHECK-NEXT: psrlq $1, %xmm1 86; CHECK-NEXT: pand {{.*}}(%rip), %xmm1 87; CHECK-NEXT: psubq %xmm1, %xmm0 88; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [3689348814741910323,3689348814741910323] 89; CHECK-NEXT: movdqa %xmm0, %xmm2 90; CHECK-NEXT: pand %xmm1, %xmm2 91; CHECK-NEXT: psrlq $2, %xmm0 92; CHECK-NEXT: pand %xmm1, %xmm0 93; CHECK-NEXT: paddq %xmm2, %xmm0 94; CHECK-NEXT: movdqa %xmm0, %xmm1 95; CHECK-NEXT: psrlq $4, %xmm1 96; CHECK-NEXT: paddq %xmm0, %xmm1 97; CHECK-NEXT: pand {{.*}}(%rip), %xmm1 98; CHECK-NEXT: pxor %xmm0, %xmm0 99; CHECK-NEXT: psadbw %xmm0, %xmm1 100; CHECK-NEXT: movdqa %xmm1, %xmm0 101; CHECK-NEXT: retq 102 %c = call <2 x i64> @llvm.ctpop.v2i64(<2 x i64> %a) 103 ret <2 x i64> %c 104} 105 106declare <2 x i32> @llvm.cttz.v2i32(<2 x i32>, i1) 107declare <2 x i32> @llvm.ctlz.v2i32(<2 x i32>, i1) 108declare <2 x i32> @llvm.ctpop.v2i32(<2 x i32>) 109 110define <2 x i32> @promtz(<2 x i32> %a) nounwind { 111; CHECK-LABEL: promtz: 112; CHECK: # BB#0: 113; CHECK-NEXT: por {{.*}}(%rip), %xmm0 114; CHECK-NEXT: pxor %xmm1, %xmm1 115; CHECK-NEXT: pxor %xmm2, %xmm2 116; CHECK-NEXT: psubq %xmm0, %xmm2 117; CHECK-NEXT: pand %xmm0, %xmm2 118; CHECK-NEXT: psubq {{.*}}(%rip), %xmm2 119; CHECK-NEXT: movdqa %xmm2, %xmm0 120; CHECK-NEXT: psrlq $1, %xmm0 121; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 122; CHECK-NEXT: psubq %xmm0, %xmm2 123; CHECK-NEXT: movdqa {{.*#+}} xmm0 = [3689348814741910323,3689348814741910323] 124; CHECK-NEXT: movdqa %xmm2, %xmm3 125; CHECK-NEXT: pand %xmm0, %xmm3 126; CHECK-NEXT: psrlq $2, %xmm2 127; CHECK-NEXT: pand %xmm0, %xmm2 128; CHECK-NEXT: paddq %xmm3, %xmm2 129; CHECK-NEXT: movdqa %xmm2, %xmm0 130; CHECK-NEXT: psrlq $4, %xmm0 131; CHECK-NEXT: paddq %xmm2, %xmm0 132; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 133; CHECK-NEXT: psadbw %xmm1, %xmm0 134; CHECK-NEXT: retq 135 %c = call <2 x i32> @llvm.cttz.v2i32(<2 x i32> %a, i1 false) 136 ret <2 x i32> %c 137 138} 139define <2 x i32> @promlz(<2 x i32> %a) nounwind { 140; CHECK-LABEL: promlz: 141; CHECK: # BB#0: 142; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 143; CHECK-NEXT: pxor %xmm1, %xmm1 144; CHECK-NEXT: movdqa %xmm0, %xmm2 145; CHECK-NEXT: psrlq $1, %xmm2 146; CHECK-NEXT: por %xmm0, %xmm2 147; CHECK-NEXT: movdqa %xmm2, %xmm0 148; CHECK-NEXT: psrlq $2, %xmm0 149; CHECK-NEXT: por %xmm2, %xmm0 150; CHECK-NEXT: movdqa %xmm0, %xmm2 151; CHECK-NEXT: psrlq $4, %xmm2 152; CHECK-NEXT: por %xmm0, %xmm2 153; CHECK-NEXT: movdqa %xmm2, %xmm0 154; CHECK-NEXT: psrlq $8, %xmm0 155; CHECK-NEXT: por %xmm2, %xmm0 156; CHECK-NEXT: movdqa %xmm0, %xmm2 157; CHECK-NEXT: psrlq $16, %xmm2 158; CHECK-NEXT: por %xmm0, %xmm2 159; CHECK-NEXT: movdqa %xmm2, %xmm0 160; CHECK-NEXT: psrlq $32, %xmm0 161; CHECK-NEXT: por %xmm2, %xmm0 162; CHECK-NEXT: pcmpeqd %xmm2, %xmm2 163; CHECK-NEXT: pxor %xmm0, %xmm2 164; CHECK-NEXT: movdqa %xmm2, %xmm0 165; CHECK-NEXT: psrlq $1, %xmm0 166; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 167; CHECK-NEXT: psubq %xmm0, %xmm2 168; CHECK-NEXT: movdqa {{.*#+}} xmm0 = [3689348814741910323,3689348814741910323] 169; CHECK-NEXT: movdqa %xmm2, %xmm3 170; CHECK-NEXT: pand %xmm0, %xmm3 171; CHECK-NEXT: psrlq $2, %xmm2 172; CHECK-NEXT: pand %xmm0, %xmm2 173; CHECK-NEXT: paddq %xmm3, %xmm2 174; CHECK-NEXT: movdqa %xmm2, %xmm0 175; CHECK-NEXT: psrlq $4, %xmm0 176; CHECK-NEXT: paddq %xmm2, %xmm0 177; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 178; CHECK-NEXT: psadbw %xmm1, %xmm0 179; CHECK-NEXT: psubq {{.*}}(%rip), %xmm0 180; CHECK-NEXT: retq 181 %c = call <2 x i32> @llvm.ctlz.v2i32(<2 x i32> %a, i1 false) 182 ret <2 x i32> %c 183 184} 185 186define <2 x i32> @prompop(<2 x i32> %a) nounwind { 187; CHECK-LABEL: prompop: 188; CHECK: # BB#0: 189; CHECK-NEXT: pand {{.*}}(%rip), %xmm0 190; CHECK-NEXT: pxor %xmm2, %xmm2 191; CHECK-NEXT: movdqa %xmm0, %xmm1 192; CHECK-NEXT: psrlq $1, %xmm1 193; CHECK-NEXT: pand {{.*}}(%rip), %xmm1 194; CHECK-NEXT: psubq %xmm1, %xmm0 195; CHECK-NEXT: movdqa {{.*#+}} xmm1 = [3689348814741910323,3689348814741910323] 196; CHECK-NEXT: movdqa %xmm0, %xmm3 197; CHECK-NEXT: pand %xmm1, %xmm3 198; CHECK-NEXT: psrlq $2, %xmm0 199; CHECK-NEXT: pand %xmm1, %xmm0 200; CHECK-NEXT: paddq %xmm3, %xmm0 201; CHECK-NEXT: movdqa %xmm0, %xmm1 202; CHECK-NEXT: psrlq $4, %xmm1 203; CHECK-NEXT: paddq %xmm0, %xmm1 204; CHECK-NEXT: pand {{.*}}(%rip), %xmm1 205; CHECK-NEXT: psadbw %xmm2, %xmm1 206; CHECK-NEXT: movdqa %xmm1, %xmm0 207; CHECK-NEXT: retq 208 %c = call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> %a) 209 ret <2 x i32> %c 210} 211