1 // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --function-signature --include-generated-funcs --replace-value-regex "__omp_offloading_[0-9a-z]+_[0-9a-z]+" "reduction_size[.].+[.]" "pl_cond[.].+[.|,]" --prefix-filecheck-ir-name _ 2 // Test host code gen 3 // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK1 4 // RUN: %clang_cc1 -DLAMBDA -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s 5 // RUN: %clang_cc1 -DLAMBDA -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK2 6 // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK3 7 // RUN: %clang_cc1 -DLAMBDA -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s 8 // RUN: %clang_cc1 -DLAMBDA -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK4 9 10 // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK5 11 // RUN: %clang_cc1 -DLAMBDA -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s 12 // RUN: %clang_cc1 -DLAMBDA -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK6 13 // RUN: %clang_cc1 -DLAMBDA -verify -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK7 14 // RUN: %clang_cc1 -DLAMBDA -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s 15 // RUN: %clang_cc1 -DLAMBDA -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK8 16 17 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK9 18 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s 19 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK10 20 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK11 21 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s 22 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK12 23 24 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK13 25 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s 26 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK14 27 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix=CHECK15 28 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s 29 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix=CHECK16 30 // expected-no-diagnostics 31 #ifndef HEADER 32 #define HEADER 33 34 35 template <typename T> 36 T tmain() { 37 T *a, *b, *c; 38 int n = 10000; 39 int ch = 100; 40 41 // no schedule clauses 42 #pragma omp target 43 #pragma omp teams 44 #pragma omp distribute parallel for 45 for (int i = 0; i < n; ++i) { 46 #pragma omp cancel for 47 a[i] = b[i] + c[i]; 48 } 49 50 // dist_schedule: static no chunk 51 #pragma omp target 52 #pragma omp teams 53 #pragma omp distribute parallel for dist_schedule(static) 54 for (int i = 0; i < n; ++i) { 55 a[i] = b[i] + c[i]; 56 } 57 58 // dist_schedule: static chunk 59 #pragma omp target 60 #pragma omp teams 61 #pragma omp distribute parallel for dist_schedule(static, ch) 62 for (int i = 0; i < n; ++i) { 63 a[i] = b[i] + c[i]; 64 } 65 66 // schedule: static no chunk 67 #pragma omp target 68 #pragma omp teams 69 #pragma omp distribute parallel for schedule(static) 70 for (int i = 0; i < n; ++i) { 71 a[i] = b[i] + c[i]; 72 } 73 74 // schedule: static chunk 75 #pragma omp target 76 #pragma omp teams 77 #pragma omp distribute parallel for schedule(static, ch) 78 for (int i = 0; i < n; ++i) { 79 a[i] = b[i] + c[i]; 80 } 81 82 // schedule: dynamic no chunk 83 #pragma omp target 84 #pragma omp teams 85 #pragma omp distribute parallel for schedule(dynamic) 86 for (int i = 0; i < n; ++i) { 87 a[i] = b[i] + c[i]; 88 } 89 90 // schedule: dynamic chunk 91 #pragma omp target 92 #pragma omp teams 93 #pragma omp distribute parallel for schedule(dynamic, ch) 94 for (int i = 0; i < n; ++i) { 95 a[i] = b[i] + c[i]; 96 } 97 98 return T(); 99 } 100 101 int main() { 102 double *a, *b, *c; 103 int n = 10000; 104 int ch = 100; 105 106 #ifdef LAMBDA 107 [&]() { 108 109 110 111 112 113 114 115 116 // no schedule clauses 117 #pragma omp target 118 #pragma omp teams 119 120 #pragma omp distribute parallel for 121 for (int i = 0; i < n; ++i) { 122 a[i] = b[i] + c[i]; 123 124 125 // check EUB for distribute 126 127 // initialize omp.iv 128 129 // check exit condition 130 131 // check that PrevLB and PrevUB are passed to the 'for' 132 // check that distlb and distub are properly passed to fork_call 133 134 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 135 136 137 // implementation of 'parallel for' 138 139 140 // initialize lb and ub to PrevLB and PrevUB 141 142 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 143 // In this case we use EUB 144 145 // initialize omp.iv 146 147 // check exit condition 148 149 // check that PrevLB and PrevUB are passed to the 'for' 150 151 // check stride 1 for 'for' in 'distribute parallel for' 152 153 154 [&]() { 155 a[i] = b[i] + c[i]; 156 }(); 157 } 158 159 // dist_schedule: static no chunk (same sa default - no dist_schedule) 160 #pragma omp target 161 #pragma omp teams 162 163 #pragma omp distribute parallel for dist_schedule(static) 164 for (int i = 0; i < n; ++i) { 165 a[i] = b[i] + c[i]; 166 167 168 // check EUB for distribute 169 170 // initialize omp.iv 171 172 // check exit condition 173 174 // check that PrevLB and PrevUB are passed to the 'for' 175 // check that distlb and distub are properly passed to fork_call 176 177 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 178 179 180 // implementation of 'parallel for' 181 182 183 // initialize lb and ub to PrevLB and PrevUB 184 185 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 186 // In this case we use EUB 187 188 // initialize omp.iv 189 190 // check exit condition 191 192 // check that PrevLB and PrevUB are passed to the 'for' 193 194 // check stride 1 for 'for' in 'distribute parallel for' 195 196 [&]() { 197 a[i] = b[i] + c[i]; 198 }(); 199 } 200 201 // dist_schedule: static chunk 202 #pragma omp target 203 #pragma omp teams 204 205 #pragma omp distribute parallel for dist_schedule(static, ch) 206 for (int i = 0; i < n; ++i) { 207 a[i] = b[i] + c[i]; 208 209 210 // check EUB for distribute 211 212 // initialize omp.iv 213 214 // check exit condition 215 216 // check that PrevLB and PrevUB are passed to the 'for' 217 // check that distlb and distub are properly passed to fork_call 218 219 // check DistInc 220 221 // Update UB 222 223 // Store LB in IV 224 225 226 // loop exit 227 228 // skip implementation of 'parallel for': using default scheduling and was tested above 229 [&]() { 230 a[i] = b[i] + c[i]; 231 }(); 232 } 233 234 // schedule: static no chunk 235 #pragma omp target 236 #pragma omp teams 237 238 #pragma omp distribute parallel for schedule(static) 239 for (int i = 0; i < n; ++i) { 240 a[i] = b[i] + c[i]; 241 242 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 243 244 // 'parallel for' implementation is the same as the case without schedule clase (static no chunk is the default) 245 246 247 // initialize lb and ub to PrevLB and PrevUB 248 249 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 250 // In this case we use EUB 251 252 // initialize omp.iv 253 254 // check exit condition 255 256 // check that PrevLB and PrevUB are passed to the 'for' 257 258 // check stride 1 for 'for' in 'distribute parallel for' 259 260 261 [&]() { 262 a[i] = b[i] + c[i]; 263 }(); 264 } 265 266 // schedule: static chunk 267 #pragma omp target 268 #pragma omp teams 269 270 #pragma omp distribute parallel for schedule(static, ch) 271 for (int i = 0; i < n; ++i) { 272 a[i] = b[i] + c[i]; 273 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 274 275 // 'parallel for' implementation using outer and inner loops and PrevEUB 276 277 // initialize lb and ub to PrevLB and PrevUB 278 279 // check PrevEUB (using PrevUB instead of NumIt as upper bound) 280 281 // initialize omp.iv (IV = LB) 282 283 // outer loop: while (IV < UB) { 284 285 286 287 // skip body branch 288 289 // IV = IV + 1 and inner loop latch 290 291 // check NextLB and NextUB 292 293 294 [&]() { 295 a[i] = b[i] + c[i]; 296 }(); 297 } 298 299 // schedule: dynamic no chunk 300 #pragma omp target 301 #pragma omp teams 302 303 #pragma omp distribute parallel for schedule(dynamic) 304 for (int i = 0; i < n; ++i) { 305 a[i] = b[i] + c[i]; 306 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 307 308 // 'parallel for' implementation using outer and inner loops and PrevEUB 309 310 // initialize lb and ub to PrevLB and PrevUB 311 312 313 // initialize omp.iv (IV = LB) 314 315 316 // skip body branch 317 318 // IV = IV + 1 and inner loop latch 319 320 // check NextLB and NextUB 321 322 323 [&]() { 324 a[i] = b[i] + c[i]; 325 }(); 326 } 327 328 // schedule: dynamic chunk 329 #pragma omp target 330 #pragma omp teams 331 332 #pragma omp distribute parallel for schedule(dynamic, ch) 333 for (int i = 0; i < n; ++i) { 334 a[i] = b[i] + c[i]; 335 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 336 337 // 'parallel for' implementation using outer and inner loops and PrevEUB 338 339 // initialize lb and ub to PrevLB and PrevUB 340 341 342 // initialize omp.iv (IV = LB) 343 344 345 // skip body branch 346 347 // IV = IV + 1 and inner loop latch 348 349 // check NextLB and NextUB 350 351 352 [&]() { 353 a[i] = b[i] + c[i]; 354 }(); 355 } 356 }(); 357 return 0; 358 #else 359 360 361 362 363 364 365 366 367 368 // no schedule clauses 369 #pragma omp target 370 #pragma omp teams 371 372 #pragma omp distribute parallel for 373 for (int i = 0; i < n; ++i) { 374 a[i] = b[i] + c[i]; 375 376 377 // check EUB for distribute 378 379 // initialize omp.iv 380 381 // check exit condition 382 383 // check that PrevLB and PrevUB are passed to the 'for' 384 // check that distlb and distub are properly passed to fork_call 385 386 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 387 388 389 // implementation of 'parallel for' 390 391 392 // initialize lb and ub to PrevLB and PrevUB 393 394 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 395 // In this case we use EUB 396 397 // initialize omp.iv 398 399 // check exit condition 400 401 // check that PrevLB and PrevUB are passed to the 'for' 402 403 // check stride 1 for 'for' in 'distribute parallel for' 404 405 } 406 407 // dist_schedule: static no chunk 408 #pragma omp target 409 #pragma omp teams 410 411 #pragma omp distribute parallel for dist_schedule(static) 412 for (int i = 0; i < n; ++i) { 413 a[i] = b[i] + c[i]; 414 415 416 // check EUB for distribute 417 418 // initialize omp.iv 419 420 // check exit condition 421 422 // check that PrevLB and PrevUB are passed to the 'for' 423 // check that distlb and distub are properly passed to fork_call 424 425 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 426 427 428 // implementation of 'parallel for' 429 430 431 // initialize lb and ub to PrevLB and PrevUB 432 433 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 434 // In this case we use EUB 435 436 // initialize omp.iv 437 438 // check exit condition 439 440 // check that PrevLB and PrevUB are passed to the 'for' 441 442 // check stride 1 for 'for' in 'distribute parallel for' 443 444 } 445 446 // dist_schedule: static chunk 447 #pragma omp target 448 #pragma omp teams 449 450 #pragma omp distribute parallel for dist_schedule(static, ch) 451 for (int i = 0; i < n; ++i) { 452 a[i] = b[i] + c[i]; 453 454 // unlike the previous tests, in this one we have a outer and inner loop for 'distribute' 455 456 // check EUB for distribute 457 458 // initialize omp.iv 459 460 // check exit condition 461 462 // check that PrevLB and PrevUB are passed to the 'for' 463 // check that distlb and distub are properly passed to fork_call 464 465 // check DistInc 466 467 // Update UB 468 469 // Store LB in IV 470 471 472 // loop exit 473 474 // skip implementation of 'parallel for': using default scheduling and was tested above 475 } 476 477 // schedule: static no chunk 478 #pragma omp target 479 #pragma omp teams 480 481 #pragma omp distribute parallel for schedule(static) 482 for (int i = 0; i < n; ++i) { 483 a[i] = b[i] + c[i]; 484 485 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 486 487 // 'parallel for' implementation is the same as the case without schedule clase (static no chunk is the default) 488 489 490 // initialize lb and ub to PrevLB and PrevUB 491 492 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 493 // In this case we use EUB 494 495 // initialize omp.iv 496 497 // check exit condition 498 499 // check that PrevLB and PrevUB are passed to the 'for' 500 501 // check stride 1 for 'for' in 'distribute parallel for' 502 503 } 504 505 // schedule: static chunk 506 #pragma omp target 507 #pragma omp teams 508 509 #pragma omp distribute parallel for schedule(static, ch) 510 for (int i = 0; i < n; ++i) { 511 a[i] = b[i] + c[i]; 512 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 513 514 // 'parallel for' implementation using outer and inner loops and PrevEUB 515 516 // initialize lb and ub to PrevLB and PrevUB 517 518 // check PrevEUB (using PrevUB instead of NumIt as upper bound) 519 520 // initialize omp.iv (IV = LB) 521 522 // outer loop: while (IV < UB) { 523 524 525 526 // skip body branch 527 528 // IV = IV + 1 and inner loop latch 529 530 // check NextLB and NextUB 531 532 533 } 534 535 // schedule: dynamic no chunk 536 #pragma omp target 537 #pragma omp teams 538 539 #pragma omp distribute parallel for schedule(dynamic) 540 for (int i = 0; i < n; ++i) { 541 a[i] = b[i] + c[i]; 542 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 543 544 // 'parallel for' implementation using outer and inner loops and PrevEUB 545 546 // initialize lb and ub to PrevLB and PrevUB 547 548 549 // initialize omp.iv (IV = LB) 550 551 552 // skip body branch 553 554 // IV = IV + 1 and inner loop latch 555 556 // check NextLB and NextUB 557 558 559 } 560 561 // schedule: dynamic chunk 562 #pragma omp target 563 #pragma omp teams 564 565 #pragma omp distribute parallel for schedule(dynamic, ch) 566 for (int i = 0; i < n; ++i) { 567 a[i] = b[i] + c[i]; 568 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 569 570 // 'parallel for' implementation using outer and inner loops and PrevEUB 571 572 // initialize lb and ub to PrevLB and PrevUB 573 574 575 // initialize omp.iv (IV = LB) 576 577 578 // skip body branch 579 580 // IV = IV + 1 and inner loop latch 581 582 // check NextLB and NextUB 583 584 585 } 586 587 return tmain<int>(); 588 #endif 589 } 590 591 // check code 592 593 594 595 596 597 598 599 600 601 602 603 // check EUB for distribute 604 605 // initialize omp.iv 606 607 // check exit condition 608 609 // check that PrevLB and PrevUB are passed to the 'for' 610 // check that distlb and distub are properly passed to fork_call 611 612 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 613 614 615 // implementation of 'parallel for' 616 617 618 // initialize lb and ub to PrevLB and PrevUB 619 620 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 621 // In this case we use EUB 622 623 // initialize omp.iv 624 625 // check exit condition 626 627 // check that PrevLB and PrevUB are passed to the 'for' 628 629 // check stride 1 for 'for' in 'distribute parallel for' 630 631 632 633 634 635 // check EUB for distribute 636 637 // initialize omp.iv 638 639 // check exit condition 640 641 // check that PrevLB and PrevUB are passed to the 'for' 642 // check that distlb and distub are properly passed to fork_call 643 644 // increment by stride (distInc - 'parallel for' executes the whole chunk) and latch 645 646 647 // implementation of 'parallel for' 648 649 650 // initialize lb and ub to PrevLB and PrevUB 651 652 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 653 // In this case we use EUB 654 655 // initialize omp.iv 656 657 // check exit condition 658 659 // check that PrevLB and PrevUB are passed to the 'for' 660 661 // check stride 1 for 'for' in 'distribute parallel for' 662 663 664 665 666 // unlike the previous tests, in this one we have a outer and inner loop for 'distribute' 667 668 // check EUB for distribute 669 670 // initialize omp.iv 671 672 // check exit condition 673 674 // check that PrevLB and PrevUB are passed to the 'for' 675 // check that distlb and distub are properly passed to fork_call 676 677 // check DistInc 678 679 // Update UB 680 681 // Store LB in IV 682 683 684 // loop exit 685 686 // skip implementation of 'parallel for': using default scheduling and was tested above 687 688 689 690 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 691 692 // 'parallel for' implementation is the same as the case without schedule clase (static no chunk is the default) 693 694 695 // initialize lb and ub to PrevLB and PrevUB 696 697 // PrevEUB is only used when 'for' has a chunked schedule, otherwise EUB is used 698 // In this case we use EUB 699 700 // initialize omp.iv 701 702 // check exit condition 703 704 // check that PrevLB and PrevUB are passed to the 'for' 705 706 // check stride 1 for 'for' in 'distribute parallel for' 707 708 709 710 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 711 712 // 'parallel for' implementation using outer and inner loops and PrevEUB 713 714 // initialize lb and ub to PrevLB and PrevUB 715 716 // check PrevEUB (using PrevUB instead of NumIt as upper bound) 717 718 // initialize omp.iv (IV = LB) 719 720 // outer loop: while (IV < UB) { 721 722 723 724 // skip body branch 725 726 // IV = IV + 1 and inner loop latch 727 728 // check NextLB and NextUB 729 730 731 732 733 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 734 735 // 'parallel for' implementation using outer and inner loops and PrevEUB 736 737 // initialize lb and ub to PrevLB and PrevUB 738 739 740 // initialize omp.iv (IV = LB) 741 742 743 // skip body branch 744 745 // IV = IV + 1 and inner loop latch 746 747 // check NextLB and NextUB 748 749 750 751 752 // skip rest of implementation of 'distribute' as it is tested above for default dist_schedule case 753 754 // 'parallel for' implementation using outer and inner loops and PrevEUB 755 756 // initialize lb and ub to PrevLB and PrevUB 757 758 759 // initialize omp.iv (IV = LB) 760 761 762 // skip body branch 763 764 // IV = IV + 1 and inner loop latch 765 766 // check NextLB and NextUB 767 768 769 #endif 770 // CHECK1-LABEL: define {{[^@]+}}@main 771 // CHECK1-SAME: () #[[ATTR0:[0-9]+]] { 772 // CHECK1-NEXT: entry: 773 // CHECK1-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 774 // CHECK1-NEXT: [[A:%.*]] = alloca double*, align 8 775 // CHECK1-NEXT: [[B:%.*]] = alloca double*, align 8 776 // CHECK1-NEXT: [[C:%.*]] = alloca double*, align 8 777 // CHECK1-NEXT: [[N:%.*]] = alloca i32, align 4 778 // CHECK1-NEXT: [[CH:%.*]] = alloca i32, align 4 779 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 8 780 // CHECK1-NEXT: store i32 0, i32* [[RETVAL]], align 4 781 // CHECK1-NEXT: store i32 10000, i32* [[N]], align 4 782 // CHECK1-NEXT: store i32 100, i32* [[CH]], align 4 783 // CHECK1-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 784 // CHECK1-NEXT: store i32* [[N]], i32** [[TMP0]], align 8 785 // CHECK1-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 786 // CHECK1-NEXT: store double** [[A]], double*** [[TMP1]], align 8 787 // CHECK1-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 788 // CHECK1-NEXT: store double** [[B]], double*** [[TMP2]], align 8 789 // CHECK1-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 790 // CHECK1-NEXT: store double** [[C]], double*** [[TMP3]], align 8 791 // CHECK1-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 792 // CHECK1-NEXT: store i32* [[CH]], i32** [[TMP4]], align 8 793 // CHECK1-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(40) [[REF_TMP]]) 794 // CHECK1-NEXT: ret i32 0 795 // 796 // 797 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l117 798 // CHECK1-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2:[0-9]+]] { 799 // CHECK1-NEXT: entry: 800 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 801 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 802 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 803 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 804 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 805 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 806 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 807 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 808 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 809 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 810 // CHECK1-NEXT: ret void 811 // 812 // 813 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined. 814 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 815 // CHECK1-NEXT: entry: 816 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 817 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 818 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 819 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 820 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 821 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 822 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 823 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 824 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 825 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 826 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 827 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 828 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 829 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 830 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 831 // CHECK1-NEXT: [[I3:%.*]] = alloca i32, align 4 832 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 833 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 834 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 835 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 836 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 837 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 838 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 839 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 840 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 841 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 842 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 843 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 844 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 845 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 846 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 847 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 848 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 849 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 850 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 851 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 852 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 853 // CHECK1: omp.precond.then: 854 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 855 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 856 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 857 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 858 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 859 // CHECK1-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 860 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 861 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 862 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 863 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 864 // CHECK1-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 865 // CHECK1-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 866 // CHECK1: cond.true: 867 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 868 // CHECK1-NEXT: br label [[COND_END:%.*]] 869 // CHECK1: cond.false: 870 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 871 // CHECK1-NEXT: br label [[COND_END]] 872 // CHECK1: cond.end: 873 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 874 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 875 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 876 // CHECK1-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 877 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 878 // CHECK1: omp.inner.for.cond: 879 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 880 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 881 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 882 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 883 // CHECK1: omp.inner.for.body: 884 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 885 // CHECK1-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 886 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 887 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 888 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 889 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 890 // CHECK1: omp.inner.for.inc: 891 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 892 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 893 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 894 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 895 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 896 // CHECK1: omp.inner.for.end: 897 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 898 // CHECK1: omp.loop.exit: 899 // CHECK1-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 900 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 901 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 902 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 903 // CHECK1: omp.precond.end: 904 // CHECK1-NEXT: ret void 905 // 906 // 907 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..1 908 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 909 // CHECK1-NEXT: entry: 910 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 911 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 912 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 913 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 914 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 915 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 916 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 917 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 918 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 919 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 920 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 921 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 922 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 923 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 924 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 925 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 926 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 927 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 928 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_0:%.*]], align 8 929 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 930 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 931 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 932 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 933 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 934 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 935 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 936 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 937 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 938 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 939 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 940 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 941 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 942 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 943 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 944 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 945 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 946 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 947 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 948 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 949 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 950 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 951 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 952 // CHECK1: omp.precond.then: 953 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 954 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 955 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 956 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 957 // CHECK1-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 958 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 959 // CHECK1-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 960 // CHECK1-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 961 // CHECK1-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 962 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 963 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 964 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 965 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 966 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 967 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 968 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 969 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 970 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 971 // CHECK1: cond.true: 972 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 973 // CHECK1-NEXT: br label [[COND_END:%.*]] 974 // CHECK1: cond.false: 975 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 976 // CHECK1-NEXT: br label [[COND_END]] 977 // CHECK1: cond.end: 978 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 979 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 980 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 981 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 982 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 983 // CHECK1: omp.inner.for.cond: 984 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 985 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 986 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 987 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 988 // CHECK1: omp.inner.for.body: 989 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 990 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 991 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 992 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 993 // CHECK1-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 994 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 995 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 996 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 997 // CHECK1-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 998 // CHECK1-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 999 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 1000 // CHECK1-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 1001 // CHECK1-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 1002 // CHECK1-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 1003 // CHECK1-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 1004 // CHECK1-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 1005 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 1006 // CHECK1-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 1007 // CHECK1-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 1008 // CHECK1-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 1009 // CHECK1-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 0 1010 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 1011 // CHECK1-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 1 1012 // CHECK1-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 1013 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 2 1014 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 1015 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 3 1016 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 1017 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE_clEv"(%class.anon.0* nonnull dereferenceable(32) [[REF_TMP]]) 1018 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 1019 // CHECK1: omp.body.continue: 1020 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1021 // CHECK1: omp.inner.for.inc: 1022 // CHECK1-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1023 // CHECK1-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 1024 // CHECK1-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 1025 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1026 // CHECK1: omp.inner.for.end: 1027 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1028 // CHECK1: omp.loop.exit: 1029 // CHECK1-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1030 // CHECK1-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 1031 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 1032 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1033 // CHECK1: omp.precond.end: 1034 // CHECK1-NEXT: ret void 1035 // 1036 // 1037 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l160 1038 // CHECK1-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 1039 // CHECK1-NEXT: entry: 1040 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 1041 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 1042 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 1043 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 1044 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 1045 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 1046 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 1047 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 1048 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 1049 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 1050 // CHECK1-NEXT: ret void 1051 // 1052 // 1053 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..2 1054 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1055 // CHECK1-NEXT: entry: 1056 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1057 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1058 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1059 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1060 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1061 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1062 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1063 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1064 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1065 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1066 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1067 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 1068 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 1069 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1070 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1071 // CHECK1-NEXT: [[I3:%.*]] = alloca i32, align 4 1072 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1073 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1074 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1075 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1076 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1077 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1078 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1079 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1080 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1081 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1082 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1083 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 1084 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1085 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1086 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1087 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1088 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1089 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1090 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1091 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1092 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1093 // CHECK1: omp.precond.then: 1094 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 1095 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1096 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 1097 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1098 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1099 // CHECK1-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1100 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 1101 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1102 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1103 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1104 // CHECK1-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 1105 // CHECK1-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1106 // CHECK1: cond.true: 1107 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1108 // CHECK1-NEXT: br label [[COND_END:%.*]] 1109 // CHECK1: cond.false: 1110 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1111 // CHECK1-NEXT: br label [[COND_END]] 1112 // CHECK1: cond.end: 1113 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 1114 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 1115 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1116 // CHECK1-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 1117 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1118 // CHECK1: omp.inner.for.cond: 1119 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1120 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1121 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 1122 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1123 // CHECK1: omp.inner.for.body: 1124 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1125 // CHECK1-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 1126 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1127 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 1128 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 1129 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1130 // CHECK1: omp.inner.for.inc: 1131 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1132 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1133 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 1134 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 1135 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1136 // CHECK1: omp.inner.for.end: 1137 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1138 // CHECK1: omp.loop.exit: 1139 // CHECK1-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1140 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 1141 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 1142 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1143 // CHECK1: omp.precond.end: 1144 // CHECK1-NEXT: ret void 1145 // 1146 // 1147 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..3 1148 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1149 // CHECK1-NEXT: entry: 1150 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1151 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1152 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 1153 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 1154 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1155 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1156 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1157 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1158 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1159 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1160 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1161 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1162 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1163 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 1164 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 1165 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1166 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1167 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 1168 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_1:%.*]], align 8 1169 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1170 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1171 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1172 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1173 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1174 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1175 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1176 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1177 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1178 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1179 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1180 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1181 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1182 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 1183 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1184 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1185 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1186 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1187 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1188 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1189 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1190 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1191 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1192 // CHECK1: omp.precond.then: 1193 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 1194 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1195 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 1196 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1197 // CHECK1-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 1198 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1199 // CHECK1-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 1200 // CHECK1-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 1201 // CHECK1-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 1202 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1203 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1204 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1205 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 1206 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1207 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1208 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1209 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 1210 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1211 // CHECK1: cond.true: 1212 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1213 // CHECK1-NEXT: br label [[COND_END:%.*]] 1214 // CHECK1: cond.false: 1215 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1216 // CHECK1-NEXT: br label [[COND_END]] 1217 // CHECK1: cond.end: 1218 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 1219 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 1220 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 1221 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 1222 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1223 // CHECK1: omp.inner.for.cond: 1224 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1225 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1226 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 1227 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1228 // CHECK1: omp.inner.for.body: 1229 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1230 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 1231 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 1232 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 1233 // CHECK1-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 1234 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 1235 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 1236 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 1237 // CHECK1-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 1238 // CHECK1-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 1239 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 1240 // CHECK1-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 1241 // CHECK1-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 1242 // CHECK1-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 1243 // CHECK1-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 1244 // CHECK1-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 1245 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 1246 // CHECK1-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 1247 // CHECK1-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 1248 // CHECK1-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 1249 // CHECK1-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 0 1250 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 1251 // CHECK1-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 1 1252 // CHECK1-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 1253 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 2 1254 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 1255 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 3 1256 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 1257 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE0_clEv"(%class.anon.1* nonnull dereferenceable(32) [[REF_TMP]]) 1258 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 1259 // CHECK1: omp.body.continue: 1260 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1261 // CHECK1: omp.inner.for.inc: 1262 // CHECK1-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1263 // CHECK1-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 1264 // CHECK1-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 1265 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1266 // CHECK1: omp.inner.for.end: 1267 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1268 // CHECK1: omp.loop.exit: 1269 // CHECK1-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1270 // CHECK1-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 1271 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 1272 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1273 // CHECK1: omp.precond.end: 1274 // CHECK1-NEXT: ret void 1275 // 1276 // 1277 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l202 1278 // CHECK1-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 1279 // CHECK1-NEXT: entry: 1280 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 1281 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 1282 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 1283 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 1284 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 1285 // CHECK1-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 1286 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 1287 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 1288 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 1289 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 1290 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 1291 // CHECK1-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 1292 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 1293 // CHECK1-NEXT: ret void 1294 // 1295 // 1296 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..6 1297 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1298 // CHECK1-NEXT: entry: 1299 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1300 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1301 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 1302 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1303 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1304 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1305 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1306 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1307 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1308 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1309 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1310 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1311 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 1312 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 1313 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1314 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1315 // CHECK1-NEXT: [[I3:%.*]] = alloca i32, align 4 1316 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1317 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1318 // CHECK1-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 1319 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1320 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1321 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1322 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1323 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 1324 // CHECK1-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1325 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 1326 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 1327 // CHECK1-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 1328 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 1329 // CHECK1-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 1330 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1331 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 1332 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1333 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1334 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1335 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1336 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1337 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 1338 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1339 // CHECK1: omp.precond.then: 1340 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 1341 // CHECK1-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1342 // CHECK1-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 1343 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1344 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1345 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 1346 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1347 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 1348 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 1349 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1350 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1351 // CHECK1-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 1352 // CHECK1-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1353 // CHECK1: cond.true: 1354 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1355 // CHECK1-NEXT: br label [[COND_END:%.*]] 1356 // CHECK1: cond.false: 1357 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1358 // CHECK1-NEXT: br label [[COND_END]] 1359 // CHECK1: cond.end: 1360 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 1361 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 1362 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1363 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 1364 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1365 // CHECK1: omp.inner.for.cond: 1366 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1367 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1368 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 1369 // CHECK1-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 1370 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1371 // CHECK1: omp.inner.for.body: 1372 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1373 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 1374 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1375 // CHECK1-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 1376 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 1377 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1378 // CHECK1: omp.inner.for.inc: 1379 // CHECK1-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1380 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1381 // CHECK1-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 1382 // CHECK1-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 1383 // CHECK1-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1384 // CHECK1-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1385 // CHECK1-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 1386 // CHECK1-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 1387 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1388 // CHECK1-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1389 // CHECK1-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 1390 // CHECK1-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 1391 // CHECK1-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1392 // CHECK1-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1393 // CHECK1-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 1394 // CHECK1-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 1395 // CHECK1: cond.true10: 1396 // CHECK1-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1397 // CHECK1-NEXT: br label [[COND_END12:%.*]] 1398 // CHECK1: cond.false11: 1399 // CHECK1-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1400 // CHECK1-NEXT: br label [[COND_END12]] 1401 // CHECK1: cond.end12: 1402 // CHECK1-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 1403 // CHECK1-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 1404 // CHECK1-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1405 // CHECK1-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 1406 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1407 // CHECK1: omp.inner.for.end: 1408 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1409 // CHECK1: omp.loop.exit: 1410 // CHECK1-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1411 // CHECK1-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 1412 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 1413 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1414 // CHECK1: omp.precond.end: 1415 // CHECK1-NEXT: ret void 1416 // 1417 // 1418 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..7 1419 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1420 // CHECK1-NEXT: entry: 1421 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1422 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1423 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 1424 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 1425 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1426 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1427 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1428 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1429 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1430 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1431 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1432 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1433 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1434 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 1435 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 1436 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1437 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1438 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 1439 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_2:%.*]], align 8 1440 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1441 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1442 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1443 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1444 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1445 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1446 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1447 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1448 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1449 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1450 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1451 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1452 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1453 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 1454 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1455 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1456 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1457 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1458 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1459 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1460 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1461 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1462 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1463 // CHECK1: omp.precond.then: 1464 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 1465 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1466 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 1467 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1468 // CHECK1-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 1469 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1470 // CHECK1-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 1471 // CHECK1-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 1472 // CHECK1-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 1473 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1474 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1475 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1476 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 1477 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1478 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1479 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1480 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 1481 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1482 // CHECK1: cond.true: 1483 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1484 // CHECK1-NEXT: br label [[COND_END:%.*]] 1485 // CHECK1: cond.false: 1486 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1487 // CHECK1-NEXT: br label [[COND_END]] 1488 // CHECK1: cond.end: 1489 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 1490 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 1491 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 1492 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 1493 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1494 // CHECK1: omp.inner.for.cond: 1495 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1496 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1497 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 1498 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1499 // CHECK1: omp.inner.for.body: 1500 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1501 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 1502 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 1503 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 1504 // CHECK1-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 1505 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 1506 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 1507 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 1508 // CHECK1-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 1509 // CHECK1-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 1510 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 1511 // CHECK1-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 1512 // CHECK1-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 1513 // CHECK1-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 1514 // CHECK1-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 1515 // CHECK1-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 1516 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 1517 // CHECK1-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 1518 // CHECK1-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 1519 // CHECK1-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 1520 // CHECK1-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 0 1521 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 1522 // CHECK1-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 1 1523 // CHECK1-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 1524 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 2 1525 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 1526 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 3 1527 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 1528 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE1_clEv"(%class.anon.2* nonnull dereferenceable(32) [[REF_TMP]]) 1529 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 1530 // CHECK1: omp.body.continue: 1531 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1532 // CHECK1: omp.inner.for.inc: 1533 // CHECK1-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1534 // CHECK1-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 1535 // CHECK1-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 1536 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1537 // CHECK1: omp.inner.for.end: 1538 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1539 // CHECK1: omp.loop.exit: 1540 // CHECK1-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1541 // CHECK1-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 1542 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 1543 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1544 // CHECK1: omp.precond.end: 1545 // CHECK1-NEXT: ret void 1546 // 1547 // 1548 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l235 1549 // CHECK1-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 1550 // CHECK1-NEXT: entry: 1551 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 1552 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 1553 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 1554 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 1555 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 1556 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 1557 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 1558 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 1559 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 1560 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 1561 // CHECK1-NEXT: ret void 1562 // 1563 // 1564 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..10 1565 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1566 // CHECK1-NEXT: entry: 1567 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1568 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1569 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1570 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1571 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1572 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1573 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1574 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1575 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1576 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1577 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1578 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 1579 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 1580 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1581 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1582 // CHECK1-NEXT: [[I3:%.*]] = alloca i32, align 4 1583 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1584 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1585 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1586 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1587 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1588 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1589 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1590 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1591 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1592 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1593 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1594 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 1595 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1596 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1597 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1598 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1599 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1600 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1601 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1602 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1603 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1604 // CHECK1: omp.precond.then: 1605 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 1606 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1607 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 1608 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1609 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1610 // CHECK1-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1611 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 1612 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1613 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1614 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1615 // CHECK1-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 1616 // CHECK1-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1617 // CHECK1: cond.true: 1618 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1619 // CHECK1-NEXT: br label [[COND_END:%.*]] 1620 // CHECK1: cond.false: 1621 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1622 // CHECK1-NEXT: br label [[COND_END]] 1623 // CHECK1: cond.end: 1624 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 1625 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 1626 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1627 // CHECK1-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 1628 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1629 // CHECK1: omp.inner.for.cond: 1630 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1631 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1632 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 1633 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1634 // CHECK1: omp.inner.for.body: 1635 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1636 // CHECK1-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 1637 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1638 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 1639 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 1640 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1641 // CHECK1: omp.inner.for.inc: 1642 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1643 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1644 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 1645 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 1646 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1647 // CHECK1: omp.inner.for.end: 1648 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1649 // CHECK1: omp.loop.exit: 1650 // CHECK1-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1651 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 1652 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 1653 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1654 // CHECK1: omp.precond.end: 1655 // CHECK1-NEXT: ret void 1656 // 1657 // 1658 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..11 1659 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1660 // CHECK1-NEXT: entry: 1661 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1662 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1663 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 1664 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 1665 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1666 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1667 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1668 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1669 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1670 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1671 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1672 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1673 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1674 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 1675 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 1676 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1677 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1678 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 1679 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_3:%.*]], align 8 1680 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1681 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1682 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1683 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1684 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1685 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1686 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1687 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1688 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1689 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1690 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1691 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1692 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1693 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 1694 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1695 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1696 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1697 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 1698 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1699 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1700 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1701 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1702 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1703 // CHECK1: omp.precond.then: 1704 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 1705 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1706 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 1707 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1708 // CHECK1-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 1709 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1710 // CHECK1-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 1711 // CHECK1-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 1712 // CHECK1-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 1713 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1714 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1715 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1716 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 1717 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1718 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1719 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1720 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 1721 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1722 // CHECK1: cond.true: 1723 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1724 // CHECK1-NEXT: br label [[COND_END:%.*]] 1725 // CHECK1: cond.false: 1726 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1727 // CHECK1-NEXT: br label [[COND_END]] 1728 // CHECK1: cond.end: 1729 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 1730 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 1731 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 1732 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 1733 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1734 // CHECK1: omp.inner.for.cond: 1735 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1736 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1737 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 1738 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1739 // CHECK1: omp.inner.for.body: 1740 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1741 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 1742 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 1743 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 1744 // CHECK1-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 1745 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 1746 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 1747 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 1748 // CHECK1-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 1749 // CHECK1-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 1750 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 1751 // CHECK1-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 1752 // CHECK1-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 1753 // CHECK1-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 1754 // CHECK1-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 1755 // CHECK1-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 1756 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 1757 // CHECK1-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 1758 // CHECK1-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 1759 // CHECK1-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 1760 // CHECK1-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 0 1761 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 1762 // CHECK1-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 1 1763 // CHECK1-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 1764 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 2 1765 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 1766 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 3 1767 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 1768 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE2_clEv"(%class.anon.3* nonnull dereferenceable(32) [[REF_TMP]]) 1769 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 1770 // CHECK1: omp.body.continue: 1771 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1772 // CHECK1: omp.inner.for.inc: 1773 // CHECK1-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1774 // CHECK1-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 1775 // CHECK1-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 1776 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1777 // CHECK1: omp.inner.for.end: 1778 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1779 // CHECK1: omp.loop.exit: 1780 // CHECK1-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1781 // CHECK1-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 1782 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 1783 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1784 // CHECK1: omp.precond.end: 1785 // CHECK1-NEXT: ret void 1786 // 1787 // 1788 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l267 1789 // CHECK1-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 1790 // CHECK1-NEXT: entry: 1791 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 1792 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 1793 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 1794 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 1795 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 1796 // CHECK1-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 1797 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 1798 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 1799 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 1800 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 1801 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 1802 // CHECK1-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 1803 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 1804 // CHECK1-NEXT: ret void 1805 // 1806 // 1807 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..14 1808 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 1809 // CHECK1-NEXT: entry: 1810 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1811 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1812 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 1813 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1814 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1815 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1816 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1817 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 1818 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1819 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1820 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1821 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 1822 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1823 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 1824 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 1825 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1826 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1827 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 1828 // CHECK1-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 1829 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1830 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1831 // CHECK1-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 1832 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1833 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1834 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1835 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1836 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 1837 // CHECK1-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1838 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 1839 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 1840 // CHECK1-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 1841 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 1842 // CHECK1-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 1843 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 1844 // CHECK1-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1845 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1846 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 1847 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1848 // CHECK1-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 1849 // CHECK1-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 1850 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1851 // CHECK1-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1852 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 1853 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1854 // CHECK1: omp.precond.then: 1855 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 1856 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 1857 // CHECK1-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 1858 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1859 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1860 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1861 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 1862 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 1863 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1864 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 1865 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 1866 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1867 // CHECK1: cond.true: 1868 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 1869 // CHECK1-NEXT: br label [[COND_END:%.*]] 1870 // CHECK1: cond.false: 1871 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1872 // CHECK1-NEXT: br label [[COND_END]] 1873 // CHECK1: cond.end: 1874 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 1875 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 1876 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1877 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 1878 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 1879 // CHECK1: omp.inner.for.cond: 1880 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1881 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1882 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 1883 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 1884 // CHECK1: omp.inner.for.body: 1885 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 1886 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 1887 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 1888 // CHECK1-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 1889 // CHECK1-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 1890 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 1891 // CHECK1-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 1892 // CHECK1-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 1893 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 1894 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 1895 // CHECK1: omp.inner.for.inc: 1896 // CHECK1-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1897 // CHECK1-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 1898 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 1899 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 1900 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 1901 // CHECK1: omp.inner.for.end: 1902 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 1903 // CHECK1: omp.loop.exit: 1904 // CHECK1-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1905 // CHECK1-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 1906 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 1907 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 1908 // CHECK1: omp.precond.end: 1909 // CHECK1-NEXT: ret void 1910 // 1911 // 1912 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..15 1913 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 1914 // CHECK1-NEXT: entry: 1915 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 1916 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 1917 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 1918 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 1919 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 1920 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 1921 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 1922 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 1923 // CHECK1-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 1924 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 1925 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 1926 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 1927 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 1928 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 1929 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 1930 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 1931 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 1932 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 1933 // CHECK1-NEXT: [[I6:%.*]] = alloca i32, align 4 1934 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_4:%.*]], align 8 1935 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 1936 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 1937 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1938 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1939 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 1940 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 1941 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 1942 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 1943 // CHECK1-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 1944 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 1945 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 1946 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 1947 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 1948 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 1949 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 1950 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 1951 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1952 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 1953 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 1954 // CHECK1-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 1955 // CHECK1-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 1956 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 1957 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 1958 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 1959 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 1960 // CHECK1: omp.precond.then: 1961 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 1962 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 1963 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 1964 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 1965 // CHECK1-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 1966 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1967 // CHECK1-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 1968 // CHECK1-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 1969 // CHECK1-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 1970 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 1971 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 1972 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 1973 // CHECK1-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 1974 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 1975 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 1976 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 1977 // CHECK1: omp.dispatch.cond: 1978 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1979 // CHECK1-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 1980 // CHECK1-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1981 // CHECK1-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 1982 // CHECK1-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 1983 // CHECK1: cond.true: 1984 // CHECK1-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 1985 // CHECK1-NEXT: br label [[COND_END:%.*]] 1986 // CHECK1: cond.false: 1987 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1988 // CHECK1-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 1989 // CHECK1-NEXT: br label [[COND_END]] 1990 // CHECK1: cond.end: 1991 // CHECK1-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 1992 // CHECK1-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 1993 // CHECK1-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 1994 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 1995 // CHECK1-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 1996 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 1997 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 1998 // CHECK1-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 1999 // CHECK1-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 2000 // CHECK1: omp.dispatch.body: 2001 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2002 // CHECK1: omp.inner.for.cond: 2003 // CHECK1-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2004 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2005 // CHECK1-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 2006 // CHECK1-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2007 // CHECK1: omp.inner.for.body: 2008 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2009 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 2010 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 2011 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 2012 // CHECK1-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 8 2013 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 2014 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 2015 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM]] 2016 // CHECK1-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 8 2017 // CHECK1-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 8 2018 // CHECK1-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 2019 // CHECK1-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 2020 // CHECK1-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM13]] 2021 // CHECK1-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX14]], align 8 2022 // CHECK1-NEXT: [[ADD15:%.*]] = fadd double [[TMP25]], [[TMP28]] 2023 // CHECK1-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 8 2024 // CHECK1-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 2025 // CHECK1-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 2026 // CHECK1-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds double, double* [[TMP29]], i64 [[IDXPROM16]] 2027 // CHECK1-NEXT: store double [[ADD15]], double* [[ARRAYIDX17]], align 8 2028 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 0 2029 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP31]], align 8 2030 // CHECK1-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 1 2031 // CHECK1-NEXT: store i32* [[I6]], i32** [[TMP32]], align 8 2032 // CHECK1-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 2 2033 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP33]], align 8 2034 // CHECK1-NEXT: [[TMP34:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 3 2035 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP34]], align 8 2036 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE3_clEv"(%class.anon.4* nonnull dereferenceable(32) [[REF_TMP]]) 2037 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 2038 // CHECK1: omp.body.continue: 2039 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2040 // CHECK1: omp.inner.for.inc: 2041 // CHECK1-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2042 // CHECK1-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP35]], 1 2043 // CHECK1-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 2044 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 2045 // CHECK1: omp.inner.for.end: 2046 // CHECK1-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 2047 // CHECK1: omp.dispatch.inc: 2048 // CHECK1-NEXT: [[TMP36:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2049 // CHECK1-NEXT: [[TMP37:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2050 // CHECK1-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP36]], [[TMP37]] 2051 // CHECK1-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 2052 // CHECK1-NEXT: [[TMP38:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2053 // CHECK1-NEXT: [[TMP39:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2054 // CHECK1-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP38]], [[TMP39]] 2055 // CHECK1-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 2056 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND]] 2057 // CHECK1: omp.dispatch.end: 2058 // CHECK1-NEXT: [[TMP40:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2059 // CHECK1-NEXT: [[TMP41:%.*]] = load i32, i32* [[TMP40]], align 4 2060 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP41]]) 2061 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 2062 // CHECK1: omp.precond.end: 2063 // CHECK1-NEXT: ret void 2064 // 2065 // 2066 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l300 2067 // CHECK1-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 2068 // CHECK1-NEXT: entry: 2069 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 2070 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 2071 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 2072 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 2073 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 2074 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 2075 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 2076 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 2077 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 2078 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 2079 // CHECK1-NEXT: ret void 2080 // 2081 // 2082 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..18 2083 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2084 // CHECK1-NEXT: entry: 2085 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2086 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2087 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2088 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2089 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2090 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2091 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2092 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 2093 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2094 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2095 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 2096 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 2097 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 2098 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2099 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2100 // CHECK1-NEXT: [[I3:%.*]] = alloca i32, align 4 2101 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2102 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2103 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2104 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2105 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2106 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2107 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2108 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2109 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2110 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2111 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2112 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2113 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2114 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2115 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2116 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2117 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2118 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 2119 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2120 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2121 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2122 // CHECK1: omp.precond.then: 2123 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 2124 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2125 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 2126 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2127 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2128 // CHECK1-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2129 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 2130 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 2131 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2132 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2133 // CHECK1-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 2134 // CHECK1-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 2135 // CHECK1: cond.true: 2136 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2137 // CHECK1-NEXT: br label [[COND_END:%.*]] 2138 // CHECK1: cond.false: 2139 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2140 // CHECK1-NEXT: br label [[COND_END]] 2141 // CHECK1: cond.end: 2142 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 2143 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 2144 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2145 // CHECK1-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 2146 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2147 // CHECK1: omp.inner.for.cond: 2148 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2149 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2150 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 2151 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2152 // CHECK1: omp.inner.for.body: 2153 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2154 // CHECK1-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 2155 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2156 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 2157 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 2158 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2159 // CHECK1: omp.inner.for.inc: 2160 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2161 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2162 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 2163 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 2164 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 2165 // CHECK1: omp.inner.for.end: 2166 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 2167 // CHECK1: omp.loop.exit: 2168 // CHECK1-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2169 // CHECK1-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 2170 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 2171 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 2172 // CHECK1: omp.precond.end: 2173 // CHECK1-NEXT: ret void 2174 // 2175 // 2176 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..19 2177 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2178 // CHECK1-NEXT: entry: 2179 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2180 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2181 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 2182 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 2183 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2184 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2185 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2186 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2187 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2188 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 2189 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2190 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2191 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 2192 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 2193 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 2194 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2195 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2196 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 2197 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_5:%.*]], align 8 2198 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2199 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2200 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2201 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2202 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2203 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2204 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2205 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2206 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2207 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2208 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2209 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2210 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2211 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2212 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2213 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2214 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2215 // CHECK1-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2216 // CHECK1-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2217 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 2218 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2219 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2220 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2221 // CHECK1: omp.precond.then: 2222 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 2223 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2224 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 2225 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2226 // CHECK1-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 2227 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2228 // CHECK1-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 2229 // CHECK1-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 2230 // CHECK1-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 2231 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2232 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2233 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2234 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2235 // CHECK1-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2236 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 2237 // CHECK1-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 2238 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 2239 // CHECK1: omp.dispatch.cond: 2240 // CHECK1-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2241 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 2242 // CHECK1-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 2243 // CHECK1-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 2244 // CHECK1-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 2245 // CHECK1: omp.dispatch.body: 2246 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2247 // CHECK1-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 2248 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2249 // CHECK1: omp.inner.for.cond: 2250 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 2251 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !11 2252 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 2253 // CHECK1-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2254 // CHECK1: omp.inner.for.body: 2255 // CHECK1-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 2256 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 2257 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 2258 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !11 2259 // CHECK1-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !11 2260 // CHECK1-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 2261 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 2262 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i64 [[IDXPROM]] 2263 // CHECK1-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !11 2264 // CHECK1-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !11 2265 // CHECK1-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 2266 // CHECK1-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 2267 // CHECK1-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM6]] 2268 // CHECK1-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX7]], align 8, !llvm.access.group !11 2269 // CHECK1-NEXT: [[ADD8:%.*]] = fadd double [[TMP23]], [[TMP26]] 2270 // CHECK1-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !11 2271 // CHECK1-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 2272 // CHECK1-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 2273 // CHECK1-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM9]] 2274 // CHECK1-NEXT: store double [[ADD8]], double* [[ARRAYIDX10]], align 8, !llvm.access.group !11 2275 // CHECK1-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 0 2276 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP29]], align 8, !llvm.access.group !11 2277 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 1 2278 // CHECK1-NEXT: store i32* [[I4]], i32** [[TMP30]], align 8, !llvm.access.group !11 2279 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 2 2280 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP31]], align 8, !llvm.access.group !11 2281 // CHECK1-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 3 2282 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP32]], align 8, !llvm.access.group !11 2283 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE4_clEv"(%class.anon.5* nonnull dereferenceable(32) [[REF_TMP]]), !llvm.access.group !11 2284 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 2285 // CHECK1: omp.body.continue: 2286 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2287 // CHECK1: omp.inner.for.inc: 2288 // CHECK1-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 2289 // CHECK1-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP33]], 1 2290 // CHECK1-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 2291 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP12:![0-9]+]] 2292 // CHECK1: omp.inner.for.end: 2293 // CHECK1-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 2294 // CHECK1: omp.dispatch.inc: 2295 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND]] 2296 // CHECK1: omp.dispatch.end: 2297 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 2298 // CHECK1: omp.precond.end: 2299 // CHECK1-NEXT: ret void 2300 // 2301 // 2302 // CHECK1-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l329 2303 // CHECK1-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 2304 // CHECK1-NEXT: entry: 2305 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 2306 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 2307 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 2308 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 2309 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 2310 // CHECK1-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 2311 // CHECK1-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 2312 // CHECK1-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 2313 // CHECK1-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 2314 // CHECK1-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 2315 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 2316 // CHECK1-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 2317 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 2318 // CHECK1-NEXT: ret void 2319 // 2320 // 2321 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..22 2322 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2323 // CHECK1-NEXT: entry: 2324 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2325 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2326 // CHECK1-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 2327 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2328 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2329 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2330 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2331 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2332 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2333 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 2334 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2335 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 2336 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 2337 // CHECK1-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 2338 // CHECK1-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 2339 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2340 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2341 // CHECK1-NEXT: [[I4:%.*]] = alloca i32, align 4 2342 // CHECK1-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 2343 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2344 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2345 // CHECK1-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 2346 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2347 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2348 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2349 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2350 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 2351 // CHECK1-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2352 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 2353 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 2354 // CHECK1-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 2355 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 2356 // CHECK1-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 2357 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 2358 // CHECK1-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2359 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2360 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 2361 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2362 // CHECK1-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 2363 // CHECK1-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 2364 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 2365 // CHECK1-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2366 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 2367 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2368 // CHECK1: omp.precond.then: 2369 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 2370 // CHECK1-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 2371 // CHECK1-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 2372 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2373 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2374 // CHECK1-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2375 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 2376 // CHECK1-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 2377 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2378 // CHECK1-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 2379 // CHECK1-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 2380 // CHECK1-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 2381 // CHECK1: cond.true: 2382 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 2383 // CHECK1-NEXT: br label [[COND_END:%.*]] 2384 // CHECK1: cond.false: 2385 // CHECK1-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2386 // CHECK1-NEXT: br label [[COND_END]] 2387 // CHECK1: cond.end: 2388 // CHECK1-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 2389 // CHECK1-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 2390 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2391 // CHECK1-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 2392 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2393 // CHECK1: omp.inner.for.cond: 2394 // CHECK1-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2395 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2396 // CHECK1-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 2397 // CHECK1-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2398 // CHECK1: omp.inner.for.body: 2399 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2400 // CHECK1-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 2401 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2402 // CHECK1-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 2403 // CHECK1-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2404 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 2405 // CHECK1-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 2406 // CHECK1-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 2407 // CHECK1-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 2408 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2409 // CHECK1: omp.inner.for.inc: 2410 // CHECK1-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2411 // CHECK1-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2412 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 2413 // CHECK1-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 2414 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]] 2415 // CHECK1: omp.inner.for.end: 2416 // CHECK1-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 2417 // CHECK1: omp.loop.exit: 2418 // CHECK1-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2419 // CHECK1-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 2420 // CHECK1-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 2421 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 2422 // CHECK1: omp.precond.end: 2423 // CHECK1-NEXT: ret void 2424 // 2425 // 2426 // CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..23 2427 // CHECK1-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 2428 // CHECK1-NEXT: entry: 2429 // CHECK1-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2430 // CHECK1-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2431 // CHECK1-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 2432 // CHECK1-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 2433 // CHECK1-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2434 // CHECK1-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2435 // CHECK1-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2436 // CHECK1-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2437 // CHECK1-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 2438 // CHECK1-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2439 // CHECK1-NEXT: [[TMP:%.*]] = alloca i32, align 4 2440 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2441 // CHECK1-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 2442 // CHECK1-NEXT: [[I:%.*]] = alloca i32, align 4 2443 // CHECK1-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 2444 // CHECK1-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 2445 // CHECK1-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2446 // CHECK1-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2447 // CHECK1-NEXT: [[I6:%.*]] = alloca i32, align 4 2448 // CHECK1-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_6:%.*]], align 8 2449 // CHECK1-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2450 // CHECK1-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2451 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2452 // CHECK1-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2453 // CHECK1-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2454 // CHECK1-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2455 // CHECK1-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2456 // CHECK1-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2457 // CHECK1-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 2458 // CHECK1-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2459 // CHECK1-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2460 // CHECK1-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2461 // CHECK1-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2462 // CHECK1-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 2463 // CHECK1-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2464 // CHECK1-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2465 // CHECK1-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2466 // CHECK1-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2467 // CHECK1-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2468 // CHECK1-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 2469 // CHECK1-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 2470 // CHECK1-NEXT: store i32 0, i32* [[I]], align 4 2471 // CHECK1-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2472 // CHECK1-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2473 // CHECK1-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2474 // CHECK1: omp.precond.then: 2475 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 2476 // CHECK1-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 2477 // CHECK1-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 2478 // CHECK1-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2479 // CHECK1-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 2480 // CHECK1-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2481 // CHECK1-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 2482 // CHECK1-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 2483 // CHECK1-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 2484 // CHECK1-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2485 // CHECK1-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2486 // CHECK1-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 2487 // CHECK1-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2488 // CHECK1-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2489 // CHECK1-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2490 // CHECK1-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 2491 // CHECK1-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 2492 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 2493 // CHECK1: omp.dispatch.cond: 2494 // CHECK1-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2495 // CHECK1-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 2496 // CHECK1-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 2497 // CHECK1-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 2498 // CHECK1-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 2499 // CHECK1: omp.dispatch.body: 2500 // CHECK1-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2501 // CHECK1-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 2502 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2503 // CHECK1: omp.inner.for.cond: 2504 // CHECK1-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 2505 // CHECK1-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !14 2506 // CHECK1-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 2507 // CHECK1-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2508 // CHECK1: omp.inner.for.body: 2509 // CHECK1-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 2510 // CHECK1-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 2511 // CHECK1-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 2512 // CHECK1-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !14 2513 // CHECK1-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !14 2514 // CHECK1-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 2515 // CHECK1-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 2516 // CHECK1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i64 [[IDXPROM]] 2517 // CHECK1-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !14 2518 // CHECK1-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !14 2519 // CHECK1-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 2520 // CHECK1-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 2521 // CHECK1-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds double, double* [[TMP25]], i64 [[IDXPROM8]] 2522 // CHECK1-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX9]], align 8, !llvm.access.group !14 2523 // CHECK1-NEXT: [[ADD10:%.*]] = fadd double [[TMP24]], [[TMP27]] 2524 // CHECK1-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !14 2525 // CHECK1-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 2526 // CHECK1-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 2527 // CHECK1-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP28]], i64 [[IDXPROM11]] 2528 // CHECK1-NEXT: store double [[ADD10]], double* [[ARRAYIDX12]], align 8, !llvm.access.group !14 2529 // CHECK1-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 0 2530 // CHECK1-NEXT: store double** [[TMP1]], double*** [[TMP30]], align 8, !llvm.access.group !14 2531 // CHECK1-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 1 2532 // CHECK1-NEXT: store i32* [[I6]], i32** [[TMP31]], align 8, !llvm.access.group !14 2533 // CHECK1-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 2 2534 // CHECK1-NEXT: store double** [[TMP2]], double*** [[TMP32]], align 8, !llvm.access.group !14 2535 // CHECK1-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 3 2536 // CHECK1-NEXT: store double** [[TMP3]], double*** [[TMP33]], align 8, !llvm.access.group !14 2537 // CHECK1-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE5_clEv"(%class.anon.6* nonnull dereferenceable(32) [[REF_TMP]]), !llvm.access.group !14 2538 // CHECK1-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 2539 // CHECK1: omp.body.continue: 2540 // CHECK1-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2541 // CHECK1: omp.inner.for.inc: 2542 // CHECK1-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 2543 // CHECK1-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], 1 2544 // CHECK1-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 2545 // CHECK1-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP15:![0-9]+]] 2546 // CHECK1: omp.inner.for.end: 2547 // CHECK1-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 2548 // CHECK1: omp.dispatch.inc: 2549 // CHECK1-NEXT: br label [[OMP_DISPATCH_COND]] 2550 // CHECK1: omp.dispatch.end: 2551 // CHECK1-NEXT: br label [[OMP_PRECOND_END]] 2552 // CHECK1: omp.precond.end: 2553 // CHECK1-NEXT: ret void 2554 // 2555 // 2556 // CHECK1-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 2557 // CHECK1-SAME: () #[[ATTR4:[0-9]+]] { 2558 // CHECK1-NEXT: entry: 2559 // CHECK1-NEXT: call void @__tgt_register_requires(i64 1) 2560 // CHECK1-NEXT: ret void 2561 // 2562 // 2563 // CHECK2-LABEL: define {{[^@]+}}@main 2564 // CHECK2-SAME: () #[[ATTR0:[0-9]+]] { 2565 // CHECK2-NEXT: entry: 2566 // CHECK2-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 2567 // CHECK2-NEXT: [[A:%.*]] = alloca double*, align 8 2568 // CHECK2-NEXT: [[B:%.*]] = alloca double*, align 8 2569 // CHECK2-NEXT: [[C:%.*]] = alloca double*, align 8 2570 // CHECK2-NEXT: [[N:%.*]] = alloca i32, align 4 2571 // CHECK2-NEXT: [[CH:%.*]] = alloca i32, align 4 2572 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 8 2573 // CHECK2-NEXT: store i32 0, i32* [[RETVAL]], align 4 2574 // CHECK2-NEXT: store i32 10000, i32* [[N]], align 4 2575 // CHECK2-NEXT: store i32 100, i32* [[CH]], align 4 2576 // CHECK2-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 2577 // CHECK2-NEXT: store i32* [[N]], i32** [[TMP0]], align 8 2578 // CHECK2-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 2579 // CHECK2-NEXT: store double** [[A]], double*** [[TMP1]], align 8 2580 // CHECK2-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 2581 // CHECK2-NEXT: store double** [[B]], double*** [[TMP2]], align 8 2582 // CHECK2-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 2583 // CHECK2-NEXT: store double** [[C]], double*** [[TMP3]], align 8 2584 // CHECK2-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 2585 // CHECK2-NEXT: store i32* [[CH]], i32** [[TMP4]], align 8 2586 // CHECK2-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(40) [[REF_TMP]]) 2587 // CHECK2-NEXT: ret i32 0 2588 // 2589 // 2590 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l117 2591 // CHECK2-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2:[0-9]+]] { 2592 // CHECK2-NEXT: entry: 2593 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 2594 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 2595 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 2596 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 2597 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 2598 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 2599 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 2600 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 2601 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 2602 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 2603 // CHECK2-NEXT: ret void 2604 // 2605 // 2606 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined. 2607 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2608 // CHECK2-NEXT: entry: 2609 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2610 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2611 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2612 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2613 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2614 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2615 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2616 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 2617 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2618 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2619 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 2620 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 2621 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 2622 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2623 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2624 // CHECK2-NEXT: [[I3:%.*]] = alloca i32, align 4 2625 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2626 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2627 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2628 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2629 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2630 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2631 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2632 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2633 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2634 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2635 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2636 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2637 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2638 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2639 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2640 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2641 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2642 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 2643 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2644 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2645 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2646 // CHECK2: omp.precond.then: 2647 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 2648 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2649 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 2650 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2651 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2652 // CHECK2-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2653 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 2654 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 2655 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2656 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2657 // CHECK2-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 2658 // CHECK2-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 2659 // CHECK2: cond.true: 2660 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2661 // CHECK2-NEXT: br label [[COND_END:%.*]] 2662 // CHECK2: cond.false: 2663 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2664 // CHECK2-NEXT: br label [[COND_END]] 2665 // CHECK2: cond.end: 2666 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 2667 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 2668 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2669 // CHECK2-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 2670 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2671 // CHECK2: omp.inner.for.cond: 2672 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2673 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2674 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 2675 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2676 // CHECK2: omp.inner.for.body: 2677 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2678 // CHECK2-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 2679 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2680 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 2681 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 2682 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2683 // CHECK2: omp.inner.for.inc: 2684 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2685 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2686 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 2687 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 2688 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 2689 // CHECK2: omp.inner.for.end: 2690 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 2691 // CHECK2: omp.loop.exit: 2692 // CHECK2-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2693 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 2694 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 2695 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 2696 // CHECK2: omp.precond.end: 2697 // CHECK2-NEXT: ret void 2698 // 2699 // 2700 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..1 2701 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2702 // CHECK2-NEXT: entry: 2703 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2704 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2705 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 2706 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 2707 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2708 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2709 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2710 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2711 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2712 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 2713 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2714 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2715 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 2716 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 2717 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 2718 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2719 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2720 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 2721 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_0:%.*]], align 8 2722 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2723 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2724 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2725 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2726 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2727 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2728 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2729 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2730 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2731 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2732 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2733 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2734 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2735 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2736 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2737 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2738 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2739 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2740 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2741 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 2742 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2743 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2744 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2745 // CHECK2: omp.precond.then: 2746 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 2747 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2748 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 2749 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2750 // CHECK2-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 2751 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2752 // CHECK2-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 2753 // CHECK2-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 2754 // CHECK2-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 2755 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2756 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2757 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2758 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 2759 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 2760 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2761 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2762 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 2763 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 2764 // CHECK2: cond.true: 2765 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2766 // CHECK2-NEXT: br label [[COND_END:%.*]] 2767 // CHECK2: cond.false: 2768 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2769 // CHECK2-NEXT: br label [[COND_END]] 2770 // CHECK2: cond.end: 2771 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 2772 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 2773 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 2774 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 2775 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2776 // CHECK2: omp.inner.for.cond: 2777 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2778 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 2779 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 2780 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2781 // CHECK2: omp.inner.for.body: 2782 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2783 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 2784 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 2785 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 2786 // CHECK2-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 2787 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 2788 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 2789 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 2790 // CHECK2-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 2791 // CHECK2-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 2792 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 2793 // CHECK2-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 2794 // CHECK2-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 2795 // CHECK2-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 2796 // CHECK2-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 2797 // CHECK2-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 2798 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 2799 // CHECK2-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 2800 // CHECK2-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 2801 // CHECK2-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 2802 // CHECK2-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 0 2803 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 2804 // CHECK2-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 1 2805 // CHECK2-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 2806 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 2 2807 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 2808 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 3 2809 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 2810 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE_clEv"(%class.anon.0* nonnull dereferenceable(32) [[REF_TMP]]) 2811 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 2812 // CHECK2: omp.body.continue: 2813 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2814 // CHECK2: omp.inner.for.inc: 2815 // CHECK2-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2816 // CHECK2-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 2817 // CHECK2-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 2818 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 2819 // CHECK2: omp.inner.for.end: 2820 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 2821 // CHECK2: omp.loop.exit: 2822 // CHECK2-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2823 // CHECK2-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 2824 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 2825 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 2826 // CHECK2: omp.precond.end: 2827 // CHECK2-NEXT: ret void 2828 // 2829 // 2830 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l160 2831 // CHECK2-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 2832 // CHECK2-NEXT: entry: 2833 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 2834 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 2835 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 2836 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 2837 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 2838 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 2839 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 2840 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 2841 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 2842 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 2843 // CHECK2-NEXT: ret void 2844 // 2845 // 2846 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..2 2847 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2848 // CHECK2-NEXT: entry: 2849 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2850 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2851 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2852 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2853 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2854 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2855 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2856 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 2857 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2858 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2859 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 2860 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 2861 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 2862 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2863 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2864 // CHECK2-NEXT: [[I3:%.*]] = alloca i32, align 4 2865 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2866 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2867 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2868 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2869 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2870 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2871 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2872 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2873 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2874 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2875 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2876 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2877 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2878 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2879 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2880 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2881 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2882 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 2883 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2884 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2885 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2886 // CHECK2: omp.precond.then: 2887 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 2888 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2889 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 2890 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2891 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2892 // CHECK2-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2893 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 2894 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 2895 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2896 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2897 // CHECK2-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 2898 // CHECK2-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 2899 // CHECK2: cond.true: 2900 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2901 // CHECK2-NEXT: br label [[COND_END:%.*]] 2902 // CHECK2: cond.false: 2903 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2904 // CHECK2-NEXT: br label [[COND_END]] 2905 // CHECK2: cond.end: 2906 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 2907 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 2908 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2909 // CHECK2-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 2910 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 2911 // CHECK2: omp.inner.for.cond: 2912 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2913 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2914 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 2915 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 2916 // CHECK2: omp.inner.for.body: 2917 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 2918 // CHECK2-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 2919 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 2920 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 2921 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 2922 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 2923 // CHECK2: omp.inner.for.inc: 2924 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 2925 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 2926 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 2927 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 2928 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 2929 // CHECK2: omp.inner.for.end: 2930 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 2931 // CHECK2: omp.loop.exit: 2932 // CHECK2-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2933 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 2934 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 2935 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 2936 // CHECK2: omp.precond.end: 2937 // CHECK2-NEXT: ret void 2938 // 2939 // 2940 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..3 2941 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 2942 // CHECK2-NEXT: entry: 2943 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 2944 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 2945 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 2946 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 2947 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 2948 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 2949 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 2950 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 2951 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 2952 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 2953 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 2954 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 2955 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 2956 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 2957 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 2958 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 2959 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 2960 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 2961 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_1:%.*]], align 8 2962 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 2963 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 2964 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2965 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2966 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 2967 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 2968 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 2969 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 2970 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 2971 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 2972 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 2973 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 2974 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 2975 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 2976 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2977 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 2978 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 2979 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 2980 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 2981 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 2982 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 2983 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 2984 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 2985 // CHECK2: omp.precond.then: 2986 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 2987 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 2988 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 2989 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 2990 // CHECK2-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 2991 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 2992 // CHECK2-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 2993 // CHECK2-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 2994 // CHECK2-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 2995 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 2996 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 2997 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 2998 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 2999 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3000 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3001 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3002 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 3003 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3004 // CHECK2: cond.true: 3005 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3006 // CHECK2-NEXT: br label [[COND_END:%.*]] 3007 // CHECK2: cond.false: 3008 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3009 // CHECK2-NEXT: br label [[COND_END]] 3010 // CHECK2: cond.end: 3011 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 3012 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 3013 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 3014 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 3015 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3016 // CHECK2: omp.inner.for.cond: 3017 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3018 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3019 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 3020 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3021 // CHECK2: omp.inner.for.body: 3022 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3023 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 3024 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 3025 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 3026 // CHECK2-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 3027 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 3028 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 3029 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 3030 // CHECK2-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 3031 // CHECK2-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 3032 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 3033 // CHECK2-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 3034 // CHECK2-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 3035 // CHECK2-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 3036 // CHECK2-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 3037 // CHECK2-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 3038 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 3039 // CHECK2-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 3040 // CHECK2-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 3041 // CHECK2-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 3042 // CHECK2-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 0 3043 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 3044 // CHECK2-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 1 3045 // CHECK2-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 3046 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 2 3047 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 3048 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 3 3049 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 3050 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE0_clEv"(%class.anon.1* nonnull dereferenceable(32) [[REF_TMP]]) 3051 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 3052 // CHECK2: omp.body.continue: 3053 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3054 // CHECK2: omp.inner.for.inc: 3055 // CHECK2-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3056 // CHECK2-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 3057 // CHECK2-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 3058 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3059 // CHECK2: omp.inner.for.end: 3060 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3061 // CHECK2: omp.loop.exit: 3062 // CHECK2-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3063 // CHECK2-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 3064 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 3065 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3066 // CHECK2: omp.precond.end: 3067 // CHECK2-NEXT: ret void 3068 // 3069 // 3070 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l202 3071 // CHECK2-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 3072 // CHECK2-NEXT: entry: 3073 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 3074 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 3075 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 3076 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 3077 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 3078 // CHECK2-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 3079 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 3080 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 3081 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 3082 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 3083 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 3084 // CHECK2-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 3085 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 3086 // CHECK2-NEXT: ret void 3087 // 3088 // 3089 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..6 3090 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3091 // CHECK2-NEXT: entry: 3092 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3093 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3094 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 3095 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3096 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3097 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3098 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3099 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3100 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3101 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3102 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3103 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3104 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 3105 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 3106 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3107 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3108 // CHECK2-NEXT: [[I3:%.*]] = alloca i32, align 4 3109 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3110 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3111 // CHECK2-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 3112 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3113 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3114 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3115 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3116 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 3117 // CHECK2-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3118 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 3119 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 3120 // CHECK2-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 3121 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 3122 // CHECK2-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 3123 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3124 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 3125 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3126 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 3127 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3128 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3129 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3130 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 3131 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3132 // CHECK2: omp.precond.then: 3133 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 3134 // CHECK2-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3135 // CHECK2-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 3136 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3137 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3138 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 3139 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3140 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 3141 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 3142 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3143 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3144 // CHECK2-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 3145 // CHECK2-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3146 // CHECK2: cond.true: 3147 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3148 // CHECK2-NEXT: br label [[COND_END:%.*]] 3149 // CHECK2: cond.false: 3150 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3151 // CHECK2-NEXT: br label [[COND_END]] 3152 // CHECK2: cond.end: 3153 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 3154 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 3155 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3156 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 3157 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3158 // CHECK2: omp.inner.for.cond: 3159 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3160 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3161 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 3162 // CHECK2-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 3163 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3164 // CHECK2: omp.inner.for.body: 3165 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3166 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 3167 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3168 // CHECK2-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 3169 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 3170 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3171 // CHECK2: omp.inner.for.inc: 3172 // CHECK2-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3173 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3174 // CHECK2-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 3175 // CHECK2-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 3176 // CHECK2-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3177 // CHECK2-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3178 // CHECK2-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 3179 // CHECK2-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 3180 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3181 // CHECK2-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3182 // CHECK2-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 3183 // CHECK2-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 3184 // CHECK2-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3185 // CHECK2-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3186 // CHECK2-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 3187 // CHECK2-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 3188 // CHECK2: cond.true10: 3189 // CHECK2-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3190 // CHECK2-NEXT: br label [[COND_END12:%.*]] 3191 // CHECK2: cond.false11: 3192 // CHECK2-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3193 // CHECK2-NEXT: br label [[COND_END12]] 3194 // CHECK2: cond.end12: 3195 // CHECK2-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 3196 // CHECK2-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 3197 // CHECK2-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3198 // CHECK2-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 3199 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3200 // CHECK2: omp.inner.for.end: 3201 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3202 // CHECK2: omp.loop.exit: 3203 // CHECK2-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3204 // CHECK2-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 3205 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 3206 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3207 // CHECK2: omp.precond.end: 3208 // CHECK2-NEXT: ret void 3209 // 3210 // 3211 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..7 3212 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3213 // CHECK2-NEXT: entry: 3214 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3215 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3216 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 3217 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 3218 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3219 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3220 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3221 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3222 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3223 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3224 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3225 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3226 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3227 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 3228 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 3229 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3230 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3231 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 3232 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_2:%.*]], align 8 3233 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3234 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3235 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3236 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3237 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3238 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3239 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3240 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3241 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3242 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 3243 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 3244 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 3245 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 3246 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 3247 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3248 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 3249 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3250 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 3251 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3252 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3253 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3254 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 3255 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3256 // CHECK2: omp.precond.then: 3257 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 3258 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3259 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 3260 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3261 // CHECK2-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 3262 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3263 // CHECK2-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 3264 // CHECK2-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 3265 // CHECK2-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 3266 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3267 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3268 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3269 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 3270 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3271 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3272 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3273 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 3274 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3275 // CHECK2: cond.true: 3276 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3277 // CHECK2-NEXT: br label [[COND_END:%.*]] 3278 // CHECK2: cond.false: 3279 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3280 // CHECK2-NEXT: br label [[COND_END]] 3281 // CHECK2: cond.end: 3282 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 3283 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 3284 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 3285 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 3286 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3287 // CHECK2: omp.inner.for.cond: 3288 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3289 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3290 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 3291 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3292 // CHECK2: omp.inner.for.body: 3293 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3294 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 3295 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 3296 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 3297 // CHECK2-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 3298 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 3299 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 3300 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 3301 // CHECK2-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 3302 // CHECK2-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 3303 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 3304 // CHECK2-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 3305 // CHECK2-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 3306 // CHECK2-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 3307 // CHECK2-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 3308 // CHECK2-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 3309 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 3310 // CHECK2-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 3311 // CHECK2-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 3312 // CHECK2-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 3313 // CHECK2-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 0 3314 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 3315 // CHECK2-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 1 3316 // CHECK2-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 3317 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 2 3318 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 3319 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 3 3320 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 3321 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE1_clEv"(%class.anon.2* nonnull dereferenceable(32) [[REF_TMP]]) 3322 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 3323 // CHECK2: omp.body.continue: 3324 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3325 // CHECK2: omp.inner.for.inc: 3326 // CHECK2-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3327 // CHECK2-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 3328 // CHECK2-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 3329 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3330 // CHECK2: omp.inner.for.end: 3331 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3332 // CHECK2: omp.loop.exit: 3333 // CHECK2-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3334 // CHECK2-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 3335 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 3336 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3337 // CHECK2: omp.precond.end: 3338 // CHECK2-NEXT: ret void 3339 // 3340 // 3341 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l235 3342 // CHECK2-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 3343 // CHECK2-NEXT: entry: 3344 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 3345 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 3346 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 3347 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 3348 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 3349 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 3350 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 3351 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 3352 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 3353 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 3354 // CHECK2-NEXT: ret void 3355 // 3356 // 3357 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..10 3358 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3359 // CHECK2-NEXT: entry: 3360 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3361 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3362 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3363 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3364 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3365 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3366 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3367 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3368 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3369 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3370 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3371 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 3372 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 3373 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3374 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3375 // CHECK2-NEXT: [[I3:%.*]] = alloca i32, align 4 3376 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3377 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3378 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3379 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3380 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3381 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3382 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3383 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 3384 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 3385 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 3386 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 3387 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 3388 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3389 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 3390 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3391 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 3392 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3393 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3394 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3395 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 3396 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3397 // CHECK2: omp.precond.then: 3398 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 3399 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3400 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 3401 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3402 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3403 // CHECK2-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3404 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 3405 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3406 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3407 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3408 // CHECK2-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 3409 // CHECK2-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3410 // CHECK2: cond.true: 3411 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3412 // CHECK2-NEXT: br label [[COND_END:%.*]] 3413 // CHECK2: cond.false: 3414 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3415 // CHECK2-NEXT: br label [[COND_END]] 3416 // CHECK2: cond.end: 3417 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 3418 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 3419 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3420 // CHECK2-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 3421 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3422 // CHECK2: omp.inner.for.cond: 3423 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3424 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3425 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 3426 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3427 // CHECK2: omp.inner.for.body: 3428 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3429 // CHECK2-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 3430 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3431 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 3432 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 3433 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3434 // CHECK2: omp.inner.for.inc: 3435 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3436 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3437 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 3438 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 3439 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3440 // CHECK2: omp.inner.for.end: 3441 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3442 // CHECK2: omp.loop.exit: 3443 // CHECK2-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3444 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 3445 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 3446 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3447 // CHECK2: omp.precond.end: 3448 // CHECK2-NEXT: ret void 3449 // 3450 // 3451 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..11 3452 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3453 // CHECK2-NEXT: entry: 3454 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3455 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3456 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 3457 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 3458 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3459 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3460 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3461 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3462 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3463 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3464 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3465 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3466 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3467 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 3468 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 3469 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3470 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3471 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 3472 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_3:%.*]], align 8 3473 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3474 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3475 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3476 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3477 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3478 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3479 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3480 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3481 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3482 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 3483 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 3484 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 3485 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 3486 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 3487 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3488 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 3489 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3490 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 3491 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3492 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3493 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3494 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 3495 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3496 // CHECK2: omp.precond.then: 3497 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 3498 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3499 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 3500 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3501 // CHECK2-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 3502 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3503 // CHECK2-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 3504 // CHECK2-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 3505 // CHECK2-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 3506 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3507 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3508 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3509 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 3510 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3511 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3512 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3513 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 3514 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3515 // CHECK2: cond.true: 3516 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3517 // CHECK2-NEXT: br label [[COND_END:%.*]] 3518 // CHECK2: cond.false: 3519 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3520 // CHECK2-NEXT: br label [[COND_END]] 3521 // CHECK2: cond.end: 3522 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 3523 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 3524 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 3525 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 3526 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3527 // CHECK2: omp.inner.for.cond: 3528 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3529 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3530 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 3531 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3532 // CHECK2: omp.inner.for.body: 3533 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3534 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 3535 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 3536 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 3537 // CHECK2-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 3538 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 3539 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 3540 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 3541 // CHECK2-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 3542 // CHECK2-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 3543 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 3544 // CHECK2-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 3545 // CHECK2-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 3546 // CHECK2-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 3547 // CHECK2-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 3548 // CHECK2-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 3549 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 3550 // CHECK2-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 3551 // CHECK2-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 3552 // CHECK2-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 3553 // CHECK2-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 0 3554 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 8 3555 // CHECK2-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 1 3556 // CHECK2-NEXT: store i32* [[I4]], i32** [[TMP29]], align 8 3557 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 2 3558 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 8 3559 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 3 3560 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 8 3561 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE2_clEv"(%class.anon.3* nonnull dereferenceable(32) [[REF_TMP]]) 3562 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 3563 // CHECK2: omp.body.continue: 3564 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3565 // CHECK2: omp.inner.for.inc: 3566 // CHECK2-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3567 // CHECK2-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 3568 // CHECK2-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 3569 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3570 // CHECK2: omp.inner.for.end: 3571 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3572 // CHECK2: omp.loop.exit: 3573 // CHECK2-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3574 // CHECK2-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 3575 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 3576 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3577 // CHECK2: omp.precond.end: 3578 // CHECK2-NEXT: ret void 3579 // 3580 // 3581 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l267 3582 // CHECK2-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 3583 // CHECK2-NEXT: entry: 3584 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 3585 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 3586 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 3587 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 3588 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 3589 // CHECK2-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 3590 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 3591 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 3592 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 3593 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 3594 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 3595 // CHECK2-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 3596 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 3597 // CHECK2-NEXT: ret void 3598 // 3599 // 3600 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..14 3601 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3602 // CHECK2-NEXT: entry: 3603 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3604 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3605 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 3606 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3607 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3608 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3609 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3610 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3611 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3612 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3613 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3614 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 3615 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3616 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 3617 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 3618 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3619 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3620 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 3621 // CHECK2-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 3622 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3623 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3624 // CHECK2-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 3625 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3626 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3627 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3628 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3629 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 3630 // CHECK2-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3631 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 3632 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 3633 // CHECK2-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 3634 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 3635 // CHECK2-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 3636 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 3637 // CHECK2-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3638 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3639 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 3640 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3641 // CHECK2-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 3642 // CHECK2-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 3643 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3644 // CHECK2-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3645 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 3646 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3647 // CHECK2: omp.precond.then: 3648 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 3649 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 3650 // CHECK2-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 3651 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3652 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3653 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3654 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 3655 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3656 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3657 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 3658 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 3659 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3660 // CHECK2: cond.true: 3661 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 3662 // CHECK2-NEXT: br label [[COND_END:%.*]] 3663 // CHECK2: cond.false: 3664 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3665 // CHECK2-NEXT: br label [[COND_END]] 3666 // CHECK2: cond.end: 3667 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 3668 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 3669 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3670 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 3671 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3672 // CHECK2: omp.inner.for.cond: 3673 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3674 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3675 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 3676 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3677 // CHECK2: omp.inner.for.body: 3678 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3679 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 3680 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3681 // CHECK2-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 3682 // CHECK2-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3683 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 3684 // CHECK2-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 3685 // CHECK2-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 3686 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 3687 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3688 // CHECK2: omp.inner.for.inc: 3689 // CHECK2-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3690 // CHECK2-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3691 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 3692 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 3693 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3694 // CHECK2: omp.inner.for.end: 3695 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3696 // CHECK2: omp.loop.exit: 3697 // CHECK2-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3698 // CHECK2-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 3699 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 3700 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3701 // CHECK2: omp.precond.end: 3702 // CHECK2-NEXT: ret void 3703 // 3704 // 3705 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..15 3706 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 3707 // CHECK2-NEXT: entry: 3708 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3709 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3710 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 3711 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 3712 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3713 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3714 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3715 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3716 // CHECK2-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 3717 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3718 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3719 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3720 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 3721 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3722 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 3723 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 3724 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3725 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3726 // CHECK2-NEXT: [[I6:%.*]] = alloca i32, align 4 3727 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_4:%.*]], align 8 3728 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3729 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3730 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3731 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3732 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3733 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3734 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3735 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3736 // CHECK2-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 3737 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3738 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 3739 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 3740 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 3741 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 3742 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 3743 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3744 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3745 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 3746 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3747 // CHECK2-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 3748 // CHECK2-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 3749 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3750 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3751 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 3752 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3753 // CHECK2: omp.precond.then: 3754 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 3755 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 3756 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 3757 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3758 // CHECK2-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 3759 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3760 // CHECK2-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 3761 // CHECK2-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 3762 // CHECK2-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 3763 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3764 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3765 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 3766 // CHECK2-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3767 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 3768 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 3769 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 3770 // CHECK2: omp.dispatch.cond: 3771 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3772 // CHECK2-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 3773 // CHECK2-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3774 // CHECK2-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 3775 // CHECK2-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3776 // CHECK2: cond.true: 3777 // CHECK2-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3778 // CHECK2-NEXT: br label [[COND_END:%.*]] 3779 // CHECK2: cond.false: 3780 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3781 // CHECK2-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 3782 // CHECK2-NEXT: br label [[COND_END]] 3783 // CHECK2: cond.end: 3784 // CHECK2-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 3785 // CHECK2-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 3786 // CHECK2-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 3787 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 3788 // CHECK2-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 3789 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3790 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3791 // CHECK2-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 3792 // CHECK2-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 3793 // CHECK2: omp.dispatch.body: 3794 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3795 // CHECK2: omp.inner.for.cond: 3796 // CHECK2-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3797 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3798 // CHECK2-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 3799 // CHECK2-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3800 // CHECK2: omp.inner.for.body: 3801 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3802 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 3803 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 3804 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 3805 // CHECK2-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 8 3806 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 3807 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 3808 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM]] 3809 // CHECK2-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 8 3810 // CHECK2-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 8 3811 // CHECK2-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 3812 // CHECK2-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 3813 // CHECK2-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM13]] 3814 // CHECK2-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX14]], align 8 3815 // CHECK2-NEXT: [[ADD15:%.*]] = fadd double [[TMP25]], [[TMP28]] 3816 // CHECK2-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 8 3817 // CHECK2-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 3818 // CHECK2-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 3819 // CHECK2-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds double, double* [[TMP29]], i64 [[IDXPROM16]] 3820 // CHECK2-NEXT: store double [[ADD15]], double* [[ARRAYIDX17]], align 8 3821 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 0 3822 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP31]], align 8 3823 // CHECK2-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 1 3824 // CHECK2-NEXT: store i32* [[I6]], i32** [[TMP32]], align 8 3825 // CHECK2-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 2 3826 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP33]], align 8 3827 // CHECK2-NEXT: [[TMP34:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 3 3828 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP34]], align 8 3829 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE3_clEv"(%class.anon.4* nonnull dereferenceable(32) [[REF_TMP]]) 3830 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 3831 // CHECK2: omp.body.continue: 3832 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3833 // CHECK2: omp.inner.for.inc: 3834 // CHECK2-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3835 // CHECK2-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP35]], 1 3836 // CHECK2-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 3837 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3838 // CHECK2: omp.inner.for.end: 3839 // CHECK2-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 3840 // CHECK2: omp.dispatch.inc: 3841 // CHECK2-NEXT: [[TMP36:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 3842 // CHECK2-NEXT: [[TMP37:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3843 // CHECK2-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP36]], [[TMP37]] 3844 // CHECK2-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 3845 // CHECK2-NEXT: [[TMP38:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 3846 // CHECK2-NEXT: [[TMP39:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3847 // CHECK2-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP38]], [[TMP39]] 3848 // CHECK2-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 3849 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND]] 3850 // CHECK2: omp.dispatch.end: 3851 // CHECK2-NEXT: [[TMP40:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3852 // CHECK2-NEXT: [[TMP41:%.*]] = load i32, i32* [[TMP40]], align 4 3853 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP41]]) 3854 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3855 // CHECK2: omp.precond.end: 3856 // CHECK2-NEXT: ret void 3857 // 3858 // 3859 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l300 3860 // CHECK2-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 3861 // CHECK2-NEXT: entry: 3862 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 3863 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 3864 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 3865 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 3866 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 3867 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 3868 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 3869 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 3870 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 3871 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 3872 // CHECK2-NEXT: ret void 3873 // 3874 // 3875 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..18 3876 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3877 // CHECK2-NEXT: entry: 3878 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3879 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3880 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3881 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3882 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3883 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3884 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3885 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3886 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3887 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3888 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3889 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 3890 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 3891 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3892 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3893 // CHECK2-NEXT: [[I3:%.*]] = alloca i32, align 4 3894 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3895 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3896 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3897 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3898 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3899 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3900 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 3901 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 3902 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 3903 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 3904 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 3905 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 3906 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3907 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 3908 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 3909 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 3910 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 3911 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 3912 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 3913 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 3914 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 3915 // CHECK2: omp.precond.then: 3916 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 3917 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3918 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 3919 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 3920 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 3921 // CHECK2-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3922 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 3923 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 3924 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3925 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3926 // CHECK2-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 3927 // CHECK2-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 3928 // CHECK2: cond.true: 3929 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 3930 // CHECK2-NEXT: br label [[COND_END:%.*]] 3931 // CHECK2: cond.false: 3932 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3933 // CHECK2-NEXT: br label [[COND_END]] 3934 // CHECK2: cond.end: 3935 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 3936 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 3937 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3938 // CHECK2-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 3939 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 3940 // CHECK2: omp.inner.for.cond: 3941 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3942 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3943 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 3944 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 3945 // CHECK2: omp.inner.for.body: 3946 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 3947 // CHECK2-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 3948 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 3949 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 3950 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 3951 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 3952 // CHECK2: omp.inner.for.inc: 3953 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 3954 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 3955 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 3956 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 3957 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 3958 // CHECK2: omp.inner.for.end: 3959 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 3960 // CHECK2: omp.loop.exit: 3961 // CHECK2-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 3962 // CHECK2-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 3963 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 3964 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 3965 // CHECK2: omp.precond.end: 3966 // CHECK2-NEXT: ret void 3967 // 3968 // 3969 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..19 3970 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 3971 // CHECK2-NEXT: entry: 3972 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 3973 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 3974 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 3975 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 3976 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 3977 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 3978 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 3979 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 3980 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 3981 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 3982 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 3983 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 3984 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 3985 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 3986 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 3987 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 3988 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 3989 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 3990 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_5:%.*]], align 8 3991 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 3992 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 3993 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 3994 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 3995 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 3996 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 3997 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 3998 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 3999 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 4000 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 4001 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 4002 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 4003 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4004 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 4005 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4006 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4007 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4008 // CHECK2-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4009 // CHECK2-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4010 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 4011 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4012 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4013 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4014 // CHECK2: omp.precond.then: 4015 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 4016 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4017 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 4018 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 4019 // CHECK2-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 4020 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 4021 // CHECK2-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 4022 // CHECK2-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 4023 // CHECK2-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 4024 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4025 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4026 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4027 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4028 // CHECK2-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4029 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 4030 // CHECK2-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 4031 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 4032 // CHECK2: omp.dispatch.cond: 4033 // CHECK2-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4034 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 4035 // CHECK2-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 4036 // CHECK2-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 4037 // CHECK2-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 4038 // CHECK2: omp.dispatch.body: 4039 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4040 // CHECK2-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 4041 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4042 // CHECK2: omp.inner.for.cond: 4043 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 4044 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !11 4045 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 4046 // CHECK2-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4047 // CHECK2: omp.inner.for.body: 4048 // CHECK2-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 4049 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 4050 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 4051 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !11 4052 // CHECK2-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !11 4053 // CHECK2-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 4054 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 4055 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i64 [[IDXPROM]] 4056 // CHECK2-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !11 4057 // CHECK2-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !11 4058 // CHECK2-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 4059 // CHECK2-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 4060 // CHECK2-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM6]] 4061 // CHECK2-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX7]], align 8, !llvm.access.group !11 4062 // CHECK2-NEXT: [[ADD8:%.*]] = fadd double [[TMP23]], [[TMP26]] 4063 // CHECK2-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !11 4064 // CHECK2-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !11 4065 // CHECK2-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 4066 // CHECK2-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM9]] 4067 // CHECK2-NEXT: store double [[ADD8]], double* [[ARRAYIDX10]], align 8, !llvm.access.group !11 4068 // CHECK2-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 0 4069 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP29]], align 8, !llvm.access.group !11 4070 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 1 4071 // CHECK2-NEXT: store i32* [[I4]], i32** [[TMP30]], align 8, !llvm.access.group !11 4072 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 2 4073 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP31]], align 8, !llvm.access.group !11 4074 // CHECK2-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 3 4075 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP32]], align 8, !llvm.access.group !11 4076 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE4_clEv"(%class.anon.5* nonnull dereferenceable(32) [[REF_TMP]]), !llvm.access.group !11 4077 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 4078 // CHECK2: omp.body.continue: 4079 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4080 // CHECK2: omp.inner.for.inc: 4081 // CHECK2-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 4082 // CHECK2-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP33]], 1 4083 // CHECK2-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !11 4084 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP12:![0-9]+]] 4085 // CHECK2: omp.inner.for.end: 4086 // CHECK2-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 4087 // CHECK2: omp.dispatch.inc: 4088 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND]] 4089 // CHECK2: omp.dispatch.end: 4090 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 4091 // CHECK2: omp.precond.end: 4092 // CHECK2-NEXT: ret void 4093 // 4094 // 4095 // CHECK2-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l329 4096 // CHECK2-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 4097 // CHECK2-NEXT: entry: 4098 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 4099 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 4100 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 4101 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 4102 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 4103 // CHECK2-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 4104 // CHECK2-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 4105 // CHECK2-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 4106 // CHECK2-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 4107 // CHECK2-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 4108 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 4109 // CHECK2-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 4110 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 4111 // CHECK2-NEXT: ret void 4112 // 4113 // 4114 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..22 4115 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR2]] { 4116 // CHECK2-NEXT: entry: 4117 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 4118 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 4119 // CHECK2-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 4120 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 4121 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 4122 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 4123 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 4124 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4125 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4126 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 4127 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4128 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 4129 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 4130 // CHECK2-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 4131 // CHECK2-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 4132 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4133 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4134 // CHECK2-NEXT: [[I4:%.*]] = alloca i32, align 4 4135 // CHECK2-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 4136 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 4137 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 4138 // CHECK2-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 4139 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 4140 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 4141 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 4142 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 4143 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 4144 // CHECK2-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 4145 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 4146 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 4147 // CHECK2-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 4148 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 4149 // CHECK2-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 4150 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 4151 // CHECK2-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4152 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4153 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 4154 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4155 // CHECK2-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 4156 // CHECK2-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 4157 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 4158 // CHECK2-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4159 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 4160 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4161 // CHECK2: omp.precond.then: 4162 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 4163 // CHECK2-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 4164 // CHECK2-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 4165 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4166 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4167 // CHECK2-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4168 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 4169 // CHECK2-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 4170 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4171 // CHECK2-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 4172 // CHECK2-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 4173 // CHECK2-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4174 // CHECK2: cond.true: 4175 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 4176 // CHECK2-NEXT: br label [[COND_END:%.*]] 4177 // CHECK2: cond.false: 4178 // CHECK2-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4179 // CHECK2-NEXT: br label [[COND_END]] 4180 // CHECK2: cond.end: 4181 // CHECK2-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 4182 // CHECK2-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 4183 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4184 // CHECK2-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 4185 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4186 // CHECK2: omp.inner.for.cond: 4187 // CHECK2-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4188 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4189 // CHECK2-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 4190 // CHECK2-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4191 // CHECK2: omp.inner.for.body: 4192 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4193 // CHECK2-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 4194 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4195 // CHECK2-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 4196 // CHECK2-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4197 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 4198 // CHECK2-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 4199 // CHECK2-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 4200 // CHECK2-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 4201 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4202 // CHECK2: omp.inner.for.inc: 4203 // CHECK2-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4204 // CHECK2-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4205 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 4206 // CHECK2-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 4207 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]] 4208 // CHECK2: omp.inner.for.end: 4209 // CHECK2-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4210 // CHECK2: omp.loop.exit: 4211 // CHECK2-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4212 // CHECK2-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 4213 // CHECK2-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 4214 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 4215 // CHECK2: omp.precond.end: 4216 // CHECK2-NEXT: ret void 4217 // 4218 // 4219 // CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..23 4220 // CHECK2-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 4221 // CHECK2-NEXT: entry: 4222 // CHECK2-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 4223 // CHECK2-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 4224 // CHECK2-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 4225 // CHECK2-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 4226 // CHECK2-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 4227 // CHECK2-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 4228 // CHECK2-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 4229 // CHECK2-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 4230 // CHECK2-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 4231 // CHECK2-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4232 // CHECK2-NEXT: [[TMP:%.*]] = alloca i32, align 4 4233 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4234 // CHECK2-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 4235 // CHECK2-NEXT: [[I:%.*]] = alloca i32, align 4 4236 // CHECK2-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 4237 // CHECK2-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 4238 // CHECK2-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4239 // CHECK2-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4240 // CHECK2-NEXT: [[I6:%.*]] = alloca i32, align 4 4241 // CHECK2-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_6:%.*]], align 8 4242 // CHECK2-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 4243 // CHECK2-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 4244 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 4245 // CHECK2-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 4246 // CHECK2-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 4247 // CHECK2-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 4248 // CHECK2-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 4249 // CHECK2-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 4250 // CHECK2-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 4251 // CHECK2-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 4252 // CHECK2-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 4253 // CHECK2-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 4254 // CHECK2-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 4255 // CHECK2-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 4256 // CHECK2-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4257 // CHECK2-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4258 // CHECK2-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4259 // CHECK2-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4260 // CHECK2-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4261 // CHECK2-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 4262 // CHECK2-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 4263 // CHECK2-NEXT: store i32 0, i32* [[I]], align 4 4264 // CHECK2-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4265 // CHECK2-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4266 // CHECK2-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4267 // CHECK2: omp.precond.then: 4268 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 4269 // CHECK2-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 4270 // CHECK2-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 4271 // CHECK2-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 4272 // CHECK2-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 4273 // CHECK2-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 4274 // CHECK2-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 4275 // CHECK2-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 4276 // CHECK2-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 4277 // CHECK2-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4278 // CHECK2-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4279 // CHECK2-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 4280 // CHECK2-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4281 // CHECK2-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4282 // CHECK2-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4283 // CHECK2-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 4284 // CHECK2-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 4285 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 4286 // CHECK2: omp.dispatch.cond: 4287 // CHECK2-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 4288 // CHECK2-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 4289 // CHECK2-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 4290 // CHECK2-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 4291 // CHECK2-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 4292 // CHECK2: omp.dispatch.body: 4293 // CHECK2-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4294 // CHECK2-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 4295 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4296 // CHECK2: omp.inner.for.cond: 4297 // CHECK2-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 4298 // CHECK2-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !14 4299 // CHECK2-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 4300 // CHECK2-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4301 // CHECK2: omp.inner.for.body: 4302 // CHECK2-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 4303 // CHECK2-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 4304 // CHECK2-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 4305 // CHECK2-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !14 4306 // CHECK2-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !14 4307 // CHECK2-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 4308 // CHECK2-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 4309 // CHECK2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i64 [[IDXPROM]] 4310 // CHECK2-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !14 4311 // CHECK2-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !14 4312 // CHECK2-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 4313 // CHECK2-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 4314 // CHECK2-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds double, double* [[TMP25]], i64 [[IDXPROM8]] 4315 // CHECK2-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX9]], align 8, !llvm.access.group !14 4316 // CHECK2-NEXT: [[ADD10:%.*]] = fadd double [[TMP24]], [[TMP27]] 4317 // CHECK2-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !14 4318 // CHECK2-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !14 4319 // CHECK2-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 4320 // CHECK2-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP28]], i64 [[IDXPROM11]] 4321 // CHECK2-NEXT: store double [[ADD10]], double* [[ARRAYIDX12]], align 8, !llvm.access.group !14 4322 // CHECK2-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 0 4323 // CHECK2-NEXT: store double** [[TMP1]], double*** [[TMP30]], align 8, !llvm.access.group !14 4324 // CHECK2-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 1 4325 // CHECK2-NEXT: store i32* [[I6]], i32** [[TMP31]], align 8, !llvm.access.group !14 4326 // CHECK2-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 2 4327 // CHECK2-NEXT: store double** [[TMP2]], double*** [[TMP32]], align 8, !llvm.access.group !14 4328 // CHECK2-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 3 4329 // CHECK2-NEXT: store double** [[TMP3]], double*** [[TMP33]], align 8, !llvm.access.group !14 4330 // CHECK2-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE5_clEv"(%class.anon.6* nonnull dereferenceable(32) [[REF_TMP]]), !llvm.access.group !14 4331 // CHECK2-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 4332 // CHECK2: omp.body.continue: 4333 // CHECK2-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4334 // CHECK2: omp.inner.for.inc: 4335 // CHECK2-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 4336 // CHECK2-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], 1 4337 // CHECK2-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !14 4338 // CHECK2-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP15:![0-9]+]] 4339 // CHECK2: omp.inner.for.end: 4340 // CHECK2-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 4341 // CHECK2: omp.dispatch.inc: 4342 // CHECK2-NEXT: br label [[OMP_DISPATCH_COND]] 4343 // CHECK2: omp.dispatch.end: 4344 // CHECK2-NEXT: br label [[OMP_PRECOND_END]] 4345 // CHECK2: omp.precond.end: 4346 // CHECK2-NEXT: ret void 4347 // 4348 // 4349 // CHECK2-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 4350 // CHECK2-SAME: () #[[ATTR4:[0-9]+]] { 4351 // CHECK2-NEXT: entry: 4352 // CHECK2-NEXT: call void @__tgt_register_requires(i64 1) 4353 // CHECK2-NEXT: ret void 4354 // 4355 // 4356 // CHECK3-LABEL: define {{[^@]+}}@main 4357 // CHECK3-SAME: () #[[ATTR0:[0-9]+]] { 4358 // CHECK3-NEXT: entry: 4359 // CHECK3-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 4360 // CHECK3-NEXT: [[A:%.*]] = alloca double*, align 4 4361 // CHECK3-NEXT: [[B:%.*]] = alloca double*, align 4 4362 // CHECK3-NEXT: [[C:%.*]] = alloca double*, align 4 4363 // CHECK3-NEXT: [[N:%.*]] = alloca i32, align 4 4364 // CHECK3-NEXT: [[CH:%.*]] = alloca i32, align 4 4365 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 4 4366 // CHECK3-NEXT: store i32 0, i32* [[RETVAL]], align 4 4367 // CHECK3-NEXT: store i32 10000, i32* [[N]], align 4 4368 // CHECK3-NEXT: store i32 100, i32* [[CH]], align 4 4369 // CHECK3-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 4370 // CHECK3-NEXT: store i32* [[N]], i32** [[TMP0]], align 4 4371 // CHECK3-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 4372 // CHECK3-NEXT: store double** [[A]], double*** [[TMP1]], align 4 4373 // CHECK3-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 4374 // CHECK3-NEXT: store double** [[B]], double*** [[TMP2]], align 4 4375 // CHECK3-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 4376 // CHECK3-NEXT: store double** [[C]], double*** [[TMP3]], align 4 4377 // CHECK3-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 4378 // CHECK3-NEXT: store i32* [[CH]], i32** [[TMP4]], align 4 4379 // CHECK3-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(20) [[REF_TMP]]) 4380 // CHECK3-NEXT: ret i32 0 4381 // 4382 // 4383 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l117 4384 // CHECK3-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2:[0-9]+]] { 4385 // CHECK3-NEXT: entry: 4386 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 4387 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 4388 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 4389 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 4390 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 4391 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 4392 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 4393 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 4394 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 4395 // CHECK3-NEXT: ret void 4396 // 4397 // 4398 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined. 4399 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4400 // CHECK3-NEXT: entry: 4401 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4402 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4403 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4404 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4405 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4406 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4407 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4408 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4409 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4410 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4411 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 4412 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 4413 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 4414 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4415 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4416 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 4417 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 4418 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 4419 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 4420 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 4421 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 4422 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 4423 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 4424 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 4425 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 4426 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 4427 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4428 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 4429 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4430 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4431 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4432 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4433 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4434 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 4435 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4436 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4437 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4438 // CHECK3: omp.precond.then: 4439 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 4440 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4441 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 4442 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4443 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4444 // CHECK3-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4445 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 4446 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 4447 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4448 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4449 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 4450 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4451 // CHECK3: cond.true: 4452 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4453 // CHECK3-NEXT: br label [[COND_END:%.*]] 4454 // CHECK3: cond.false: 4455 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4456 // CHECK3-NEXT: br label [[COND_END]] 4457 // CHECK3: cond.end: 4458 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 4459 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 4460 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4461 // CHECK3-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 4462 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4463 // CHECK3: omp.inner.for.cond: 4464 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4465 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4466 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 4467 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4468 // CHECK3: omp.inner.for.body: 4469 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4470 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4471 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 4472 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4473 // CHECK3: omp.inner.for.inc: 4474 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4475 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4476 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 4477 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 4478 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 4479 // CHECK3: omp.inner.for.end: 4480 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4481 // CHECK3: omp.loop.exit: 4482 // CHECK3-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4483 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 4484 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 4485 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 4486 // CHECK3: omp.precond.end: 4487 // CHECK3-NEXT: ret void 4488 // 4489 // 4490 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..1 4491 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4492 // CHECK3-NEXT: entry: 4493 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4494 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4495 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 4496 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 4497 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4498 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4499 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4500 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4501 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4502 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4503 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4504 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4505 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 4506 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 4507 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 4508 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4509 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4510 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 4511 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_0:%.*]], align 4 4512 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 4513 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 4514 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 4515 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 4516 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 4517 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 4518 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 4519 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 4520 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 4521 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 4522 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 4523 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 4524 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4525 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 4526 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4527 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4528 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4529 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4530 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4531 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 4532 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4533 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4534 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4535 // CHECK3: omp.precond.then: 4536 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 4537 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4538 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 4539 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 4540 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 4541 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 4542 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 4543 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4544 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4545 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4546 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 4547 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 4548 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4549 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4550 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 4551 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4552 // CHECK3: cond.true: 4553 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4554 // CHECK3-NEXT: br label [[COND_END:%.*]] 4555 // CHECK3: cond.false: 4556 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4557 // CHECK3-NEXT: br label [[COND_END]] 4558 // CHECK3: cond.end: 4559 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 4560 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 4561 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4562 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 4563 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4564 // CHECK3: omp.inner.for.cond: 4565 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4566 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4567 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 4568 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4569 // CHECK3: omp.inner.for.body: 4570 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4571 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 4572 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 4573 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 4574 // CHECK3-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 4575 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 4576 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 4577 // CHECK3-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 4578 // CHECK3-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 4579 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 4580 // CHECK3-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 4581 // CHECK3-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 4582 // CHECK3-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 4583 // CHECK3-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 4584 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 4585 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 4586 // CHECK3-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 4587 // CHECK3-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 0 4588 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 4589 // CHECK3-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 1 4590 // CHECK3-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 4591 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 2 4592 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 4593 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 3 4594 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 4595 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE_clEv"(%class.anon.0* nonnull dereferenceable(16) [[REF_TMP]]) 4596 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 4597 // CHECK3: omp.body.continue: 4598 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4599 // CHECK3: omp.inner.for.inc: 4600 // CHECK3-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4601 // CHECK3-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 4602 // CHECK3-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 4603 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 4604 // CHECK3: omp.inner.for.end: 4605 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4606 // CHECK3: omp.loop.exit: 4607 // CHECK3-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4608 // CHECK3-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 4609 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 4610 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 4611 // CHECK3: omp.precond.end: 4612 // CHECK3-NEXT: ret void 4613 // 4614 // 4615 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l160 4616 // CHECK3-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 4617 // CHECK3-NEXT: entry: 4618 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 4619 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 4620 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 4621 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 4622 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 4623 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 4624 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 4625 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 4626 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 4627 // CHECK3-NEXT: ret void 4628 // 4629 // 4630 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..2 4631 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4632 // CHECK3-NEXT: entry: 4633 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4634 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4635 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4636 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4637 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4638 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4639 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4640 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4641 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4642 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4643 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 4644 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 4645 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 4646 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4647 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4648 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 4649 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 4650 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 4651 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 4652 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 4653 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 4654 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 4655 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 4656 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 4657 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 4658 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 4659 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4660 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 4661 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4662 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4663 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4664 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4665 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4666 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 4667 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4668 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4669 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4670 // CHECK3: omp.precond.then: 4671 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 4672 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4673 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 4674 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4675 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4676 // CHECK3-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4677 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 4678 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 4679 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4680 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4681 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 4682 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4683 // CHECK3: cond.true: 4684 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4685 // CHECK3-NEXT: br label [[COND_END:%.*]] 4686 // CHECK3: cond.false: 4687 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4688 // CHECK3-NEXT: br label [[COND_END]] 4689 // CHECK3: cond.end: 4690 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 4691 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 4692 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4693 // CHECK3-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 4694 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4695 // CHECK3: omp.inner.for.cond: 4696 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4697 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4698 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 4699 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4700 // CHECK3: omp.inner.for.body: 4701 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4702 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4703 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 4704 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4705 // CHECK3: omp.inner.for.inc: 4706 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4707 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4708 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 4709 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 4710 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 4711 // CHECK3: omp.inner.for.end: 4712 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4713 // CHECK3: omp.loop.exit: 4714 // CHECK3-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4715 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 4716 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 4717 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 4718 // CHECK3: omp.precond.end: 4719 // CHECK3-NEXT: ret void 4720 // 4721 // 4722 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..3 4723 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4724 // CHECK3-NEXT: entry: 4725 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4726 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4727 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 4728 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 4729 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4730 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4731 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4732 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4733 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4734 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4735 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4736 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4737 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 4738 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 4739 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 4740 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4741 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4742 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 4743 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_1:%.*]], align 4 4744 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 4745 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 4746 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 4747 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 4748 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 4749 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 4750 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 4751 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 4752 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 4753 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 4754 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 4755 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 4756 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 4757 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 4758 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4759 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 4760 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4761 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4762 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4763 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 4764 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4765 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 4766 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4767 // CHECK3: omp.precond.then: 4768 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 4769 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4770 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 4771 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 4772 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 4773 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 4774 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 4775 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4776 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4777 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4778 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 4779 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 4780 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4781 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4782 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 4783 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4784 // CHECK3: cond.true: 4785 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4786 // CHECK3-NEXT: br label [[COND_END:%.*]] 4787 // CHECK3: cond.false: 4788 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4789 // CHECK3-NEXT: br label [[COND_END]] 4790 // CHECK3: cond.end: 4791 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 4792 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 4793 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 4794 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 4795 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4796 // CHECK3: omp.inner.for.cond: 4797 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4798 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 4799 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 4800 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4801 // CHECK3: omp.inner.for.body: 4802 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4803 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 4804 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 4805 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 4806 // CHECK3-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 4807 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 4808 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 4809 // CHECK3-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 4810 // CHECK3-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 4811 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 4812 // CHECK3-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 4813 // CHECK3-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 4814 // CHECK3-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 4815 // CHECK3-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 4816 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 4817 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 4818 // CHECK3-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 4819 // CHECK3-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 0 4820 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 4821 // CHECK3-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 1 4822 // CHECK3-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 4823 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 2 4824 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 4825 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 3 4826 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 4827 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE0_clEv"(%class.anon.1* nonnull dereferenceable(16) [[REF_TMP]]) 4828 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 4829 // CHECK3: omp.body.continue: 4830 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4831 // CHECK3: omp.inner.for.inc: 4832 // CHECK3-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4833 // CHECK3-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 4834 // CHECK3-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 4835 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 4836 // CHECK3: omp.inner.for.end: 4837 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4838 // CHECK3: omp.loop.exit: 4839 // CHECK3-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4840 // CHECK3-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 4841 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 4842 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 4843 // CHECK3: omp.precond.end: 4844 // CHECK3-NEXT: ret void 4845 // 4846 // 4847 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l202 4848 // CHECK3-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 4849 // CHECK3-NEXT: entry: 4850 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 4851 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 4852 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 4853 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 4854 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 4855 // CHECK3-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 4856 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 4857 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 4858 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 4859 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 4860 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 4861 // CHECK3-NEXT: ret void 4862 // 4863 // 4864 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..6 4865 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4866 // CHECK3-NEXT: entry: 4867 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4868 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4869 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 4870 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4871 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4872 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4873 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4874 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4875 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4876 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4877 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4878 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 4879 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 4880 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 4881 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 4882 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 4883 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 4884 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 4885 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 4886 // CHECK3-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 4887 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 4888 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 4889 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 4890 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 4891 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 4892 // CHECK3-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 4893 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 4894 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 4895 // CHECK3-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 4896 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 4897 // CHECK3-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 4898 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4899 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 4900 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 4901 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 4902 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 4903 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 4904 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 4905 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 4906 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 4907 // CHECK3: omp.precond.then: 4908 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 4909 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4910 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 4911 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 4912 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 4913 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 4914 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4915 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 4916 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 4917 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4918 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4919 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 4920 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 4921 // CHECK3: cond.true: 4922 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4923 // CHECK3-NEXT: br label [[COND_END:%.*]] 4924 // CHECK3: cond.false: 4925 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4926 // CHECK3-NEXT: br label [[COND_END]] 4927 // CHECK3: cond.end: 4928 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 4929 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 4930 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4931 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 4932 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 4933 // CHECK3: omp.inner.for.cond: 4934 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4935 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4936 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 4937 // CHECK3-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 4938 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 4939 // CHECK3: omp.inner.for.body: 4940 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4941 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4942 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 4943 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 4944 // CHECK3: omp.inner.for.inc: 4945 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 4946 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4947 // CHECK3-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 4948 // CHECK3-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 4949 // CHECK3-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4950 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4951 // CHECK3-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 4952 // CHECK3-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 4953 // CHECK3-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4954 // CHECK3-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 4955 // CHECK3-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 4956 // CHECK3-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 4957 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4958 // CHECK3-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4959 // CHECK3-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 4960 // CHECK3-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 4961 // CHECK3: cond.true10: 4962 // CHECK3-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 4963 // CHECK3-NEXT: br label [[COND_END12:%.*]] 4964 // CHECK3: cond.false11: 4965 // CHECK3-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 4966 // CHECK3-NEXT: br label [[COND_END12]] 4967 // CHECK3: cond.end12: 4968 // CHECK3-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 4969 // CHECK3-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 4970 // CHECK3-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 4971 // CHECK3-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 4972 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 4973 // CHECK3: omp.inner.for.end: 4974 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 4975 // CHECK3: omp.loop.exit: 4976 // CHECK3-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 4977 // CHECK3-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 4978 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 4979 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 4980 // CHECK3: omp.precond.end: 4981 // CHECK3-NEXT: ret void 4982 // 4983 // 4984 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..7 4985 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 4986 // CHECK3-NEXT: entry: 4987 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 4988 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 4989 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 4990 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 4991 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 4992 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 4993 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 4994 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 4995 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 4996 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 4997 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 4998 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 4999 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5000 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 5001 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 5002 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5003 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5004 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 5005 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_2:%.*]], align 4 5006 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5007 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5008 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5009 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5010 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5011 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5012 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5013 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5014 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5015 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5016 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5017 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5018 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5019 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 5020 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5021 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5022 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5023 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 5024 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5025 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5026 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5027 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5028 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5029 // CHECK3: omp.precond.then: 5030 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 5031 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5032 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 5033 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5034 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5035 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 5036 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 5037 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5038 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5039 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5040 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 5041 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5042 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5043 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5044 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 5045 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5046 // CHECK3: cond.true: 5047 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5048 // CHECK3-NEXT: br label [[COND_END:%.*]] 5049 // CHECK3: cond.false: 5050 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5051 // CHECK3-NEXT: br label [[COND_END]] 5052 // CHECK3: cond.end: 5053 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 5054 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 5055 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5056 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 5057 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5058 // CHECK3: omp.inner.for.cond: 5059 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5060 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5061 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 5062 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5063 // CHECK3: omp.inner.for.body: 5064 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5065 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 5066 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 5067 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 5068 // CHECK3-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 5069 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 5070 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 5071 // CHECK3-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 5072 // CHECK3-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 5073 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 5074 // CHECK3-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 5075 // CHECK3-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 5076 // CHECK3-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 5077 // CHECK3-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 5078 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 5079 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 5080 // CHECK3-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 5081 // CHECK3-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 0 5082 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 5083 // CHECK3-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 1 5084 // CHECK3-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 5085 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 2 5086 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 5087 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 3 5088 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 5089 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE1_clEv"(%class.anon.2* nonnull dereferenceable(16) [[REF_TMP]]) 5090 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 5091 // CHECK3: omp.body.continue: 5092 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5093 // CHECK3: omp.inner.for.inc: 5094 // CHECK3-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5095 // CHECK3-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 5096 // CHECK3-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 5097 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5098 // CHECK3: omp.inner.for.end: 5099 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5100 // CHECK3: omp.loop.exit: 5101 // CHECK3-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5102 // CHECK3-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 5103 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 5104 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5105 // CHECK3: omp.precond.end: 5106 // CHECK3-NEXT: ret void 5107 // 5108 // 5109 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l235 5110 // CHECK3-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 5111 // CHECK3-NEXT: entry: 5112 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 5113 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 5114 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 5115 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 5116 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 5117 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 5118 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 5119 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 5120 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 5121 // CHECK3-NEXT: ret void 5122 // 5123 // 5124 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..10 5125 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5126 // CHECK3-NEXT: entry: 5127 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5128 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5129 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5130 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5131 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5132 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5133 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5134 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5135 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5136 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5137 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5138 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 5139 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 5140 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5141 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5142 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 5143 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5144 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5145 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5146 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5147 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5148 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5149 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5150 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5151 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5152 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5153 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5154 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 5155 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5156 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5157 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5158 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 5159 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5160 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5161 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5162 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5163 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5164 // CHECK3: omp.precond.then: 5165 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 5166 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5167 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 5168 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5169 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5170 // CHECK3-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5171 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 5172 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5173 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5174 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5175 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 5176 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5177 // CHECK3: cond.true: 5178 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5179 // CHECK3-NEXT: br label [[COND_END:%.*]] 5180 // CHECK3: cond.false: 5181 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5182 // CHECK3-NEXT: br label [[COND_END]] 5183 // CHECK3: cond.end: 5184 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 5185 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 5186 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5187 // CHECK3-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 5188 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5189 // CHECK3: omp.inner.for.cond: 5190 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5191 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5192 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 5193 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5194 // CHECK3: omp.inner.for.body: 5195 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5196 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5197 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 5198 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5199 // CHECK3: omp.inner.for.inc: 5200 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5201 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5202 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 5203 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 5204 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5205 // CHECK3: omp.inner.for.end: 5206 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5207 // CHECK3: omp.loop.exit: 5208 // CHECK3-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5209 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 5210 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 5211 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5212 // CHECK3: omp.precond.end: 5213 // CHECK3-NEXT: ret void 5214 // 5215 // 5216 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..11 5217 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5218 // CHECK3-NEXT: entry: 5219 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5220 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5221 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 5222 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 5223 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5224 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5225 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5226 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5227 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5228 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5229 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5230 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5231 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5232 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 5233 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 5234 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5235 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5236 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 5237 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_3:%.*]], align 4 5238 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5239 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5240 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5241 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5242 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5243 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5244 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5245 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5246 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5247 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5248 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5249 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5250 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5251 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 5252 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5253 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5254 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5255 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 5256 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5257 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5258 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5259 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5260 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5261 // CHECK3: omp.precond.then: 5262 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 5263 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5264 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 5265 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5266 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5267 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 5268 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 5269 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5270 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5271 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5272 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 5273 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5274 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5275 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5276 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 5277 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5278 // CHECK3: cond.true: 5279 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5280 // CHECK3-NEXT: br label [[COND_END:%.*]] 5281 // CHECK3: cond.false: 5282 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5283 // CHECK3-NEXT: br label [[COND_END]] 5284 // CHECK3: cond.end: 5285 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 5286 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 5287 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5288 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 5289 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5290 // CHECK3: omp.inner.for.cond: 5291 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5292 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5293 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 5294 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5295 // CHECK3: omp.inner.for.body: 5296 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5297 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 5298 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 5299 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 5300 // CHECK3-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 5301 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 5302 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 5303 // CHECK3-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 5304 // CHECK3-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 5305 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 5306 // CHECK3-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 5307 // CHECK3-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 5308 // CHECK3-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 5309 // CHECK3-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 5310 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 5311 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 5312 // CHECK3-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 5313 // CHECK3-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 0 5314 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 5315 // CHECK3-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 1 5316 // CHECK3-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 5317 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 2 5318 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 5319 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 3 5320 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 5321 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE2_clEv"(%class.anon.3* nonnull dereferenceable(16) [[REF_TMP]]) 5322 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 5323 // CHECK3: omp.body.continue: 5324 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5325 // CHECK3: omp.inner.for.inc: 5326 // CHECK3-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5327 // CHECK3-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 5328 // CHECK3-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 5329 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5330 // CHECK3: omp.inner.for.end: 5331 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5332 // CHECK3: omp.loop.exit: 5333 // CHECK3-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5334 // CHECK3-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 5335 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 5336 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5337 // CHECK3: omp.precond.end: 5338 // CHECK3-NEXT: ret void 5339 // 5340 // 5341 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l267 5342 // CHECK3-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 5343 // CHECK3-NEXT: entry: 5344 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 5345 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 5346 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 5347 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 5348 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 5349 // CHECK3-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 5350 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 5351 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 5352 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 5353 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 5354 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 5355 // CHECK3-NEXT: ret void 5356 // 5357 // 5358 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..14 5359 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5360 // CHECK3-NEXT: entry: 5361 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5362 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5363 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 5364 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5365 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5366 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5367 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5368 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5369 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5370 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5371 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5372 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 5373 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5374 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 5375 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 5376 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5377 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5378 // CHECK3-NEXT: [[I4:%.*]] = alloca i32, align 4 5379 // CHECK3-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 5380 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5381 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5382 // CHECK3-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 5383 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5384 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5385 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5386 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5387 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 5388 // CHECK3-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5389 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 5390 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 5391 // CHECK3-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 5392 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 5393 // CHECK3-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 5394 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 5395 // CHECK3-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5396 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5397 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 5398 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5399 // CHECK3-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 5400 // CHECK3-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 5401 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5402 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5403 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 5404 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5405 // CHECK3: omp.precond.then: 5406 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 5407 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5408 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 5409 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5410 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5411 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5412 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 5413 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5414 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5415 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5416 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 5417 // CHECK3-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5418 // CHECK3: cond.true: 5419 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5420 // CHECK3-NEXT: br label [[COND_END:%.*]] 5421 // CHECK3: cond.false: 5422 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5423 // CHECK3-NEXT: br label [[COND_END]] 5424 // CHECK3: cond.end: 5425 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 5426 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 5427 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5428 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 5429 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5430 // CHECK3: omp.inner.for.cond: 5431 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5432 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5433 // CHECK3-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 5434 // CHECK3-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5435 // CHECK3: omp.inner.for.body: 5436 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5437 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5438 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5439 // CHECK3-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 5440 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 5441 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 5442 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5443 // CHECK3: omp.inner.for.inc: 5444 // CHECK3-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5445 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5446 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 5447 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 5448 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5449 // CHECK3: omp.inner.for.end: 5450 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5451 // CHECK3: omp.loop.exit: 5452 // CHECK3-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5453 // CHECK3-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 5454 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 5455 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5456 // CHECK3: omp.precond.end: 5457 // CHECK3-NEXT: ret void 5458 // 5459 // 5460 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..15 5461 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 5462 // CHECK3-NEXT: entry: 5463 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5464 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5465 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 5466 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 5467 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5468 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5469 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5470 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5471 // CHECK3-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 5472 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5473 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5474 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5475 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 5476 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5477 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 5478 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 5479 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5480 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5481 // CHECK3-NEXT: [[I4:%.*]] = alloca i32, align 4 5482 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_4:%.*]], align 4 5483 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5484 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5485 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5486 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5487 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5488 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5489 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5490 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5491 // CHECK3-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 5492 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5493 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5494 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5495 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5496 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5497 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5498 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5499 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5500 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5501 // CHECK3-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 5502 // CHECK3-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 5503 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5504 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5505 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5506 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5507 // CHECK3: omp.precond.then: 5508 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 5509 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5510 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 5511 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5512 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5513 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 5514 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 5515 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5516 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5517 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 5518 // CHECK3-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5519 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 5520 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 5521 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 5522 // CHECK3: omp.dispatch.cond: 5523 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5524 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5525 // CHECK3-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 5526 // CHECK3-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5527 // CHECK3: cond.true: 5528 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5529 // CHECK3-NEXT: br label [[COND_END:%.*]] 5530 // CHECK3: cond.false: 5531 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5532 // CHECK3-NEXT: br label [[COND_END]] 5533 // CHECK3: cond.end: 5534 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 5535 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 5536 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5537 // CHECK3-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 5538 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5539 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5540 // CHECK3-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 5541 // CHECK3-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 5542 // CHECK3: omp.dispatch.body: 5543 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5544 // CHECK3: omp.inner.for.cond: 5545 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5546 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5547 // CHECK3-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 5548 // CHECK3-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5549 // CHECK3: omp.inner.for.body: 5550 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5551 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 5552 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 5553 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 5554 // CHECK3-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 4 5555 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 5556 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 5557 // CHECK3-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 4 5558 // CHECK3-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 4 5559 // CHECK3-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 5560 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 5561 // CHECK3-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX8]], align 4 5562 // CHECK3-NEXT: [[ADD9:%.*]] = fadd double [[TMP25]], [[TMP28]] 5563 // CHECK3-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 4 5564 // CHECK3-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 5565 // CHECK3-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP29]], i32 [[TMP30]] 5566 // CHECK3-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 5567 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 0 5568 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP31]], align 4 5569 // CHECK3-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 1 5570 // CHECK3-NEXT: store i32* [[I4]], i32** [[TMP32]], align 4 5571 // CHECK3-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 2 5572 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP33]], align 4 5573 // CHECK3-NEXT: [[TMP34:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 3 5574 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP34]], align 4 5575 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE3_clEv"(%class.anon.4* nonnull dereferenceable(16) [[REF_TMP]]) 5576 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 5577 // CHECK3: omp.body.continue: 5578 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5579 // CHECK3: omp.inner.for.inc: 5580 // CHECK3-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5581 // CHECK3-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP35]], 1 5582 // CHECK3-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 5583 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5584 // CHECK3: omp.inner.for.end: 5585 // CHECK3-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 5586 // CHECK3: omp.dispatch.inc: 5587 // CHECK3-NEXT: [[TMP36:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5588 // CHECK3-NEXT: [[TMP37:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5589 // CHECK3-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP36]], [[TMP37]] 5590 // CHECK3-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 5591 // CHECK3-NEXT: [[TMP38:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5592 // CHECK3-NEXT: [[TMP39:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5593 // CHECK3-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP38]], [[TMP39]] 5594 // CHECK3-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 5595 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND]] 5596 // CHECK3: omp.dispatch.end: 5597 // CHECK3-NEXT: [[TMP40:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5598 // CHECK3-NEXT: [[TMP41:%.*]] = load i32, i32* [[TMP40]], align 4 5599 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP41]]) 5600 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5601 // CHECK3: omp.precond.end: 5602 // CHECK3-NEXT: ret void 5603 // 5604 // 5605 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l300 5606 // CHECK3-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 5607 // CHECK3-NEXT: entry: 5608 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 5609 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 5610 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 5611 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 5612 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 5613 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 5614 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 5615 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 5616 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 5617 // CHECK3-NEXT: ret void 5618 // 5619 // 5620 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..18 5621 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5622 // CHECK3-NEXT: entry: 5623 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5624 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5625 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5626 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5627 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5628 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5629 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5630 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5631 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5632 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5633 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5634 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 5635 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 5636 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5637 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5638 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 5639 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5640 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5641 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5642 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5643 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5644 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5645 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5646 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5647 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5648 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5649 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5650 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 5651 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5652 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5653 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5654 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 5655 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5656 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5657 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5658 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5659 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5660 // CHECK3: omp.precond.then: 5661 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 5662 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5663 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 5664 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5665 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5666 // CHECK3-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5667 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 5668 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5669 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5670 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5671 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 5672 // CHECK3-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5673 // CHECK3: cond.true: 5674 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5675 // CHECK3-NEXT: br label [[COND_END:%.*]] 5676 // CHECK3: cond.false: 5677 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5678 // CHECK3-NEXT: br label [[COND_END]] 5679 // CHECK3: cond.end: 5680 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 5681 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 5682 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5683 // CHECK3-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 5684 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5685 // CHECK3: omp.inner.for.cond: 5686 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5687 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5688 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 5689 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5690 // CHECK3: omp.inner.for.body: 5691 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5692 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5693 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 5694 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5695 // CHECK3: omp.inner.for.inc: 5696 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5697 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5698 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 5699 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 5700 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5701 // CHECK3: omp.inner.for.end: 5702 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5703 // CHECK3: omp.loop.exit: 5704 // CHECK3-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5705 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 5706 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 5707 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5708 // CHECK3: omp.precond.end: 5709 // CHECK3-NEXT: ret void 5710 // 5711 // 5712 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..19 5713 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5714 // CHECK3-NEXT: entry: 5715 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5716 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5717 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 5718 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 5719 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5720 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5721 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5722 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5723 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5724 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5725 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5726 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5727 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5728 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 5729 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 5730 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5731 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5732 // CHECK3-NEXT: [[I3:%.*]] = alloca i32, align 4 5733 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_5:%.*]], align 4 5734 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5735 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5736 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5737 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5738 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5739 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5740 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5741 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5742 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5743 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5744 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5745 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5746 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5747 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 5748 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5749 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5750 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5751 // CHECK3-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 5752 // CHECK3-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5753 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5754 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5755 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5756 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5757 // CHECK3: omp.precond.then: 5758 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 5759 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5760 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 5761 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5762 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5763 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 5764 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 5765 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5766 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5767 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5768 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 5769 // CHECK3-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5770 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 5771 // CHECK3-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 5772 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 5773 // CHECK3: omp.dispatch.cond: 5774 // CHECK3-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5775 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 5776 // CHECK3-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 5777 // CHECK3-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 5778 // CHECK3-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 5779 // CHECK3: omp.dispatch.body: 5780 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 5781 // CHECK3-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 5782 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5783 // CHECK3: omp.inner.for.cond: 5784 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 5785 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !12 5786 // CHECK3-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 5787 // CHECK3-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5788 // CHECK3: omp.inner.for.body: 5789 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 5790 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 5791 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 5792 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !12 5793 // CHECK3-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !12 5794 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 5795 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i32 [[TMP22]] 5796 // CHECK3-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !12 5797 // CHECK3-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !12 5798 // CHECK3-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 5799 // CHECK3-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 5800 // CHECK3-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX5]], align 4, !llvm.access.group !12 5801 // CHECK3-NEXT: [[ADD6:%.*]] = fadd double [[TMP23]], [[TMP26]] 5802 // CHECK3-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !12 5803 // CHECK3-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 5804 // CHECK3-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 5805 // CHECK3-NEXT: store double [[ADD6]], double* [[ARRAYIDX7]], align 4, !llvm.access.group !12 5806 // CHECK3-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 0 5807 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP29]], align 4, !llvm.access.group !12 5808 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 1 5809 // CHECK3-NEXT: store i32* [[I3]], i32** [[TMP30]], align 4, !llvm.access.group !12 5810 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 2 5811 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP31]], align 4, !llvm.access.group !12 5812 // CHECK3-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 3 5813 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP32]], align 4, !llvm.access.group !12 5814 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE4_clEv"(%class.anon.5* nonnull dereferenceable(16) [[REF_TMP]]), !llvm.access.group !12 5815 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 5816 // CHECK3: omp.body.continue: 5817 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5818 // CHECK3: omp.inner.for.inc: 5819 // CHECK3-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 5820 // CHECK3-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP33]], 1 5821 // CHECK3-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 5822 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP13:![0-9]+]] 5823 // CHECK3: omp.inner.for.end: 5824 // CHECK3-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 5825 // CHECK3: omp.dispatch.inc: 5826 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND]] 5827 // CHECK3: omp.dispatch.end: 5828 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5829 // CHECK3: omp.precond.end: 5830 // CHECK3-NEXT: ret void 5831 // 5832 // 5833 // CHECK3-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l329 5834 // CHECK3-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 5835 // CHECK3-NEXT: entry: 5836 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 5837 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 5838 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 5839 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 5840 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 5841 // CHECK3-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 5842 // CHECK3-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 5843 // CHECK3-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 5844 // CHECK3-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 5845 // CHECK3-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 5846 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 5847 // CHECK3-NEXT: ret void 5848 // 5849 // 5850 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..22 5851 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 5852 // CHECK3-NEXT: entry: 5853 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5854 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5855 // CHECK3-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 5856 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5857 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5858 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5859 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5860 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 5861 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5862 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5863 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5864 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 5865 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5866 // CHECK3-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 5867 // CHECK3-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 5868 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5869 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5870 // CHECK3-NEXT: [[I4:%.*]] = alloca i32, align 4 5871 // CHECK3-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 5872 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5873 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5874 // CHECK3-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 5875 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5876 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5877 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5878 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5879 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 5880 // CHECK3-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5881 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 5882 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 5883 // CHECK3-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 5884 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 5885 // CHECK3-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 5886 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 5887 // CHECK3-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5888 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5889 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 5890 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5891 // CHECK3-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 5892 // CHECK3-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 5893 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5894 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5895 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 5896 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5897 // CHECK3: omp.precond.then: 5898 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 5899 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5900 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 5901 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 5902 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 5903 // CHECK3-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5904 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 5905 // CHECK3-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 5906 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5907 // CHECK3-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5908 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 5909 // CHECK3-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 5910 // CHECK3: cond.true: 5911 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 5912 // CHECK3-NEXT: br label [[COND_END:%.*]] 5913 // CHECK3: cond.false: 5914 // CHECK3-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5915 // CHECK3-NEXT: br label [[COND_END]] 5916 // CHECK3: cond.end: 5917 // CHECK3-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 5918 // CHECK3-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 5919 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5920 // CHECK3-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 5921 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 5922 // CHECK3: omp.inner.for.cond: 5923 // CHECK3-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5924 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5925 // CHECK3-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 5926 // CHECK3-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 5927 // CHECK3: omp.inner.for.body: 5928 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 5929 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 5930 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 5931 // CHECK3-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 5932 // CHECK3-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 5933 // CHECK3-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 5934 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 5935 // CHECK3: omp.inner.for.inc: 5936 // CHECK3-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 5937 // CHECK3-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 5938 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 5939 // CHECK3-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 5940 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]] 5941 // CHECK3: omp.inner.for.end: 5942 // CHECK3-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 5943 // CHECK3: omp.loop.exit: 5944 // CHECK3-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 5945 // CHECK3-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 5946 // CHECK3-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 5947 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 5948 // CHECK3: omp.precond.end: 5949 // CHECK3-NEXT: ret void 5950 // 5951 // 5952 // CHECK3-LABEL: define {{[^@]+}}@.omp_outlined..23 5953 // CHECK3-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 5954 // CHECK3-NEXT: entry: 5955 // CHECK3-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 5956 // CHECK3-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 5957 // CHECK3-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 5958 // CHECK3-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 5959 // CHECK3-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 5960 // CHECK3-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 5961 // CHECK3-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 5962 // CHECK3-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 5963 // CHECK3-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 5964 // CHECK3-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 5965 // CHECK3-NEXT: [[TMP:%.*]] = alloca i32, align 4 5966 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 5967 // CHECK3-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 5968 // CHECK3-NEXT: [[I:%.*]] = alloca i32, align 4 5969 // CHECK3-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 5970 // CHECK3-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 5971 // CHECK3-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 5972 // CHECK3-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 5973 // CHECK3-NEXT: [[I4:%.*]] = alloca i32, align 4 5974 // CHECK3-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_6:%.*]], align 4 5975 // CHECK3-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 5976 // CHECK3-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 5977 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 5978 // CHECK3-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 5979 // CHECK3-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 5980 // CHECK3-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 5981 // CHECK3-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 5982 // CHECK3-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 5983 // CHECK3-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 5984 // CHECK3-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 5985 // CHECK3-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 5986 // CHECK3-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 5987 // CHECK3-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 5988 // CHECK3-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 5989 // CHECK3-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 5990 // CHECK3-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5991 // CHECK3-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 5992 // CHECK3-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 5993 // CHECK3-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 5994 // CHECK3-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 5995 // CHECK3-NEXT: store i32 0, i32* [[I]], align 4 5996 // CHECK3-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 5997 // CHECK3-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 5998 // CHECK3-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 5999 // CHECK3: omp.precond.then: 6000 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 6001 // CHECK3-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 6002 // CHECK3-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 6003 // CHECK3-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6004 // CHECK3-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6005 // CHECK3-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 6006 // CHECK3-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 6007 // CHECK3-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6008 // CHECK3-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6009 // CHECK3-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 6010 // CHECK3-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 6011 // CHECK3-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6012 // CHECK3-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6013 // CHECK3-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 6014 // CHECK3-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 6015 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 6016 // CHECK3: omp.dispatch.cond: 6017 // CHECK3-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6018 // CHECK3-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 6019 // CHECK3-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 6020 // CHECK3-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 6021 // CHECK3-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 6022 // CHECK3: omp.dispatch.body: 6023 // CHECK3-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 6024 // CHECK3-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 6025 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6026 // CHECK3: omp.inner.for.cond: 6027 // CHECK3-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 6028 // CHECK3-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !15 6029 // CHECK3-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 6030 // CHECK3-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6031 // CHECK3: omp.inner.for.body: 6032 // CHECK3-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 6033 // CHECK3-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 6034 // CHECK3-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 6035 // CHECK3-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !15 6036 // CHECK3-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !15 6037 // CHECK3-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 6038 // CHECK3-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i32 [[TMP23]] 6039 // CHECK3-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !15 6040 // CHECK3-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !15 6041 // CHECK3-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 6042 // CHECK3-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP25]], i32 [[TMP26]] 6043 // CHECK3-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX6]], align 4, !llvm.access.group !15 6044 // CHECK3-NEXT: [[ADD7:%.*]] = fadd double [[TMP24]], [[TMP27]] 6045 // CHECK3-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !15 6046 // CHECK3-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 6047 // CHECK3-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP28]], i32 [[TMP29]] 6048 // CHECK3-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4, !llvm.access.group !15 6049 // CHECK3-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 0 6050 // CHECK3-NEXT: store double** [[TMP1]], double*** [[TMP30]], align 4, !llvm.access.group !15 6051 // CHECK3-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 1 6052 // CHECK3-NEXT: store i32* [[I4]], i32** [[TMP31]], align 4, !llvm.access.group !15 6053 // CHECK3-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 2 6054 // CHECK3-NEXT: store double** [[TMP2]], double*** [[TMP32]], align 4, !llvm.access.group !15 6055 // CHECK3-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 3 6056 // CHECK3-NEXT: store double** [[TMP3]], double*** [[TMP33]], align 4, !llvm.access.group !15 6057 // CHECK3-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE5_clEv"(%class.anon.6* nonnull dereferenceable(16) [[REF_TMP]]), !llvm.access.group !15 6058 // CHECK3-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 6059 // CHECK3: omp.body.continue: 6060 // CHECK3-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6061 // CHECK3: omp.inner.for.inc: 6062 // CHECK3-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 6063 // CHECK3-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP34]], 1 6064 // CHECK3-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 6065 // CHECK3-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP16:![0-9]+]] 6066 // CHECK3: omp.inner.for.end: 6067 // CHECK3-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 6068 // CHECK3: omp.dispatch.inc: 6069 // CHECK3-NEXT: br label [[OMP_DISPATCH_COND]] 6070 // CHECK3: omp.dispatch.end: 6071 // CHECK3-NEXT: br label [[OMP_PRECOND_END]] 6072 // CHECK3: omp.precond.end: 6073 // CHECK3-NEXT: ret void 6074 // 6075 // 6076 // CHECK3-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 6077 // CHECK3-SAME: () #[[ATTR4:[0-9]+]] { 6078 // CHECK3-NEXT: entry: 6079 // CHECK3-NEXT: call void @__tgt_register_requires(i64 1) 6080 // CHECK3-NEXT: ret void 6081 // 6082 // 6083 // CHECK4-LABEL: define {{[^@]+}}@main 6084 // CHECK4-SAME: () #[[ATTR0:[0-9]+]] { 6085 // CHECK4-NEXT: entry: 6086 // CHECK4-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 6087 // CHECK4-NEXT: [[A:%.*]] = alloca double*, align 4 6088 // CHECK4-NEXT: [[B:%.*]] = alloca double*, align 4 6089 // CHECK4-NEXT: [[C:%.*]] = alloca double*, align 4 6090 // CHECK4-NEXT: [[N:%.*]] = alloca i32, align 4 6091 // CHECK4-NEXT: [[CH:%.*]] = alloca i32, align 4 6092 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 4 6093 // CHECK4-NEXT: store i32 0, i32* [[RETVAL]], align 4 6094 // CHECK4-NEXT: store i32 10000, i32* [[N]], align 4 6095 // CHECK4-NEXT: store i32 100, i32* [[CH]], align 4 6096 // CHECK4-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 6097 // CHECK4-NEXT: store i32* [[N]], i32** [[TMP0]], align 4 6098 // CHECK4-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 6099 // CHECK4-NEXT: store double** [[A]], double*** [[TMP1]], align 4 6100 // CHECK4-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 6101 // CHECK4-NEXT: store double** [[B]], double*** [[TMP2]], align 4 6102 // CHECK4-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 6103 // CHECK4-NEXT: store double** [[C]], double*** [[TMP3]], align 4 6104 // CHECK4-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 6105 // CHECK4-NEXT: store i32* [[CH]], i32** [[TMP4]], align 4 6106 // CHECK4-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(20) [[REF_TMP]]) 6107 // CHECK4-NEXT: ret i32 0 6108 // 6109 // 6110 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l117 6111 // CHECK4-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2:[0-9]+]] { 6112 // CHECK4-NEXT: entry: 6113 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 6114 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 6115 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 6116 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 6117 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 6118 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 6119 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 6120 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 6121 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 6122 // CHECK4-NEXT: ret void 6123 // 6124 // 6125 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined. 6126 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6127 // CHECK4-NEXT: entry: 6128 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6129 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6130 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6131 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6132 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6133 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6134 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6135 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6136 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6137 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6138 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6139 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 6140 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 6141 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6142 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6143 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6144 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6145 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6146 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6147 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6148 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6149 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6150 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6151 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6152 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6153 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6154 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6155 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6156 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6157 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6158 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6159 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6160 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6161 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6162 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6163 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6164 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6165 // CHECK4: omp.precond.then: 6166 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 6167 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6168 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 6169 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6170 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6171 // CHECK4-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6172 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 6173 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6174 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6175 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6176 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 6177 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6178 // CHECK4: cond.true: 6179 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6180 // CHECK4-NEXT: br label [[COND_END:%.*]] 6181 // CHECK4: cond.false: 6182 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6183 // CHECK4-NEXT: br label [[COND_END]] 6184 // CHECK4: cond.end: 6185 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 6186 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 6187 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6188 // CHECK4-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 6189 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6190 // CHECK4: omp.inner.for.cond: 6191 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6192 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6193 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 6194 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6195 // CHECK4: omp.inner.for.body: 6196 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6197 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6198 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 6199 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6200 // CHECK4: omp.inner.for.inc: 6201 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6202 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6203 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 6204 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 6205 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6206 // CHECK4: omp.inner.for.end: 6207 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6208 // CHECK4: omp.loop.exit: 6209 // CHECK4-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6210 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 6211 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 6212 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6213 // CHECK4: omp.precond.end: 6214 // CHECK4-NEXT: ret void 6215 // 6216 // 6217 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..1 6218 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6219 // CHECK4-NEXT: entry: 6220 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6221 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6222 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 6223 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 6224 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6225 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6226 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6227 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6228 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6229 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6230 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6231 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6232 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6233 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 6234 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 6235 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6236 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6237 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6238 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_0:%.*]], align 4 6239 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6240 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6241 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6242 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6243 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6244 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6245 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6246 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6247 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6248 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6249 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6250 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6251 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6252 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6253 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6254 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6255 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6256 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6257 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6258 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6259 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6260 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6261 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6262 // CHECK4: omp.precond.then: 6263 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 6264 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6265 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 6266 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6267 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6268 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 6269 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 6270 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6271 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6272 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6273 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 6274 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6275 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6276 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6277 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 6278 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6279 // CHECK4: cond.true: 6280 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6281 // CHECK4-NEXT: br label [[COND_END:%.*]] 6282 // CHECK4: cond.false: 6283 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6284 // CHECK4-NEXT: br label [[COND_END]] 6285 // CHECK4: cond.end: 6286 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 6287 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 6288 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 6289 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 6290 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6291 // CHECK4: omp.inner.for.cond: 6292 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6293 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6294 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 6295 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6296 // CHECK4: omp.inner.for.body: 6297 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6298 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 6299 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 6300 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 6301 // CHECK4-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 6302 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 6303 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 6304 // CHECK4-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 6305 // CHECK4-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 6306 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 6307 // CHECK4-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 6308 // CHECK4-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 6309 // CHECK4-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 6310 // CHECK4-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 6311 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 6312 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 6313 // CHECK4-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 6314 // CHECK4-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 0 6315 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 6316 // CHECK4-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 1 6317 // CHECK4-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 6318 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 2 6319 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 6320 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_0]], %class.anon.0* [[REF_TMP]], i32 0, i32 3 6321 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 6322 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE_clEv"(%class.anon.0* nonnull dereferenceable(16) [[REF_TMP]]) 6323 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 6324 // CHECK4: omp.body.continue: 6325 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6326 // CHECK4: omp.inner.for.inc: 6327 // CHECK4-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6328 // CHECK4-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 6329 // CHECK4-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 6330 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6331 // CHECK4: omp.inner.for.end: 6332 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6333 // CHECK4: omp.loop.exit: 6334 // CHECK4-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6335 // CHECK4-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 6336 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 6337 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6338 // CHECK4: omp.precond.end: 6339 // CHECK4-NEXT: ret void 6340 // 6341 // 6342 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l160 6343 // CHECK4-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 6344 // CHECK4-NEXT: entry: 6345 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 6346 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 6347 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 6348 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 6349 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 6350 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 6351 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 6352 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 6353 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 6354 // CHECK4-NEXT: ret void 6355 // 6356 // 6357 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..2 6358 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6359 // CHECK4-NEXT: entry: 6360 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6361 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6362 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6363 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6364 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6365 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6366 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6367 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6368 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6369 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6370 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6371 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 6372 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 6373 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6374 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6375 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6376 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6377 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6378 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6379 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6380 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6381 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6382 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6383 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6384 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6385 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6386 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6387 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6388 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6389 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6390 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6391 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6392 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6393 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6394 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6395 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6396 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6397 // CHECK4: omp.precond.then: 6398 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 6399 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6400 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 6401 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6402 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6403 // CHECK4-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6404 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 6405 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6406 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6407 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6408 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 6409 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6410 // CHECK4: cond.true: 6411 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6412 // CHECK4-NEXT: br label [[COND_END:%.*]] 6413 // CHECK4: cond.false: 6414 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6415 // CHECK4-NEXT: br label [[COND_END]] 6416 // CHECK4: cond.end: 6417 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 6418 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 6419 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6420 // CHECK4-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 6421 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6422 // CHECK4: omp.inner.for.cond: 6423 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6424 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6425 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 6426 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6427 // CHECK4: omp.inner.for.body: 6428 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6429 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6430 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 6431 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6432 // CHECK4: omp.inner.for.inc: 6433 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6434 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6435 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 6436 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 6437 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6438 // CHECK4: omp.inner.for.end: 6439 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6440 // CHECK4: omp.loop.exit: 6441 // CHECK4-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6442 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 6443 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 6444 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6445 // CHECK4: omp.precond.end: 6446 // CHECK4-NEXT: ret void 6447 // 6448 // 6449 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..3 6450 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6451 // CHECK4-NEXT: entry: 6452 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6453 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6454 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 6455 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 6456 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6457 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6458 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6459 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6460 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6461 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6462 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6463 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6464 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6465 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 6466 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 6467 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6468 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6469 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6470 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_1:%.*]], align 4 6471 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6472 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6473 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6474 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6475 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6476 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6477 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6478 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6479 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6480 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6481 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6482 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6483 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6484 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6485 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6486 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6487 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6488 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6489 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6490 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6491 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6492 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6493 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6494 // CHECK4: omp.precond.then: 6495 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 6496 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6497 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 6498 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6499 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6500 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 6501 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 6502 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6503 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6504 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6505 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 6506 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6507 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6508 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6509 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 6510 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6511 // CHECK4: cond.true: 6512 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6513 // CHECK4-NEXT: br label [[COND_END:%.*]] 6514 // CHECK4: cond.false: 6515 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6516 // CHECK4-NEXT: br label [[COND_END]] 6517 // CHECK4: cond.end: 6518 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 6519 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 6520 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 6521 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 6522 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6523 // CHECK4: omp.inner.for.cond: 6524 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6525 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6526 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 6527 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6528 // CHECK4: omp.inner.for.body: 6529 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6530 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 6531 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 6532 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 6533 // CHECK4-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 6534 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 6535 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 6536 // CHECK4-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 6537 // CHECK4-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 6538 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 6539 // CHECK4-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 6540 // CHECK4-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 6541 // CHECK4-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 6542 // CHECK4-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 6543 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 6544 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 6545 // CHECK4-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 6546 // CHECK4-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 0 6547 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 6548 // CHECK4-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 1 6549 // CHECK4-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 6550 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 2 6551 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 6552 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_1]], %class.anon.1* [[REF_TMP]], i32 0, i32 3 6553 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 6554 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE0_clEv"(%class.anon.1* nonnull dereferenceable(16) [[REF_TMP]]) 6555 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 6556 // CHECK4: omp.body.continue: 6557 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6558 // CHECK4: omp.inner.for.inc: 6559 // CHECK4-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6560 // CHECK4-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 6561 // CHECK4-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 6562 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6563 // CHECK4: omp.inner.for.end: 6564 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6565 // CHECK4: omp.loop.exit: 6566 // CHECK4-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6567 // CHECK4-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 6568 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 6569 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6570 // CHECK4: omp.precond.end: 6571 // CHECK4-NEXT: ret void 6572 // 6573 // 6574 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l202 6575 // CHECK4-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 6576 // CHECK4-NEXT: entry: 6577 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 6578 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 6579 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 6580 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 6581 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 6582 // CHECK4-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 6583 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 6584 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 6585 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 6586 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 6587 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 6588 // CHECK4-NEXT: ret void 6589 // 6590 // 6591 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..6 6592 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6593 // CHECK4-NEXT: entry: 6594 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6595 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6596 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 6597 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6598 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6599 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6600 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6601 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6602 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6603 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6604 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6605 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6606 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 6607 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 6608 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6609 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6610 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6611 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6612 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6613 // CHECK4-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 6614 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6615 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6616 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6617 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6618 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 6619 // CHECK4-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6620 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 6621 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 6622 // CHECK4-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 6623 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 6624 // CHECK4-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 6625 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6626 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 6627 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6628 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6629 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6630 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6631 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6632 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 6633 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6634 // CHECK4: omp.precond.then: 6635 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 6636 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6637 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 6638 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6639 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6640 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 6641 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6642 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 6643 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 6644 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6645 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6646 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 6647 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6648 // CHECK4: cond.true: 6649 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6650 // CHECK4-NEXT: br label [[COND_END:%.*]] 6651 // CHECK4: cond.false: 6652 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6653 // CHECK4-NEXT: br label [[COND_END]] 6654 // CHECK4: cond.end: 6655 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 6656 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 6657 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6658 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 6659 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6660 // CHECK4: omp.inner.for.cond: 6661 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6662 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6663 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 6664 // CHECK4-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 6665 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6666 // CHECK4: omp.inner.for.body: 6667 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6668 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6669 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 6670 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6671 // CHECK4: omp.inner.for.inc: 6672 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6673 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6674 // CHECK4-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 6675 // CHECK4-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 6676 // CHECK4-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6677 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6678 // CHECK4-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 6679 // CHECK4-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 6680 // CHECK4-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6681 // CHECK4-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6682 // CHECK4-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 6683 // CHECK4-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 6684 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6685 // CHECK4-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6686 // CHECK4-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 6687 // CHECK4-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 6688 // CHECK4: cond.true10: 6689 // CHECK4-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6690 // CHECK4-NEXT: br label [[COND_END12:%.*]] 6691 // CHECK4: cond.false11: 6692 // CHECK4-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6693 // CHECK4-NEXT: br label [[COND_END12]] 6694 // CHECK4: cond.end12: 6695 // CHECK4-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 6696 // CHECK4-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 6697 // CHECK4-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6698 // CHECK4-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 6699 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6700 // CHECK4: omp.inner.for.end: 6701 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6702 // CHECK4: omp.loop.exit: 6703 // CHECK4-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6704 // CHECK4-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 6705 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 6706 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6707 // CHECK4: omp.precond.end: 6708 // CHECK4-NEXT: ret void 6709 // 6710 // 6711 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..7 6712 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6713 // CHECK4-NEXT: entry: 6714 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6715 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6716 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 6717 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 6718 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6719 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6720 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6721 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6722 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6723 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6724 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6725 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6726 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6727 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 6728 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 6729 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6730 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6731 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6732 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_2:%.*]], align 4 6733 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6734 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6735 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6736 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6737 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6738 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6739 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6740 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6741 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6742 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6743 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6744 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6745 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6746 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6747 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6748 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6749 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6750 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6751 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6752 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6753 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6754 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6755 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6756 // CHECK4: omp.precond.then: 6757 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 6758 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6759 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 6760 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6761 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6762 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 6763 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 6764 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6765 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6766 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6767 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 6768 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6769 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6770 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6771 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 6772 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6773 // CHECK4: cond.true: 6774 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6775 // CHECK4-NEXT: br label [[COND_END:%.*]] 6776 // CHECK4: cond.false: 6777 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6778 // CHECK4-NEXT: br label [[COND_END]] 6779 // CHECK4: cond.end: 6780 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 6781 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 6782 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 6783 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 6784 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6785 // CHECK4: omp.inner.for.cond: 6786 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6787 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 6788 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 6789 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6790 // CHECK4: omp.inner.for.body: 6791 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6792 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 6793 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 6794 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 6795 // CHECK4-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 6796 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 6797 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 6798 // CHECK4-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 6799 // CHECK4-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 6800 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 6801 // CHECK4-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 6802 // CHECK4-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 6803 // CHECK4-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 6804 // CHECK4-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 6805 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 6806 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 6807 // CHECK4-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 6808 // CHECK4-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 0 6809 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 6810 // CHECK4-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 1 6811 // CHECK4-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 6812 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 2 6813 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 6814 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_2]], %class.anon.2* [[REF_TMP]], i32 0, i32 3 6815 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 6816 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE1_clEv"(%class.anon.2* nonnull dereferenceable(16) [[REF_TMP]]) 6817 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 6818 // CHECK4: omp.body.continue: 6819 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6820 // CHECK4: omp.inner.for.inc: 6821 // CHECK4-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6822 // CHECK4-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 6823 // CHECK4-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 6824 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6825 // CHECK4: omp.inner.for.end: 6826 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6827 // CHECK4: omp.loop.exit: 6828 // CHECK4-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6829 // CHECK4-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 6830 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 6831 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6832 // CHECK4: omp.precond.end: 6833 // CHECK4-NEXT: ret void 6834 // 6835 // 6836 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l235 6837 // CHECK4-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 6838 // CHECK4-NEXT: entry: 6839 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 6840 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 6841 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 6842 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 6843 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 6844 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 6845 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 6846 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 6847 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 6848 // CHECK4-NEXT: ret void 6849 // 6850 // 6851 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..10 6852 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6853 // CHECK4-NEXT: entry: 6854 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6855 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6856 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6857 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6858 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6859 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6860 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6861 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6862 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6863 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6864 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6865 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 6866 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 6867 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6868 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6869 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6870 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6871 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6872 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6873 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6874 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6875 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6876 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6877 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6878 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6879 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6880 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6881 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6882 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6883 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6884 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6885 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6886 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6887 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6888 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6889 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6890 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6891 // CHECK4: omp.precond.then: 6892 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 6893 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6894 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 6895 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6896 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6897 // CHECK4-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6898 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 6899 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 6900 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6901 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6902 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 6903 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 6904 // CHECK4: cond.true: 6905 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6906 // CHECK4-NEXT: br label [[COND_END:%.*]] 6907 // CHECK4: cond.false: 6908 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6909 // CHECK4-NEXT: br label [[COND_END]] 6910 // CHECK4: cond.end: 6911 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 6912 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 6913 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6914 // CHECK4-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 6915 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 6916 // CHECK4: omp.inner.for.cond: 6917 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6918 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6919 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 6920 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 6921 // CHECK4: omp.inner.for.body: 6922 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 6923 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 6924 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 6925 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 6926 // CHECK4: omp.inner.for.inc: 6927 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 6928 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 6929 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 6930 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 6931 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 6932 // CHECK4: omp.inner.for.end: 6933 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 6934 // CHECK4: omp.loop.exit: 6935 // CHECK4-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6936 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 6937 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 6938 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 6939 // CHECK4: omp.precond.end: 6940 // CHECK4-NEXT: ret void 6941 // 6942 // 6943 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..11 6944 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 6945 // CHECK4-NEXT: entry: 6946 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 6947 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 6948 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 6949 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 6950 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 6951 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 6952 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 6953 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 6954 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 6955 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 6956 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 6957 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 6958 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 6959 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 6960 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 6961 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 6962 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 6963 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 6964 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_3:%.*]], align 4 6965 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 6966 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 6967 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6968 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6969 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 6970 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 6971 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 6972 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 6973 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 6974 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 6975 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 6976 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 6977 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 6978 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 6979 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6980 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 6981 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 6982 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 6983 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 6984 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 6985 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 6986 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 6987 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 6988 // CHECK4: omp.precond.then: 6989 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 6990 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 6991 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 6992 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 6993 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 6994 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 6995 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 6996 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 6997 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 6998 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 6999 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 7000 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 7001 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7002 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7003 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 7004 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 7005 // CHECK4: cond.true: 7006 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7007 // CHECK4-NEXT: br label [[COND_END:%.*]] 7008 // CHECK4: cond.false: 7009 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7010 // CHECK4-NEXT: br label [[COND_END]] 7011 // CHECK4: cond.end: 7012 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 7013 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 7014 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7015 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 7016 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7017 // CHECK4: omp.inner.for.cond: 7018 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7019 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7020 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 7021 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7022 // CHECK4: omp.inner.for.body: 7023 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7024 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 7025 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 7026 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 7027 // CHECK4-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 7028 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 7029 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 7030 // CHECK4-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 7031 // CHECK4-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 7032 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 7033 // CHECK4-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 7034 // CHECK4-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 7035 // CHECK4-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 7036 // CHECK4-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 7037 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 7038 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 7039 // CHECK4-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 7040 // CHECK4-NEXT: [[TMP28:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 0 7041 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP28]], align 4 7042 // CHECK4-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 1 7043 // CHECK4-NEXT: store i32* [[I3]], i32** [[TMP29]], align 4 7044 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 2 7045 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP30]], align 4 7046 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_3]], %class.anon.3* [[REF_TMP]], i32 0, i32 3 7047 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP31]], align 4 7048 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE2_clEv"(%class.anon.3* nonnull dereferenceable(16) [[REF_TMP]]) 7049 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 7050 // CHECK4: omp.body.continue: 7051 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7052 // CHECK4: omp.inner.for.inc: 7053 // CHECK4-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7054 // CHECK4-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 7055 // CHECK4-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 7056 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 7057 // CHECK4: omp.inner.for.end: 7058 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 7059 // CHECK4: omp.loop.exit: 7060 // CHECK4-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7061 // CHECK4-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 7062 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 7063 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7064 // CHECK4: omp.precond.end: 7065 // CHECK4-NEXT: ret void 7066 // 7067 // 7068 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l267 7069 // CHECK4-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 7070 // CHECK4-NEXT: entry: 7071 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 7072 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 7073 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 7074 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 7075 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 7076 // CHECK4-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 7077 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 7078 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 7079 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 7080 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 7081 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 7082 // CHECK4-NEXT: ret void 7083 // 7084 // 7085 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..14 7086 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 7087 // CHECK4-NEXT: entry: 7088 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7089 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7090 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 7091 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7092 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7093 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7094 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7095 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 7096 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7097 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7098 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7099 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 7100 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7101 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 7102 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 7103 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7104 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7105 // CHECK4-NEXT: [[I4:%.*]] = alloca i32, align 4 7106 // CHECK4-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 7107 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7108 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7109 // CHECK4-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 7110 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7111 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7112 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7113 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7114 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 7115 // CHECK4-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7116 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 7117 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 7118 // CHECK4-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 7119 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 7120 // CHECK4-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 7121 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 7122 // CHECK4-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7123 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7124 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 7125 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7126 // CHECK4-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 7127 // CHECK4-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 7128 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7129 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7130 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 7131 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7132 // CHECK4: omp.precond.then: 7133 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 7134 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7135 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 7136 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7137 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7138 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7139 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 7140 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 7141 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7142 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7143 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 7144 // CHECK4-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 7145 // CHECK4: cond.true: 7146 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7147 // CHECK4-NEXT: br label [[COND_END:%.*]] 7148 // CHECK4: cond.false: 7149 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7150 // CHECK4-NEXT: br label [[COND_END]] 7151 // CHECK4: cond.end: 7152 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 7153 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 7154 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7155 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 7156 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7157 // CHECK4: omp.inner.for.cond: 7158 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7159 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7160 // CHECK4-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 7161 // CHECK4-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7162 // CHECK4: omp.inner.for.body: 7163 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7164 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7165 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7166 // CHECK4-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 7167 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 7168 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 7169 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7170 // CHECK4: omp.inner.for.inc: 7171 // CHECK4-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7172 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 7173 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 7174 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 7175 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 7176 // CHECK4: omp.inner.for.end: 7177 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 7178 // CHECK4: omp.loop.exit: 7179 // CHECK4-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7180 // CHECK4-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 7181 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 7182 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7183 // CHECK4: omp.precond.end: 7184 // CHECK4-NEXT: ret void 7185 // 7186 // 7187 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..15 7188 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 7189 // CHECK4-NEXT: entry: 7190 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7191 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7192 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 7193 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 7194 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7195 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7196 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7197 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7198 // CHECK4-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 7199 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7200 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7201 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7202 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 7203 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7204 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 7205 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 7206 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7207 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7208 // CHECK4-NEXT: [[I4:%.*]] = alloca i32, align 4 7209 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_4:%.*]], align 4 7210 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7211 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7212 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7213 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7214 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7215 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7216 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7217 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7218 // CHECK4-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 7219 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7220 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 7221 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 7222 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 7223 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 7224 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7225 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7226 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 7227 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7228 // CHECK4-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 7229 // CHECK4-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 7230 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7231 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7232 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 7233 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7234 // CHECK4: omp.precond.then: 7235 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 7236 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7237 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 7238 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7239 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7240 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 7241 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 7242 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7243 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7244 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 7245 // CHECK4-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7246 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 7247 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 7248 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 7249 // CHECK4: omp.dispatch.cond: 7250 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7251 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7252 // CHECK4-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 7253 // CHECK4-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 7254 // CHECK4: cond.true: 7255 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7256 // CHECK4-NEXT: br label [[COND_END:%.*]] 7257 // CHECK4: cond.false: 7258 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7259 // CHECK4-NEXT: br label [[COND_END]] 7260 // CHECK4: cond.end: 7261 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 7262 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 7263 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7264 // CHECK4-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 7265 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7266 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7267 // CHECK4-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 7268 // CHECK4-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 7269 // CHECK4: omp.dispatch.body: 7270 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7271 // CHECK4: omp.inner.for.cond: 7272 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7273 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7274 // CHECK4-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 7275 // CHECK4-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7276 // CHECK4: omp.inner.for.body: 7277 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7278 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 7279 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 7280 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 7281 // CHECK4-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 4 7282 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 7283 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 7284 // CHECK4-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 4 7285 // CHECK4-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 4 7286 // CHECK4-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 7287 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 7288 // CHECK4-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX8]], align 4 7289 // CHECK4-NEXT: [[ADD9:%.*]] = fadd double [[TMP25]], [[TMP28]] 7290 // CHECK4-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 4 7291 // CHECK4-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 7292 // CHECK4-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP29]], i32 [[TMP30]] 7293 // CHECK4-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 7294 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 0 7295 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP31]], align 4 7296 // CHECK4-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 1 7297 // CHECK4-NEXT: store i32* [[I4]], i32** [[TMP32]], align 4 7298 // CHECK4-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 2 7299 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP33]], align 4 7300 // CHECK4-NEXT: [[TMP34:%.*]] = getelementptr inbounds [[CLASS_ANON_4]], %class.anon.4* [[REF_TMP]], i32 0, i32 3 7301 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP34]], align 4 7302 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE3_clEv"(%class.anon.4* nonnull dereferenceable(16) [[REF_TMP]]) 7303 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 7304 // CHECK4: omp.body.continue: 7305 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7306 // CHECK4: omp.inner.for.inc: 7307 // CHECK4-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7308 // CHECK4-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP35]], 1 7309 // CHECK4-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 7310 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 7311 // CHECK4: omp.inner.for.end: 7312 // CHECK4-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 7313 // CHECK4: omp.dispatch.inc: 7314 // CHECK4-NEXT: [[TMP36:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7315 // CHECK4-NEXT: [[TMP37:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 7316 // CHECK4-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP36]], [[TMP37]] 7317 // CHECK4-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 7318 // CHECK4-NEXT: [[TMP38:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7319 // CHECK4-NEXT: [[TMP39:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 7320 // CHECK4-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP38]], [[TMP39]] 7321 // CHECK4-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 7322 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND]] 7323 // CHECK4: omp.dispatch.end: 7324 // CHECK4-NEXT: [[TMP40:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7325 // CHECK4-NEXT: [[TMP41:%.*]] = load i32, i32* [[TMP40]], align 4 7326 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP41]]) 7327 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7328 // CHECK4: omp.precond.end: 7329 // CHECK4-NEXT: ret void 7330 // 7331 // 7332 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l300 7333 // CHECK4-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 7334 // CHECK4-NEXT: entry: 7335 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 7336 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 7337 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 7338 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 7339 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 7340 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 7341 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 7342 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 7343 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 7344 // CHECK4-NEXT: ret void 7345 // 7346 // 7347 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..18 7348 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 7349 // CHECK4-NEXT: entry: 7350 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7351 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7352 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7353 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7354 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7355 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7356 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7357 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7358 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 7359 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7360 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7361 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 7362 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 7363 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7364 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7365 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 7366 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7367 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7368 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7369 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7370 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7371 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7372 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7373 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 7374 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 7375 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 7376 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 7377 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 7378 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7379 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 7380 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7381 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 7382 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7383 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7384 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7385 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 7386 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7387 // CHECK4: omp.precond.then: 7388 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 7389 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7390 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 7391 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7392 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7393 // CHECK4-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7394 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 7395 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 7396 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7397 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7398 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 7399 // CHECK4-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 7400 // CHECK4: cond.true: 7401 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7402 // CHECK4-NEXT: br label [[COND_END:%.*]] 7403 // CHECK4: cond.false: 7404 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7405 // CHECK4-NEXT: br label [[COND_END]] 7406 // CHECK4: cond.end: 7407 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 7408 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 7409 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7410 // CHECK4-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 7411 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7412 // CHECK4: omp.inner.for.cond: 7413 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7414 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7415 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 7416 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7417 // CHECK4: omp.inner.for.body: 7418 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7419 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7420 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 7421 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7422 // CHECK4: omp.inner.for.inc: 7423 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7424 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 7425 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 7426 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 7427 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 7428 // CHECK4: omp.inner.for.end: 7429 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 7430 // CHECK4: omp.loop.exit: 7431 // CHECK4-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7432 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 7433 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 7434 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7435 // CHECK4: omp.precond.end: 7436 // CHECK4-NEXT: ret void 7437 // 7438 // 7439 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..19 7440 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 7441 // CHECK4-NEXT: entry: 7442 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7443 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7444 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 7445 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 7446 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7447 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7448 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7449 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7450 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7451 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7452 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 7453 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7454 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7455 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 7456 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 7457 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7458 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7459 // CHECK4-NEXT: [[I3:%.*]] = alloca i32, align 4 7460 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_5:%.*]], align 4 7461 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7462 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7463 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7464 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7465 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7466 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7467 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7468 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7469 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7470 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 7471 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 7472 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 7473 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 7474 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 7475 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7476 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 7477 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7478 // CHECK4-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 7479 // CHECK4-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7480 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7481 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7482 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 7483 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7484 // CHECK4: omp.precond.then: 7485 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 7486 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7487 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 7488 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7489 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7490 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 7491 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 7492 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7493 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7494 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7495 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7496 // CHECK4-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7497 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 7498 // CHECK4-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 7499 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 7500 // CHECK4: omp.dispatch.cond: 7501 // CHECK4-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7502 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 7503 // CHECK4-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 7504 // CHECK4-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 7505 // CHECK4-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 7506 // CHECK4: omp.dispatch.body: 7507 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7508 // CHECK4-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 7509 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7510 // CHECK4: omp.inner.for.cond: 7511 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 7512 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !12 7513 // CHECK4-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 7514 // CHECK4-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7515 // CHECK4: omp.inner.for.body: 7516 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 7517 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 7518 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 7519 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !12 7520 // CHECK4-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !12 7521 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 7522 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i32 [[TMP22]] 7523 // CHECK4-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !12 7524 // CHECK4-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !12 7525 // CHECK4-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 7526 // CHECK4-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 7527 // CHECK4-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX5]], align 4, !llvm.access.group !12 7528 // CHECK4-NEXT: [[ADD6:%.*]] = fadd double [[TMP23]], [[TMP26]] 7529 // CHECK4-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !12 7530 // CHECK4-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !12 7531 // CHECK4-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 7532 // CHECK4-NEXT: store double [[ADD6]], double* [[ARRAYIDX7]], align 4, !llvm.access.group !12 7533 // CHECK4-NEXT: [[TMP29:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 0 7534 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP29]], align 4, !llvm.access.group !12 7535 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 1 7536 // CHECK4-NEXT: store i32* [[I3]], i32** [[TMP30]], align 4, !llvm.access.group !12 7537 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 2 7538 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP31]], align 4, !llvm.access.group !12 7539 // CHECK4-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_5]], %class.anon.5* [[REF_TMP]], i32 0, i32 3 7540 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP32]], align 4, !llvm.access.group !12 7541 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE4_clEv"(%class.anon.5* nonnull dereferenceable(16) [[REF_TMP]]), !llvm.access.group !12 7542 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 7543 // CHECK4: omp.body.continue: 7544 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7545 // CHECK4: omp.inner.for.inc: 7546 // CHECK4-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 7547 // CHECK4-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP33]], 1 7548 // CHECK4-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !12 7549 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP13:![0-9]+]] 7550 // CHECK4: omp.inner.for.end: 7551 // CHECK4-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 7552 // CHECK4: omp.dispatch.inc: 7553 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND]] 7554 // CHECK4: omp.dispatch.end: 7555 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7556 // CHECK4: omp.precond.end: 7557 // CHECK4-NEXT: ret void 7558 // 7559 // 7560 // CHECK4-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l329 7561 // CHECK4-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR2]] { 7562 // CHECK4-NEXT: entry: 7563 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 7564 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 7565 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 7566 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 7567 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 7568 // CHECK4-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 7569 // CHECK4-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 7570 // CHECK4-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 7571 // CHECK4-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 7572 // CHECK4-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 7573 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 7574 // CHECK4-NEXT: ret void 7575 // 7576 // 7577 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..22 7578 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR2]] { 7579 // CHECK4-NEXT: entry: 7580 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7581 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7582 // CHECK4-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 7583 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7584 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7585 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7586 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7587 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 7588 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7589 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7590 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7591 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 7592 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7593 // CHECK4-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 7594 // CHECK4-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 7595 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7596 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7597 // CHECK4-NEXT: [[I4:%.*]] = alloca i32, align 4 7598 // CHECK4-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 7599 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7600 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7601 // CHECK4-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 7602 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7603 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7604 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7605 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7606 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 7607 // CHECK4-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7608 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 7609 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 7610 // CHECK4-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 7611 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 7612 // CHECK4-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 7613 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 7614 // CHECK4-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7615 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7616 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 7617 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7618 // CHECK4-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 7619 // CHECK4-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 7620 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7621 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7622 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 7623 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7624 // CHECK4: omp.precond.then: 7625 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 7626 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7627 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 7628 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7629 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7630 // CHECK4-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7631 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 7632 // CHECK4-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 7633 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7634 // CHECK4-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7635 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 7636 // CHECK4-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 7637 // CHECK4: cond.true: 7638 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7639 // CHECK4-NEXT: br label [[COND_END:%.*]] 7640 // CHECK4: cond.false: 7641 // CHECK4-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7642 // CHECK4-NEXT: br label [[COND_END]] 7643 // CHECK4: cond.end: 7644 // CHECK4-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 7645 // CHECK4-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 7646 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7647 // CHECK4-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 7648 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7649 // CHECK4: omp.inner.for.cond: 7650 // CHECK4-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7651 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7652 // CHECK4-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 7653 // CHECK4-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7654 // CHECK4: omp.inner.for.body: 7655 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 7656 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 7657 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 7658 // CHECK4-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 7659 // CHECK4-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 7660 // CHECK4-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 7661 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7662 // CHECK4: omp.inner.for.inc: 7663 // CHECK4-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 7664 // CHECK4-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 7665 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 7666 // CHECK4-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 7667 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]] 7668 // CHECK4: omp.inner.for.end: 7669 // CHECK4-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 7670 // CHECK4: omp.loop.exit: 7671 // CHECK4-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7672 // CHECK4-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 7673 // CHECK4-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 7674 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7675 // CHECK4: omp.precond.end: 7676 // CHECK4-NEXT: ret void 7677 // 7678 // 7679 // CHECK4-LABEL: define {{[^@]+}}@.omp_outlined..23 7680 // CHECK4-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR2]] { 7681 // CHECK4-NEXT: entry: 7682 // CHECK4-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 7683 // CHECK4-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 7684 // CHECK4-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 7685 // CHECK4-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 7686 // CHECK4-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 7687 // CHECK4-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 7688 // CHECK4-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 7689 // CHECK4-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 7690 // CHECK4-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 7691 // CHECK4-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 7692 // CHECK4-NEXT: [[TMP:%.*]] = alloca i32, align 4 7693 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7694 // CHECK4-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 7695 // CHECK4-NEXT: [[I:%.*]] = alloca i32, align 4 7696 // CHECK4-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 7697 // CHECK4-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 7698 // CHECK4-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 7699 // CHECK4-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 7700 // CHECK4-NEXT: [[I4:%.*]] = alloca i32, align 4 7701 // CHECK4-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON_6:%.*]], align 4 7702 // CHECK4-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 7703 // CHECK4-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 7704 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7705 // CHECK4-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7706 // CHECK4-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 7707 // CHECK4-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 7708 // CHECK4-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 7709 // CHECK4-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 7710 // CHECK4-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 7711 // CHECK4-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 7712 // CHECK4-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 7713 // CHECK4-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 7714 // CHECK4-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 7715 // CHECK4-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 7716 // CHECK4-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 7717 // CHECK4-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7718 // CHECK4-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 7719 // CHECK4-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 7720 // CHECK4-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 7721 // CHECK4-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 7722 // CHECK4-NEXT: store i32 0, i32* [[I]], align 4 7723 // CHECK4-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 7724 // CHECK4-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 7725 // CHECK4-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 7726 // CHECK4: omp.precond.then: 7727 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 7728 // CHECK4-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 7729 // CHECK4-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 7730 // CHECK4-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 7731 // CHECK4-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 7732 // CHECK4-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 7733 // CHECK4-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 7734 // CHECK4-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 7735 // CHECK4-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 7736 // CHECK4-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 7737 // CHECK4-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7738 // CHECK4-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 7739 // CHECK4-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7740 // CHECK4-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 7741 // CHECK4-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 7742 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 7743 // CHECK4: omp.dispatch.cond: 7744 // CHECK4-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 7745 // CHECK4-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 7746 // CHECK4-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 7747 // CHECK4-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 7748 // CHECK4-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 7749 // CHECK4: omp.dispatch.body: 7750 // CHECK4-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 7751 // CHECK4-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 7752 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 7753 // CHECK4: omp.inner.for.cond: 7754 // CHECK4-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 7755 // CHECK4-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !15 7756 // CHECK4-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 7757 // CHECK4-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 7758 // CHECK4: omp.inner.for.body: 7759 // CHECK4-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 7760 // CHECK4-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 7761 // CHECK4-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 7762 // CHECK4-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !15 7763 // CHECK4-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !15 7764 // CHECK4-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 7765 // CHECK4-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i32 [[TMP23]] 7766 // CHECK4-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !15 7767 // CHECK4-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !15 7768 // CHECK4-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 7769 // CHECK4-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP25]], i32 [[TMP26]] 7770 // CHECK4-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX6]], align 4, !llvm.access.group !15 7771 // CHECK4-NEXT: [[ADD7:%.*]] = fadd double [[TMP24]], [[TMP27]] 7772 // CHECK4-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !15 7773 // CHECK4-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !15 7774 // CHECK4-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP28]], i32 [[TMP29]] 7775 // CHECK4-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4, !llvm.access.group !15 7776 // CHECK4-NEXT: [[TMP30:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 0 7777 // CHECK4-NEXT: store double** [[TMP1]], double*** [[TMP30]], align 4, !llvm.access.group !15 7778 // CHECK4-NEXT: [[TMP31:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 1 7779 // CHECK4-NEXT: store i32* [[I4]], i32** [[TMP31]], align 4, !llvm.access.group !15 7780 // CHECK4-NEXT: [[TMP32:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 2 7781 // CHECK4-NEXT: store double** [[TMP2]], double*** [[TMP32]], align 4, !llvm.access.group !15 7782 // CHECK4-NEXT: [[TMP33:%.*]] = getelementptr inbounds [[CLASS_ANON_6]], %class.anon.6* [[REF_TMP]], i32 0, i32 3 7783 // CHECK4-NEXT: store double** [[TMP3]], double*** [[TMP33]], align 4, !llvm.access.group !15 7784 // CHECK4-NEXT: call void @"_ZZZ4mainENK3$_0clEvENKUlvE5_clEv"(%class.anon.6* nonnull dereferenceable(16) [[REF_TMP]]), !llvm.access.group !15 7785 // CHECK4-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 7786 // CHECK4: omp.body.continue: 7787 // CHECK4-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 7788 // CHECK4: omp.inner.for.inc: 7789 // CHECK4-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 7790 // CHECK4-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP34]], 1 7791 // CHECK4-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !15 7792 // CHECK4-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP16:![0-9]+]] 7793 // CHECK4: omp.inner.for.end: 7794 // CHECK4-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 7795 // CHECK4: omp.dispatch.inc: 7796 // CHECK4-NEXT: br label [[OMP_DISPATCH_COND]] 7797 // CHECK4: omp.dispatch.end: 7798 // CHECK4-NEXT: br label [[OMP_PRECOND_END]] 7799 // CHECK4: omp.precond.end: 7800 // CHECK4-NEXT: ret void 7801 // 7802 // 7803 // CHECK4-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 7804 // CHECK4-SAME: () #[[ATTR4:[0-9]+]] { 7805 // CHECK4-NEXT: entry: 7806 // CHECK4-NEXT: call void @__tgt_register_requires(i64 1) 7807 // CHECK4-NEXT: ret void 7808 // 7809 // 7810 // CHECK5-LABEL: define {{[^@]+}}@main 7811 // CHECK5-SAME: () #[[ATTR0:[0-9]+]] { 7812 // CHECK5-NEXT: entry: 7813 // CHECK5-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 7814 // CHECK5-NEXT: [[A:%.*]] = alloca double*, align 8 7815 // CHECK5-NEXT: [[B:%.*]] = alloca double*, align 8 7816 // CHECK5-NEXT: [[C:%.*]] = alloca double*, align 8 7817 // CHECK5-NEXT: [[N:%.*]] = alloca i32, align 4 7818 // CHECK5-NEXT: [[CH:%.*]] = alloca i32, align 4 7819 // CHECK5-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 8 7820 // CHECK5-NEXT: store i32 0, i32* [[RETVAL]], align 4 7821 // CHECK5-NEXT: store i32 10000, i32* [[N]], align 4 7822 // CHECK5-NEXT: store i32 100, i32* [[CH]], align 4 7823 // CHECK5-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 7824 // CHECK5-NEXT: store i32* [[N]], i32** [[TMP0]], align 8 7825 // CHECK5-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 7826 // CHECK5-NEXT: store double** [[A]], double*** [[TMP1]], align 8 7827 // CHECK5-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 7828 // CHECK5-NEXT: store double** [[B]], double*** [[TMP2]], align 8 7829 // CHECK5-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 7830 // CHECK5-NEXT: store double** [[C]], double*** [[TMP3]], align 8 7831 // CHECK5-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 7832 // CHECK5-NEXT: store i32* [[CH]], i32** [[TMP4]], align 8 7833 // CHECK5-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(40) [[REF_TMP]]) 7834 // CHECK5-NEXT: ret i32 0 7835 // 7836 // 7837 // CHECK6-LABEL: define {{[^@]+}}@main 7838 // CHECK6-SAME: () #[[ATTR0:[0-9]+]] { 7839 // CHECK6-NEXT: entry: 7840 // CHECK6-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 7841 // CHECK6-NEXT: [[A:%.*]] = alloca double*, align 8 7842 // CHECK6-NEXT: [[B:%.*]] = alloca double*, align 8 7843 // CHECK6-NEXT: [[C:%.*]] = alloca double*, align 8 7844 // CHECK6-NEXT: [[N:%.*]] = alloca i32, align 4 7845 // CHECK6-NEXT: [[CH:%.*]] = alloca i32, align 4 7846 // CHECK6-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 8 7847 // CHECK6-NEXT: store i32 0, i32* [[RETVAL]], align 4 7848 // CHECK6-NEXT: store i32 10000, i32* [[N]], align 4 7849 // CHECK6-NEXT: store i32 100, i32* [[CH]], align 4 7850 // CHECK6-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 7851 // CHECK6-NEXT: store i32* [[N]], i32** [[TMP0]], align 8 7852 // CHECK6-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 7853 // CHECK6-NEXT: store double** [[A]], double*** [[TMP1]], align 8 7854 // CHECK6-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 7855 // CHECK6-NEXT: store double** [[B]], double*** [[TMP2]], align 8 7856 // CHECK6-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 7857 // CHECK6-NEXT: store double** [[C]], double*** [[TMP3]], align 8 7858 // CHECK6-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 7859 // CHECK6-NEXT: store i32* [[CH]], i32** [[TMP4]], align 8 7860 // CHECK6-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(40) [[REF_TMP]]) 7861 // CHECK6-NEXT: ret i32 0 7862 // 7863 // 7864 // CHECK7-LABEL: define {{[^@]+}}@main 7865 // CHECK7-SAME: () #[[ATTR0:[0-9]+]] { 7866 // CHECK7-NEXT: entry: 7867 // CHECK7-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 7868 // CHECK7-NEXT: [[A:%.*]] = alloca double*, align 4 7869 // CHECK7-NEXT: [[B:%.*]] = alloca double*, align 4 7870 // CHECK7-NEXT: [[C:%.*]] = alloca double*, align 4 7871 // CHECK7-NEXT: [[N:%.*]] = alloca i32, align 4 7872 // CHECK7-NEXT: [[CH:%.*]] = alloca i32, align 4 7873 // CHECK7-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 4 7874 // CHECK7-NEXT: store i32 0, i32* [[RETVAL]], align 4 7875 // CHECK7-NEXT: store i32 10000, i32* [[N]], align 4 7876 // CHECK7-NEXT: store i32 100, i32* [[CH]], align 4 7877 // CHECK7-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 7878 // CHECK7-NEXT: store i32* [[N]], i32** [[TMP0]], align 4 7879 // CHECK7-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 7880 // CHECK7-NEXT: store double** [[A]], double*** [[TMP1]], align 4 7881 // CHECK7-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 7882 // CHECK7-NEXT: store double** [[B]], double*** [[TMP2]], align 4 7883 // CHECK7-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 7884 // CHECK7-NEXT: store double** [[C]], double*** [[TMP3]], align 4 7885 // CHECK7-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 7886 // CHECK7-NEXT: store i32* [[CH]], i32** [[TMP4]], align 4 7887 // CHECK7-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(20) [[REF_TMP]]) 7888 // CHECK7-NEXT: ret i32 0 7889 // 7890 // 7891 // CHECK8-LABEL: define {{[^@]+}}@main 7892 // CHECK8-SAME: () #[[ATTR0:[0-9]+]] { 7893 // CHECK8-NEXT: entry: 7894 // CHECK8-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 7895 // CHECK8-NEXT: [[A:%.*]] = alloca double*, align 4 7896 // CHECK8-NEXT: [[B:%.*]] = alloca double*, align 4 7897 // CHECK8-NEXT: [[C:%.*]] = alloca double*, align 4 7898 // CHECK8-NEXT: [[N:%.*]] = alloca i32, align 4 7899 // CHECK8-NEXT: [[CH:%.*]] = alloca i32, align 4 7900 // CHECK8-NEXT: [[REF_TMP:%.*]] = alloca [[CLASS_ANON:%.*]], align 4 7901 // CHECK8-NEXT: store i32 0, i32* [[RETVAL]], align 4 7902 // CHECK8-NEXT: store i32 10000, i32* [[N]], align 4 7903 // CHECK8-NEXT: store i32 100, i32* [[CH]], align 4 7904 // CHECK8-NEXT: [[TMP0:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 0 7905 // CHECK8-NEXT: store i32* [[N]], i32** [[TMP0]], align 4 7906 // CHECK8-NEXT: [[TMP1:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 1 7907 // CHECK8-NEXT: store double** [[A]], double*** [[TMP1]], align 4 7908 // CHECK8-NEXT: [[TMP2:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 2 7909 // CHECK8-NEXT: store double** [[B]], double*** [[TMP2]], align 4 7910 // CHECK8-NEXT: [[TMP3:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 3 7911 // CHECK8-NEXT: store double** [[C]], double*** [[TMP3]], align 4 7912 // CHECK8-NEXT: [[TMP4:%.*]] = getelementptr inbounds [[CLASS_ANON]], %class.anon* [[REF_TMP]], i32 0, i32 4 7913 // CHECK8-NEXT: store i32* [[CH]], i32** [[TMP4]], align 4 7914 // CHECK8-NEXT: call void @"_ZZ4mainENK3$_0clEv"(%class.anon* nonnull dereferenceable(20) [[REF_TMP]]) 7915 // CHECK8-NEXT: ret i32 0 7916 // 7917 // 7918 // CHECK9-LABEL: define {{[^@]+}}@main 7919 // CHECK9-SAME: () #[[ATTR0:[0-9]+]] { 7920 // CHECK9-NEXT: entry: 7921 // CHECK9-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 7922 // CHECK9-NEXT: [[A:%.*]] = alloca double*, align 8 7923 // CHECK9-NEXT: [[B:%.*]] = alloca double*, align 8 7924 // CHECK9-NEXT: [[C:%.*]] = alloca double*, align 8 7925 // CHECK9-NEXT: [[N:%.*]] = alloca i32, align 4 7926 // CHECK9-NEXT: [[CH:%.*]] = alloca i32, align 4 7927 // CHECK9-NEXT: [[N_CASTED:%.*]] = alloca i64, align 8 7928 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 8 7929 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 8 7930 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 8 7931 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 7932 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 7933 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 7934 // CHECK9-NEXT: [[N_CASTED3:%.*]] = alloca i64, align 8 7935 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS5:%.*]] = alloca [4 x i8*], align 8 7936 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS6:%.*]] = alloca [4 x i8*], align 8 7937 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS7:%.*]] = alloca [4 x i8*], align 8 7938 // CHECK9-NEXT: [[_TMP8:%.*]] = alloca i32, align 4 7939 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 7940 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_10:%.*]] = alloca i32, align 4 7941 // CHECK9-NEXT: [[CH_CASTED:%.*]] = alloca i64, align 8 7942 // CHECK9-NEXT: [[N_CASTED18:%.*]] = alloca i64, align 8 7943 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS20:%.*]] = alloca [5 x i8*], align 8 7944 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS21:%.*]] = alloca [5 x i8*], align 8 7945 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS22:%.*]] = alloca [5 x i8*], align 8 7946 // CHECK9-NEXT: [[_TMP23:%.*]] = alloca i32, align 4 7947 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_24:%.*]] = alloca i32, align 4 7948 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_25:%.*]] = alloca i32, align 4 7949 // CHECK9-NEXT: [[N_CASTED32:%.*]] = alloca i64, align 8 7950 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS34:%.*]] = alloca [4 x i8*], align 8 7951 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS35:%.*]] = alloca [4 x i8*], align 8 7952 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS36:%.*]] = alloca [4 x i8*], align 8 7953 // CHECK9-NEXT: [[_TMP37:%.*]] = alloca i32, align 4 7954 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_38:%.*]] = alloca i32, align 4 7955 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_39:%.*]] = alloca i32, align 4 7956 // CHECK9-NEXT: [[CH_CASTED46:%.*]] = alloca i64, align 8 7957 // CHECK9-NEXT: [[N_CASTED48:%.*]] = alloca i64, align 8 7958 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS50:%.*]] = alloca [5 x i8*], align 8 7959 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS51:%.*]] = alloca [5 x i8*], align 8 7960 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS52:%.*]] = alloca [5 x i8*], align 8 7961 // CHECK9-NEXT: [[_TMP53:%.*]] = alloca i32, align 4 7962 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_54:%.*]] = alloca i32, align 4 7963 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_55:%.*]] = alloca i32, align 4 7964 // CHECK9-NEXT: [[N_CASTED62:%.*]] = alloca i64, align 8 7965 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS64:%.*]] = alloca [4 x i8*], align 8 7966 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS65:%.*]] = alloca [4 x i8*], align 8 7967 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS66:%.*]] = alloca [4 x i8*], align 8 7968 // CHECK9-NEXT: [[_TMP67:%.*]] = alloca i32, align 4 7969 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_68:%.*]] = alloca i32, align 4 7970 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_69:%.*]] = alloca i32, align 4 7971 // CHECK9-NEXT: [[CH_CASTED76:%.*]] = alloca i64, align 8 7972 // CHECK9-NEXT: [[N_CASTED78:%.*]] = alloca i64, align 8 7973 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS80:%.*]] = alloca [5 x i8*], align 8 7974 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS81:%.*]] = alloca [5 x i8*], align 8 7975 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS82:%.*]] = alloca [5 x i8*], align 8 7976 // CHECK9-NEXT: [[_TMP83:%.*]] = alloca i32, align 4 7977 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_84:%.*]] = alloca i32, align 4 7978 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_85:%.*]] = alloca i32, align 4 7979 // CHECK9-NEXT: store i32 0, i32* [[RETVAL]], align 4 7980 // CHECK9-NEXT: store i32 10000, i32* [[N]], align 4 7981 // CHECK9-NEXT: store i32 100, i32* [[CH]], align 4 7982 // CHECK9-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 7983 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_CASTED]] to i32* 7984 // CHECK9-NEXT: store i32 [[TMP0]], i32* [[CONV]], align 4 7985 // CHECK9-NEXT: [[TMP1:%.*]] = load i64, i64* [[N_CASTED]], align 8 7986 // CHECK9-NEXT: [[TMP2:%.*]] = load double*, double** [[A]], align 8 7987 // CHECK9-NEXT: [[TMP3:%.*]] = load double*, double** [[B]], align 8 7988 // CHECK9-NEXT: [[TMP4:%.*]] = load double*, double** [[C]], align 8 7989 // CHECK9-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 7990 // CHECK9-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i64* 7991 // CHECK9-NEXT: store i64 [[TMP1]], i64* [[TMP6]], align 8 7992 // CHECK9-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 7993 // CHECK9-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i64* 7994 // CHECK9-NEXT: store i64 [[TMP1]], i64* [[TMP8]], align 8 7995 // CHECK9-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0 7996 // CHECK9-NEXT: store i8* null, i8** [[TMP9]], align 8 7997 // CHECK9-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 7998 // CHECK9-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to double** 7999 // CHECK9-NEXT: store double* [[TMP2]], double** [[TMP11]], align 8 8000 // CHECK9-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 8001 // CHECK9-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to double** 8002 // CHECK9-NEXT: store double* [[TMP2]], double** [[TMP13]], align 8 8003 // CHECK9-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 1 8004 // CHECK9-NEXT: store i8* null, i8** [[TMP14]], align 8 8005 // CHECK9-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 8006 // CHECK9-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to double** 8007 // CHECK9-NEXT: store double* [[TMP3]], double** [[TMP16]], align 8 8008 // CHECK9-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 8009 // CHECK9-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to double** 8010 // CHECK9-NEXT: store double* [[TMP3]], double** [[TMP18]], align 8 8011 // CHECK9-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 2 8012 // CHECK9-NEXT: store i8* null, i8** [[TMP19]], align 8 8013 // CHECK9-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 8014 // CHECK9-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to double** 8015 // CHECK9-NEXT: store double* [[TMP4]], double** [[TMP21]], align 8 8016 // CHECK9-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 8017 // CHECK9-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to double** 8018 // CHECK9-NEXT: store double* [[TMP4]], double** [[TMP23]], align 8 8019 // CHECK9-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 3 8020 // CHECK9-NEXT: store i8* null, i8** [[TMP24]], align 8 8021 // CHECK9-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 8022 // CHECK9-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 8023 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 8024 // CHECK9-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 8025 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8026 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 8027 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8028 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8029 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8030 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8031 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 8032 // CHECK9-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 8033 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3:[0-9]+]], i64 -1, i64 [[TMP30]]) 8034 // CHECK9-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8035 // CHECK9-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 8036 // CHECK9-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 8037 // CHECK9: omp_offload.failed: 8038 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369(i64 [[TMP1]], double* [[TMP2]], double* [[TMP3]], double* [[TMP4]]) #[[ATTR2:[0-9]+]] 8039 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT]] 8040 // CHECK9: omp_offload.cont: 8041 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 8042 // CHECK9-NEXT: [[CONV4:%.*]] = bitcast i64* [[N_CASTED3]] to i32* 8043 // CHECK9-NEXT: store i32 [[TMP33]], i32* [[CONV4]], align 4 8044 // CHECK9-NEXT: [[TMP34:%.*]] = load i64, i64* [[N_CASTED3]], align 8 8045 // CHECK9-NEXT: [[TMP35:%.*]] = load double*, double** [[A]], align 8 8046 // CHECK9-NEXT: [[TMP36:%.*]] = load double*, double** [[B]], align 8 8047 // CHECK9-NEXT: [[TMP37:%.*]] = load double*, double** [[C]], align 8 8048 // CHECK9-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 8049 // CHECK9-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i64* 8050 // CHECK9-NEXT: store i64 [[TMP34]], i64* [[TMP39]], align 8 8051 // CHECK9-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 8052 // CHECK9-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i64* 8053 // CHECK9-NEXT: store i64 [[TMP34]], i64* [[TMP41]], align 8 8054 // CHECK9-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 0 8055 // CHECK9-NEXT: store i8* null, i8** [[TMP42]], align 8 8056 // CHECK9-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 1 8057 // CHECK9-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to double** 8058 // CHECK9-NEXT: store double* [[TMP35]], double** [[TMP44]], align 8 8059 // CHECK9-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 1 8060 // CHECK9-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to double** 8061 // CHECK9-NEXT: store double* [[TMP35]], double** [[TMP46]], align 8 8062 // CHECK9-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 1 8063 // CHECK9-NEXT: store i8* null, i8** [[TMP47]], align 8 8064 // CHECK9-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 2 8065 // CHECK9-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to double** 8066 // CHECK9-NEXT: store double* [[TMP36]], double** [[TMP49]], align 8 8067 // CHECK9-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 2 8068 // CHECK9-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to double** 8069 // CHECK9-NEXT: store double* [[TMP36]], double** [[TMP51]], align 8 8070 // CHECK9-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 2 8071 // CHECK9-NEXT: store i8* null, i8** [[TMP52]], align 8 8072 // CHECK9-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 3 8073 // CHECK9-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to double** 8074 // CHECK9-NEXT: store double* [[TMP37]], double** [[TMP54]], align 8 8075 // CHECK9-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 3 8076 // CHECK9-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to double** 8077 // CHECK9-NEXT: store double* [[TMP37]], double** [[TMP56]], align 8 8078 // CHECK9-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 3 8079 // CHECK9-NEXT: store i8* null, i8** [[TMP57]], align 8 8080 // CHECK9-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 8081 // CHECK9-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 8082 // CHECK9-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 8083 // CHECK9-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_9]], align 4 8084 // CHECK9-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 8085 // CHECK9-NEXT: [[SUB11:%.*]] = sub nsw i32 [[TMP61]], 0 8086 // CHECK9-NEXT: [[DIV12:%.*]] = sdiv i32 [[SUB11]], 1 8087 // CHECK9-NEXT: [[SUB13:%.*]] = sub nsw i32 [[DIV12]], 1 8088 // CHECK9-NEXT: store i32 [[SUB13]], i32* [[DOTCAPTURE_EXPR_10]], align 4 8089 // CHECK9-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_10]], align 4 8090 // CHECK9-NEXT: [[ADD14:%.*]] = add nsw i32 [[TMP62]], 1 8091 // CHECK9-NEXT: [[TMP63:%.*]] = zext i32 [[ADD14]] to i64 8092 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 8093 // CHECK9-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.4, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.5, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8094 // CHECK9-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 8095 // CHECK9-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED15:%.*]], label [[OMP_OFFLOAD_CONT16:%.*]] 8096 // CHECK9: omp_offload.failed15: 8097 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408(i64 [[TMP34]], double* [[TMP35]], double* [[TMP36]], double* [[TMP37]]) #[[ATTR2]] 8098 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT16]] 8099 // CHECK9: omp_offload.cont16: 8100 // CHECK9-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 8101 // CHECK9-NEXT: [[CONV17:%.*]] = bitcast i64* [[CH_CASTED]] to i32* 8102 // CHECK9-NEXT: store i32 [[TMP66]], i32* [[CONV17]], align 4 8103 // CHECK9-NEXT: [[TMP67:%.*]] = load i64, i64* [[CH_CASTED]], align 8 8104 // CHECK9-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 8105 // CHECK9-NEXT: [[CONV19:%.*]] = bitcast i64* [[N_CASTED18]] to i32* 8106 // CHECK9-NEXT: store i32 [[TMP68]], i32* [[CONV19]], align 4 8107 // CHECK9-NEXT: [[TMP69:%.*]] = load i64, i64* [[N_CASTED18]], align 8 8108 // CHECK9-NEXT: [[TMP70:%.*]] = load double*, double** [[A]], align 8 8109 // CHECK9-NEXT: [[TMP71:%.*]] = load double*, double** [[B]], align 8 8110 // CHECK9-NEXT: [[TMP72:%.*]] = load double*, double** [[C]], align 8 8111 // CHECK9-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 8112 // CHECK9-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i64* 8113 // CHECK9-NEXT: store i64 [[TMP67]], i64* [[TMP74]], align 8 8114 // CHECK9-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 8115 // CHECK9-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i64* 8116 // CHECK9-NEXT: store i64 [[TMP67]], i64* [[TMP76]], align 8 8117 // CHECK9-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 0 8118 // CHECK9-NEXT: store i8* null, i8** [[TMP77]], align 8 8119 // CHECK9-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 1 8120 // CHECK9-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i64* 8121 // CHECK9-NEXT: store i64 [[TMP69]], i64* [[TMP79]], align 8 8122 // CHECK9-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 1 8123 // CHECK9-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i64* 8124 // CHECK9-NEXT: store i64 [[TMP69]], i64* [[TMP81]], align 8 8125 // CHECK9-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 1 8126 // CHECK9-NEXT: store i8* null, i8** [[TMP82]], align 8 8127 // CHECK9-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 2 8128 // CHECK9-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to double** 8129 // CHECK9-NEXT: store double* [[TMP70]], double** [[TMP84]], align 8 8130 // CHECK9-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 2 8131 // CHECK9-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to double** 8132 // CHECK9-NEXT: store double* [[TMP70]], double** [[TMP86]], align 8 8133 // CHECK9-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 2 8134 // CHECK9-NEXT: store i8* null, i8** [[TMP87]], align 8 8135 // CHECK9-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 3 8136 // CHECK9-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to double** 8137 // CHECK9-NEXT: store double* [[TMP71]], double** [[TMP89]], align 8 8138 // CHECK9-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 3 8139 // CHECK9-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to double** 8140 // CHECK9-NEXT: store double* [[TMP71]], double** [[TMP91]], align 8 8141 // CHECK9-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 3 8142 // CHECK9-NEXT: store i8* null, i8** [[TMP92]], align 8 8143 // CHECK9-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 4 8144 // CHECK9-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to double** 8145 // CHECK9-NEXT: store double* [[TMP72]], double** [[TMP94]], align 8 8146 // CHECK9-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 4 8147 // CHECK9-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to double** 8148 // CHECK9-NEXT: store double* [[TMP72]], double** [[TMP96]], align 8 8149 // CHECK9-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 4 8150 // CHECK9-NEXT: store i8* null, i8** [[TMP97]], align 8 8151 // CHECK9-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 8152 // CHECK9-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 8153 // CHECK9-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 8154 // CHECK9-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_24]], align 4 8155 // CHECK9-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_24]], align 4 8156 // CHECK9-NEXT: [[SUB26:%.*]] = sub nsw i32 [[TMP101]], 0 8157 // CHECK9-NEXT: [[DIV27:%.*]] = sdiv i32 [[SUB26]], 1 8158 // CHECK9-NEXT: [[SUB28:%.*]] = sub nsw i32 [[DIV27]], 1 8159 // CHECK9-NEXT: store i32 [[SUB28]], i32* [[DOTCAPTURE_EXPR_25]], align 4 8160 // CHECK9-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_25]], align 4 8161 // CHECK9-NEXT: [[ADD29:%.*]] = add nsw i32 [[TMP102]], 1 8162 // CHECK9-NEXT: [[TMP103:%.*]] = zext i32 [[ADD29]] to i64 8163 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 8164 // CHECK9-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.8, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.9, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8165 // CHECK9-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 8166 // CHECK9-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED30:%.*]], label [[OMP_OFFLOAD_CONT31:%.*]] 8167 // CHECK9: omp_offload.failed30: 8168 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447(i64 [[TMP67]], i64 [[TMP69]], double* [[TMP70]], double* [[TMP71]], double* [[TMP72]]) #[[ATTR2]] 8169 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT31]] 8170 // CHECK9: omp_offload.cont31: 8171 // CHECK9-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 8172 // CHECK9-NEXT: [[CONV33:%.*]] = bitcast i64* [[N_CASTED32]] to i32* 8173 // CHECK9-NEXT: store i32 [[TMP106]], i32* [[CONV33]], align 4 8174 // CHECK9-NEXT: [[TMP107:%.*]] = load i64, i64* [[N_CASTED32]], align 8 8175 // CHECK9-NEXT: [[TMP108:%.*]] = load double*, double** [[A]], align 8 8176 // CHECK9-NEXT: [[TMP109:%.*]] = load double*, double** [[B]], align 8 8177 // CHECK9-NEXT: [[TMP110:%.*]] = load double*, double** [[C]], align 8 8178 // CHECK9-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 8179 // CHECK9-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i64* 8180 // CHECK9-NEXT: store i64 [[TMP107]], i64* [[TMP112]], align 8 8181 // CHECK9-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 8182 // CHECK9-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i64* 8183 // CHECK9-NEXT: store i64 [[TMP107]], i64* [[TMP114]], align 8 8184 // CHECK9-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 0 8185 // CHECK9-NEXT: store i8* null, i8** [[TMP115]], align 8 8186 // CHECK9-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 1 8187 // CHECK9-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to double** 8188 // CHECK9-NEXT: store double* [[TMP108]], double** [[TMP117]], align 8 8189 // CHECK9-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 1 8190 // CHECK9-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to double** 8191 // CHECK9-NEXT: store double* [[TMP108]], double** [[TMP119]], align 8 8192 // CHECK9-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 1 8193 // CHECK9-NEXT: store i8* null, i8** [[TMP120]], align 8 8194 // CHECK9-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 2 8195 // CHECK9-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to double** 8196 // CHECK9-NEXT: store double* [[TMP109]], double** [[TMP122]], align 8 8197 // CHECK9-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 2 8198 // CHECK9-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to double** 8199 // CHECK9-NEXT: store double* [[TMP109]], double** [[TMP124]], align 8 8200 // CHECK9-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 2 8201 // CHECK9-NEXT: store i8* null, i8** [[TMP125]], align 8 8202 // CHECK9-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 3 8203 // CHECK9-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to double** 8204 // CHECK9-NEXT: store double* [[TMP110]], double** [[TMP127]], align 8 8205 // CHECK9-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 3 8206 // CHECK9-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to double** 8207 // CHECK9-NEXT: store double* [[TMP110]], double** [[TMP129]], align 8 8208 // CHECK9-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 3 8209 // CHECK9-NEXT: store i8* null, i8** [[TMP130]], align 8 8210 // CHECK9-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 8211 // CHECK9-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 8212 // CHECK9-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 8213 // CHECK9-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_38]], align 4 8214 // CHECK9-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_38]], align 4 8215 // CHECK9-NEXT: [[SUB40:%.*]] = sub nsw i32 [[TMP134]], 0 8216 // CHECK9-NEXT: [[DIV41:%.*]] = sdiv i32 [[SUB40]], 1 8217 // CHECK9-NEXT: [[SUB42:%.*]] = sub nsw i32 [[DIV41]], 1 8218 // CHECK9-NEXT: store i32 [[SUB42]], i32* [[DOTCAPTURE_EXPR_39]], align 4 8219 // CHECK9-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_39]], align 4 8220 // CHECK9-NEXT: [[ADD43:%.*]] = add nsw i32 [[TMP135]], 1 8221 // CHECK9-NEXT: [[TMP136:%.*]] = zext i32 [[ADD43]] to i64 8222 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 8223 // CHECK9-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.12, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.13, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8224 // CHECK9-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 8225 // CHECK9-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED44:%.*]], label [[OMP_OFFLOAD_CONT45:%.*]] 8226 // CHECK9: omp_offload.failed44: 8227 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478(i64 [[TMP107]], double* [[TMP108]], double* [[TMP109]], double* [[TMP110]]) #[[ATTR2]] 8228 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT45]] 8229 // CHECK9: omp_offload.cont45: 8230 // CHECK9-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 8231 // CHECK9-NEXT: [[CONV47:%.*]] = bitcast i64* [[CH_CASTED46]] to i32* 8232 // CHECK9-NEXT: store i32 [[TMP139]], i32* [[CONV47]], align 4 8233 // CHECK9-NEXT: [[TMP140:%.*]] = load i64, i64* [[CH_CASTED46]], align 8 8234 // CHECK9-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 8235 // CHECK9-NEXT: [[CONV49:%.*]] = bitcast i64* [[N_CASTED48]] to i32* 8236 // CHECK9-NEXT: store i32 [[TMP141]], i32* [[CONV49]], align 4 8237 // CHECK9-NEXT: [[TMP142:%.*]] = load i64, i64* [[N_CASTED48]], align 8 8238 // CHECK9-NEXT: [[TMP143:%.*]] = load double*, double** [[A]], align 8 8239 // CHECK9-NEXT: [[TMP144:%.*]] = load double*, double** [[B]], align 8 8240 // CHECK9-NEXT: [[TMP145:%.*]] = load double*, double** [[C]], align 8 8241 // CHECK9-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 8242 // CHECK9-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i64* 8243 // CHECK9-NEXT: store i64 [[TMP140]], i64* [[TMP147]], align 8 8244 // CHECK9-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 8245 // CHECK9-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i64* 8246 // CHECK9-NEXT: store i64 [[TMP140]], i64* [[TMP149]], align 8 8247 // CHECK9-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 0 8248 // CHECK9-NEXT: store i8* null, i8** [[TMP150]], align 8 8249 // CHECK9-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 1 8250 // CHECK9-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i64* 8251 // CHECK9-NEXT: store i64 [[TMP142]], i64* [[TMP152]], align 8 8252 // CHECK9-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 1 8253 // CHECK9-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i64* 8254 // CHECK9-NEXT: store i64 [[TMP142]], i64* [[TMP154]], align 8 8255 // CHECK9-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 1 8256 // CHECK9-NEXT: store i8* null, i8** [[TMP155]], align 8 8257 // CHECK9-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 2 8258 // CHECK9-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to double** 8259 // CHECK9-NEXT: store double* [[TMP143]], double** [[TMP157]], align 8 8260 // CHECK9-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 2 8261 // CHECK9-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to double** 8262 // CHECK9-NEXT: store double* [[TMP143]], double** [[TMP159]], align 8 8263 // CHECK9-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 2 8264 // CHECK9-NEXT: store i8* null, i8** [[TMP160]], align 8 8265 // CHECK9-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 3 8266 // CHECK9-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to double** 8267 // CHECK9-NEXT: store double* [[TMP144]], double** [[TMP162]], align 8 8268 // CHECK9-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 3 8269 // CHECK9-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to double** 8270 // CHECK9-NEXT: store double* [[TMP144]], double** [[TMP164]], align 8 8271 // CHECK9-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 3 8272 // CHECK9-NEXT: store i8* null, i8** [[TMP165]], align 8 8273 // CHECK9-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 4 8274 // CHECK9-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to double** 8275 // CHECK9-NEXT: store double* [[TMP145]], double** [[TMP167]], align 8 8276 // CHECK9-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 4 8277 // CHECK9-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to double** 8278 // CHECK9-NEXT: store double* [[TMP145]], double** [[TMP169]], align 8 8279 // CHECK9-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 4 8280 // CHECK9-NEXT: store i8* null, i8** [[TMP170]], align 8 8281 // CHECK9-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 8282 // CHECK9-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 8283 // CHECK9-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 8284 // CHECK9-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_54]], align 4 8285 // CHECK9-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_54]], align 4 8286 // CHECK9-NEXT: [[SUB56:%.*]] = sub nsw i32 [[TMP174]], 0 8287 // CHECK9-NEXT: [[DIV57:%.*]] = sdiv i32 [[SUB56]], 1 8288 // CHECK9-NEXT: [[SUB58:%.*]] = sub nsw i32 [[DIV57]], 1 8289 // CHECK9-NEXT: store i32 [[SUB58]], i32* [[DOTCAPTURE_EXPR_55]], align 4 8290 // CHECK9-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_55]], align 4 8291 // CHECK9-NEXT: [[ADD59:%.*]] = add nsw i32 [[TMP175]], 1 8292 // CHECK9-NEXT: [[TMP176:%.*]] = zext i32 [[ADD59]] to i64 8293 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 8294 // CHECK9-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.16, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.17, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8295 // CHECK9-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 8296 // CHECK9-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED60:%.*]], label [[OMP_OFFLOAD_CONT61:%.*]] 8297 // CHECK9: omp_offload.failed60: 8298 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506(i64 [[TMP140]], i64 [[TMP142]], double* [[TMP143]], double* [[TMP144]], double* [[TMP145]]) #[[ATTR2]] 8299 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT61]] 8300 // CHECK9: omp_offload.cont61: 8301 // CHECK9-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 8302 // CHECK9-NEXT: [[CONV63:%.*]] = bitcast i64* [[N_CASTED62]] to i32* 8303 // CHECK9-NEXT: store i32 [[TMP179]], i32* [[CONV63]], align 4 8304 // CHECK9-NEXT: [[TMP180:%.*]] = load i64, i64* [[N_CASTED62]], align 8 8305 // CHECK9-NEXT: [[TMP181:%.*]] = load double*, double** [[A]], align 8 8306 // CHECK9-NEXT: [[TMP182:%.*]] = load double*, double** [[B]], align 8 8307 // CHECK9-NEXT: [[TMP183:%.*]] = load double*, double** [[C]], align 8 8308 // CHECK9-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 8309 // CHECK9-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i64* 8310 // CHECK9-NEXT: store i64 [[TMP180]], i64* [[TMP185]], align 8 8311 // CHECK9-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 8312 // CHECK9-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i64* 8313 // CHECK9-NEXT: store i64 [[TMP180]], i64* [[TMP187]], align 8 8314 // CHECK9-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 0 8315 // CHECK9-NEXT: store i8* null, i8** [[TMP188]], align 8 8316 // CHECK9-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 1 8317 // CHECK9-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to double** 8318 // CHECK9-NEXT: store double* [[TMP181]], double** [[TMP190]], align 8 8319 // CHECK9-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 1 8320 // CHECK9-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to double** 8321 // CHECK9-NEXT: store double* [[TMP181]], double** [[TMP192]], align 8 8322 // CHECK9-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 1 8323 // CHECK9-NEXT: store i8* null, i8** [[TMP193]], align 8 8324 // CHECK9-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 2 8325 // CHECK9-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to double** 8326 // CHECK9-NEXT: store double* [[TMP182]], double** [[TMP195]], align 8 8327 // CHECK9-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 2 8328 // CHECK9-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to double** 8329 // CHECK9-NEXT: store double* [[TMP182]], double** [[TMP197]], align 8 8330 // CHECK9-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 2 8331 // CHECK9-NEXT: store i8* null, i8** [[TMP198]], align 8 8332 // CHECK9-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 3 8333 // CHECK9-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to double** 8334 // CHECK9-NEXT: store double* [[TMP183]], double** [[TMP200]], align 8 8335 // CHECK9-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 3 8336 // CHECK9-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to double** 8337 // CHECK9-NEXT: store double* [[TMP183]], double** [[TMP202]], align 8 8338 // CHECK9-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 3 8339 // CHECK9-NEXT: store i8* null, i8** [[TMP203]], align 8 8340 // CHECK9-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 8341 // CHECK9-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 8342 // CHECK9-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 8343 // CHECK9-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_68]], align 4 8344 // CHECK9-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_68]], align 4 8345 // CHECK9-NEXT: [[SUB70:%.*]] = sub nsw i32 [[TMP207]], 0 8346 // CHECK9-NEXT: [[DIV71:%.*]] = sdiv i32 [[SUB70]], 1 8347 // CHECK9-NEXT: [[SUB72:%.*]] = sub nsw i32 [[DIV71]], 1 8348 // CHECK9-NEXT: store i32 [[SUB72]], i32* [[DOTCAPTURE_EXPR_69]], align 4 8349 // CHECK9-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_69]], align 4 8350 // CHECK9-NEXT: [[ADD73:%.*]] = add nsw i32 [[TMP208]], 1 8351 // CHECK9-NEXT: [[TMP209:%.*]] = zext i32 [[ADD73]] to i64 8352 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 8353 // CHECK9-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.20, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.21, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8354 // CHECK9-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 8355 // CHECK9-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED74:%.*]], label [[OMP_OFFLOAD_CONT75:%.*]] 8356 // CHECK9: omp_offload.failed74: 8357 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536(i64 [[TMP180]], double* [[TMP181]], double* [[TMP182]], double* [[TMP183]]) #[[ATTR2]] 8358 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT75]] 8359 // CHECK9: omp_offload.cont75: 8360 // CHECK9-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 8361 // CHECK9-NEXT: [[CONV77:%.*]] = bitcast i64* [[CH_CASTED76]] to i32* 8362 // CHECK9-NEXT: store i32 [[TMP212]], i32* [[CONV77]], align 4 8363 // CHECK9-NEXT: [[TMP213:%.*]] = load i64, i64* [[CH_CASTED76]], align 8 8364 // CHECK9-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 8365 // CHECK9-NEXT: [[CONV79:%.*]] = bitcast i64* [[N_CASTED78]] to i32* 8366 // CHECK9-NEXT: store i32 [[TMP214]], i32* [[CONV79]], align 4 8367 // CHECK9-NEXT: [[TMP215:%.*]] = load i64, i64* [[N_CASTED78]], align 8 8368 // CHECK9-NEXT: [[TMP216:%.*]] = load double*, double** [[A]], align 8 8369 // CHECK9-NEXT: [[TMP217:%.*]] = load double*, double** [[B]], align 8 8370 // CHECK9-NEXT: [[TMP218:%.*]] = load double*, double** [[C]], align 8 8371 // CHECK9-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 8372 // CHECK9-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i64* 8373 // CHECK9-NEXT: store i64 [[TMP213]], i64* [[TMP220]], align 8 8374 // CHECK9-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 8375 // CHECK9-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i64* 8376 // CHECK9-NEXT: store i64 [[TMP213]], i64* [[TMP222]], align 8 8377 // CHECK9-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 0 8378 // CHECK9-NEXT: store i8* null, i8** [[TMP223]], align 8 8379 // CHECK9-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 1 8380 // CHECK9-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i64* 8381 // CHECK9-NEXT: store i64 [[TMP215]], i64* [[TMP225]], align 8 8382 // CHECK9-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 1 8383 // CHECK9-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i64* 8384 // CHECK9-NEXT: store i64 [[TMP215]], i64* [[TMP227]], align 8 8385 // CHECK9-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 1 8386 // CHECK9-NEXT: store i8* null, i8** [[TMP228]], align 8 8387 // CHECK9-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 2 8388 // CHECK9-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to double** 8389 // CHECK9-NEXT: store double* [[TMP216]], double** [[TMP230]], align 8 8390 // CHECK9-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 2 8391 // CHECK9-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to double** 8392 // CHECK9-NEXT: store double* [[TMP216]], double** [[TMP232]], align 8 8393 // CHECK9-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 2 8394 // CHECK9-NEXT: store i8* null, i8** [[TMP233]], align 8 8395 // CHECK9-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 3 8396 // CHECK9-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to double** 8397 // CHECK9-NEXT: store double* [[TMP217]], double** [[TMP235]], align 8 8398 // CHECK9-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 3 8399 // CHECK9-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to double** 8400 // CHECK9-NEXT: store double* [[TMP217]], double** [[TMP237]], align 8 8401 // CHECK9-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 3 8402 // CHECK9-NEXT: store i8* null, i8** [[TMP238]], align 8 8403 // CHECK9-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 4 8404 // CHECK9-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to double** 8405 // CHECK9-NEXT: store double* [[TMP218]], double** [[TMP240]], align 8 8406 // CHECK9-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 4 8407 // CHECK9-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to double** 8408 // CHECK9-NEXT: store double* [[TMP218]], double** [[TMP242]], align 8 8409 // CHECK9-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 4 8410 // CHECK9-NEXT: store i8* null, i8** [[TMP243]], align 8 8411 // CHECK9-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 8412 // CHECK9-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 8413 // CHECK9-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 8414 // CHECK9-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_84]], align 4 8415 // CHECK9-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_84]], align 4 8416 // CHECK9-NEXT: [[SUB86:%.*]] = sub nsw i32 [[TMP247]], 0 8417 // CHECK9-NEXT: [[DIV87:%.*]] = sdiv i32 [[SUB86]], 1 8418 // CHECK9-NEXT: [[SUB88:%.*]] = sub nsw i32 [[DIV87]], 1 8419 // CHECK9-NEXT: store i32 [[SUB88]], i32* [[DOTCAPTURE_EXPR_85]], align 4 8420 // CHECK9-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_85]], align 4 8421 // CHECK9-NEXT: [[ADD89:%.*]] = add nsw i32 [[TMP248]], 1 8422 // CHECK9-NEXT: [[TMP249:%.*]] = zext i32 [[ADD89]] to i64 8423 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 8424 // CHECK9-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.24, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.25, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 8425 // CHECK9-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 8426 // CHECK9-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED90:%.*]], label [[OMP_OFFLOAD_CONT91:%.*]] 8427 // CHECK9: omp_offload.failed90: 8428 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562(i64 [[TMP213]], i64 [[TMP215]], double* [[TMP216]], double* [[TMP217]], double* [[TMP218]]) #[[ATTR2]] 8429 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT91]] 8430 // CHECK9: omp_offload.cont91: 8431 // CHECK9-NEXT: [[CALL:%.*]] = call signext i32 @_Z5tmainIiET_v() 8432 // CHECK9-NEXT: ret i32 [[CALL]] 8433 // 8434 // 8435 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369 8436 // CHECK9-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1:[0-9]+]] { 8437 // CHECK9-NEXT: entry: 8438 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 8439 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 8440 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 8441 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 8442 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 8443 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 8444 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 8445 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 8446 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 8447 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 8448 // CHECK9-NEXT: ret void 8449 // 8450 // 8451 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined. 8452 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 8453 // CHECK9-NEXT: entry: 8454 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 8455 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 8456 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 8457 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 8458 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 8459 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 8460 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 8461 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 8462 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 8463 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 8464 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 8465 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 8466 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 8467 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 8468 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 8469 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 8470 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 8471 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 8472 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 8473 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 8474 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 8475 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 8476 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 8477 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 8478 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 8479 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 8480 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 8481 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 8482 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8483 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 8484 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8485 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8486 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8487 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 8488 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8489 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 8490 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 8491 // CHECK9: omp.precond.then: 8492 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 8493 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8494 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 8495 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 8496 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 8497 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8498 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 8499 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 8500 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8501 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8502 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 8503 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 8504 // CHECK9: cond.true: 8505 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8506 // CHECK9-NEXT: br label [[COND_END:%.*]] 8507 // CHECK9: cond.false: 8508 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8509 // CHECK9-NEXT: br label [[COND_END]] 8510 // CHECK9: cond.end: 8511 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 8512 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 8513 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8514 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 8515 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 8516 // CHECK9: omp.inner.for.cond: 8517 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8518 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8519 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 8520 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 8521 // CHECK9: omp.inner.for.body: 8522 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8523 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 8524 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8525 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 8526 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 8527 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 8528 // CHECK9: omp.inner.for.inc: 8529 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8530 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 8531 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 8532 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 8533 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 8534 // CHECK9: omp.inner.for.end: 8535 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 8536 // CHECK9: omp.loop.exit: 8537 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8538 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 8539 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 8540 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 8541 // CHECK9: omp.precond.end: 8542 // CHECK9-NEXT: ret void 8543 // 8544 // 8545 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..1 8546 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 8547 // CHECK9-NEXT: entry: 8548 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 8549 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 8550 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 8551 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 8552 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 8553 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 8554 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 8555 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 8556 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 8557 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 8558 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 8559 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 8560 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 8561 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 8562 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 8563 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 8564 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 8565 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 8566 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 8567 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 8568 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 8569 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 8570 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 8571 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 8572 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 8573 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 8574 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 8575 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 8576 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 8577 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 8578 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 8579 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 8580 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8581 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 8582 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8583 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8584 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8585 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 8586 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8587 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 8588 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 8589 // CHECK9: omp.precond.then: 8590 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 8591 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8592 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 8593 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 8594 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 8595 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 8596 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 8597 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 8598 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 8599 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 8600 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 8601 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8602 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 8603 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 8604 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8605 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8606 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 8607 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 8608 // CHECK9: cond.true: 8609 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8610 // CHECK9-NEXT: br label [[COND_END:%.*]] 8611 // CHECK9: cond.false: 8612 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8613 // CHECK9-NEXT: br label [[COND_END]] 8614 // CHECK9: cond.end: 8615 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 8616 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 8617 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 8618 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 8619 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 8620 // CHECK9: omp.inner.for.cond: 8621 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8622 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8623 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 8624 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 8625 // CHECK9: omp.inner.for.body: 8626 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8627 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 8628 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 8629 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 8630 // CHECK9-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 8631 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 8632 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 8633 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 8634 // CHECK9-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 8635 // CHECK9-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 8636 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 8637 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 8638 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 8639 // CHECK9-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 8640 // CHECK9-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 8641 // CHECK9-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 8642 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 8643 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 8644 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 8645 // CHECK9-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 8646 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 8647 // CHECK9: omp.body.continue: 8648 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 8649 // CHECK9: omp.inner.for.inc: 8650 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8651 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 8652 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 8653 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 8654 // CHECK9: omp.inner.for.end: 8655 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 8656 // CHECK9: omp.loop.exit: 8657 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8658 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 8659 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 8660 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 8661 // CHECK9: omp.precond.end: 8662 // CHECK9-NEXT: ret void 8663 // 8664 // 8665 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408 8666 // CHECK9-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 8667 // CHECK9-NEXT: entry: 8668 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 8669 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 8670 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 8671 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 8672 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 8673 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 8674 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 8675 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 8676 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 8677 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 8678 // CHECK9-NEXT: ret void 8679 // 8680 // 8681 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..2 8682 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 8683 // CHECK9-NEXT: entry: 8684 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 8685 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 8686 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 8687 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 8688 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 8689 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 8690 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 8691 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 8692 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 8693 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 8694 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 8695 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 8696 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 8697 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 8698 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 8699 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 8700 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 8701 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 8702 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 8703 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 8704 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 8705 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 8706 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 8707 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 8708 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 8709 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 8710 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 8711 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 8712 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8713 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 8714 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8715 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8716 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8717 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 8718 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8719 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 8720 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 8721 // CHECK9: omp.precond.then: 8722 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 8723 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8724 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 8725 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 8726 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 8727 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8728 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 8729 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 8730 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8731 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8732 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 8733 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 8734 // CHECK9: cond.true: 8735 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8736 // CHECK9-NEXT: br label [[COND_END:%.*]] 8737 // CHECK9: cond.false: 8738 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8739 // CHECK9-NEXT: br label [[COND_END]] 8740 // CHECK9: cond.end: 8741 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 8742 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 8743 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8744 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 8745 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 8746 // CHECK9: omp.inner.for.cond: 8747 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8748 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8749 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 8750 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 8751 // CHECK9: omp.inner.for.body: 8752 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8753 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 8754 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8755 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 8756 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 8757 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 8758 // CHECK9: omp.inner.for.inc: 8759 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8760 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 8761 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 8762 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 8763 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 8764 // CHECK9: omp.inner.for.end: 8765 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 8766 // CHECK9: omp.loop.exit: 8767 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8768 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 8769 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 8770 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 8771 // CHECK9: omp.precond.end: 8772 // CHECK9-NEXT: ret void 8773 // 8774 // 8775 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..3 8776 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 8777 // CHECK9-NEXT: entry: 8778 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 8779 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 8780 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 8781 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 8782 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 8783 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 8784 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 8785 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 8786 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 8787 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 8788 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 8789 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 8790 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 8791 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 8792 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 8793 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 8794 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 8795 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 8796 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 8797 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 8798 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 8799 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 8800 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 8801 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 8802 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 8803 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 8804 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 8805 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 8806 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 8807 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 8808 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 8809 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 8810 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8811 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 8812 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8813 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8814 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8815 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 8816 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8817 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 8818 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 8819 // CHECK9: omp.precond.then: 8820 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 8821 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8822 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 8823 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 8824 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 8825 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 8826 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 8827 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 8828 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 8829 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 8830 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 8831 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8832 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 8833 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 8834 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8835 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8836 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 8837 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 8838 // CHECK9: cond.true: 8839 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8840 // CHECK9-NEXT: br label [[COND_END:%.*]] 8841 // CHECK9: cond.false: 8842 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8843 // CHECK9-NEXT: br label [[COND_END]] 8844 // CHECK9: cond.end: 8845 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 8846 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 8847 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 8848 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 8849 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 8850 // CHECK9: omp.inner.for.cond: 8851 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8852 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 8853 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 8854 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 8855 // CHECK9: omp.inner.for.body: 8856 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8857 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 8858 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 8859 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 8860 // CHECK9-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 8861 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 8862 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 8863 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 8864 // CHECK9-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 8865 // CHECK9-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 8866 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 8867 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 8868 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 8869 // CHECK9-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 8870 // CHECK9-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 8871 // CHECK9-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 8872 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 8873 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 8874 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 8875 // CHECK9-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 8876 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 8877 // CHECK9: omp.body.continue: 8878 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 8879 // CHECK9: omp.inner.for.inc: 8880 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8881 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 8882 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 8883 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 8884 // CHECK9: omp.inner.for.end: 8885 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 8886 // CHECK9: omp.loop.exit: 8887 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8888 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 8889 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 8890 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 8891 // CHECK9: omp.precond.end: 8892 // CHECK9-NEXT: ret void 8893 // 8894 // 8895 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447 8896 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 8897 // CHECK9-NEXT: entry: 8898 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 8899 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 8900 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 8901 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 8902 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 8903 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 8904 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 8905 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 8906 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 8907 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 8908 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 8909 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 8910 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 8911 // CHECK9-NEXT: ret void 8912 // 8913 // 8914 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..6 8915 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 8916 // CHECK9-NEXT: entry: 8917 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 8918 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 8919 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 8920 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 8921 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 8922 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 8923 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 8924 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 8925 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 8926 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 8927 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 8928 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 8929 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 8930 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 8931 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 8932 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 8933 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 8934 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 8935 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 8936 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 8937 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 8938 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 8939 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 8940 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 8941 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 8942 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 8943 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 8944 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 8945 // CHECK9-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 8946 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 8947 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 8948 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8949 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 8950 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 8951 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 8952 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 8953 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 8954 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 8955 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 8956 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 8957 // CHECK9: omp.precond.then: 8958 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 8959 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8960 // CHECK9-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 8961 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 8962 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 8963 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 8964 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 8965 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 8966 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 8967 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8968 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8969 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 8970 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 8971 // CHECK9: cond.true: 8972 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8973 // CHECK9-NEXT: br label [[COND_END:%.*]] 8974 // CHECK9: cond.false: 8975 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8976 // CHECK9-NEXT: br label [[COND_END]] 8977 // CHECK9: cond.end: 8978 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 8979 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 8980 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8981 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 8982 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 8983 // CHECK9: omp.inner.for.cond: 8984 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8985 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 8986 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 8987 // CHECK9-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 8988 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 8989 // CHECK9: omp.inner.for.body: 8990 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 8991 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 8992 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 8993 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 8994 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 8995 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 8996 // CHECK9: omp.inner.for.inc: 8997 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 8998 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 8999 // CHECK9-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 9000 // CHECK9-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 9001 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9002 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9003 // CHECK9-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 9004 // CHECK9-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 9005 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9006 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9007 // CHECK9-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 9008 // CHECK9-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 9009 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9010 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9011 // CHECK9-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 9012 // CHECK9-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 9013 // CHECK9: cond.true10: 9014 // CHECK9-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9015 // CHECK9-NEXT: br label [[COND_END12:%.*]] 9016 // CHECK9: cond.false11: 9017 // CHECK9-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9018 // CHECK9-NEXT: br label [[COND_END12]] 9019 // CHECK9: cond.end12: 9020 // CHECK9-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 9021 // CHECK9-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 9022 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9023 // CHECK9-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 9024 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9025 // CHECK9: omp.inner.for.end: 9026 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9027 // CHECK9: omp.loop.exit: 9028 // CHECK9-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9029 // CHECK9-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 9030 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 9031 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9032 // CHECK9: omp.precond.end: 9033 // CHECK9-NEXT: ret void 9034 // 9035 // 9036 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..7 9037 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9038 // CHECK9-NEXT: entry: 9039 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9040 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9041 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 9042 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 9043 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9044 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9045 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9046 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9047 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9048 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9049 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9050 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9051 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9052 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 9053 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 9054 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9055 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9056 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 9057 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9058 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9059 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9060 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9061 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9062 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9063 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9064 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9065 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9066 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9067 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9068 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9069 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9070 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 9071 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9072 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9073 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9074 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 9075 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9076 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9077 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9078 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9079 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9080 // CHECK9: omp.precond.then: 9081 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 9082 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9083 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 9084 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9085 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 9086 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9087 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 9088 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 9089 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 9090 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9091 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9092 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9093 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 9094 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9095 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9096 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9097 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 9098 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9099 // CHECK9: cond.true: 9100 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9101 // CHECK9-NEXT: br label [[COND_END:%.*]] 9102 // CHECK9: cond.false: 9103 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9104 // CHECK9-NEXT: br label [[COND_END]] 9105 // CHECK9: cond.end: 9106 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 9107 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 9108 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9109 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 9110 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9111 // CHECK9: omp.inner.for.cond: 9112 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9113 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9114 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 9115 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9116 // CHECK9: omp.inner.for.body: 9117 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9118 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 9119 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 9120 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 9121 // CHECK9-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 9122 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 9123 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 9124 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 9125 // CHECK9-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 9126 // CHECK9-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 9127 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 9128 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 9129 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 9130 // CHECK9-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 9131 // CHECK9-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 9132 // CHECK9-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 9133 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 9134 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 9135 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 9136 // CHECK9-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 9137 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 9138 // CHECK9: omp.body.continue: 9139 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9140 // CHECK9: omp.inner.for.inc: 9141 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9142 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 9143 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 9144 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9145 // CHECK9: omp.inner.for.end: 9146 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9147 // CHECK9: omp.loop.exit: 9148 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9149 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 9150 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 9151 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9152 // CHECK9: omp.precond.end: 9153 // CHECK9-NEXT: ret void 9154 // 9155 // 9156 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478 9157 // CHECK9-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 9158 // CHECK9-NEXT: entry: 9159 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 9160 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 9161 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 9162 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 9163 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 9164 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 9165 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 9166 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 9167 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 9168 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 9169 // CHECK9-NEXT: ret void 9170 // 9171 // 9172 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..10 9173 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9174 // CHECK9-NEXT: entry: 9175 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9176 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9177 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9178 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9179 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9180 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9181 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9182 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9183 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9184 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9185 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9186 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 9187 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 9188 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9189 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9190 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 9191 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9192 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9193 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9194 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9195 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9196 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9197 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9198 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9199 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9200 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9201 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9202 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 9203 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9204 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9205 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9206 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 9207 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9208 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9209 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9210 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9211 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9212 // CHECK9: omp.precond.then: 9213 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 9214 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9215 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 9216 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9217 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9218 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9219 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 9220 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9221 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9222 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9223 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 9224 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9225 // CHECK9: cond.true: 9226 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9227 // CHECK9-NEXT: br label [[COND_END:%.*]] 9228 // CHECK9: cond.false: 9229 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9230 // CHECK9-NEXT: br label [[COND_END]] 9231 // CHECK9: cond.end: 9232 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 9233 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 9234 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9235 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 9236 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9237 // CHECK9: omp.inner.for.cond: 9238 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9239 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9240 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 9241 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9242 // CHECK9: omp.inner.for.body: 9243 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9244 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 9245 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9246 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 9247 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 9248 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9249 // CHECK9: omp.inner.for.inc: 9250 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9251 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9252 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 9253 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 9254 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9255 // CHECK9: omp.inner.for.end: 9256 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9257 // CHECK9: omp.loop.exit: 9258 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9259 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 9260 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 9261 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9262 // CHECK9: omp.precond.end: 9263 // CHECK9-NEXT: ret void 9264 // 9265 // 9266 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..11 9267 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9268 // CHECK9-NEXT: entry: 9269 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9270 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9271 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 9272 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 9273 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9274 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9275 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9276 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9277 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9278 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9279 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9280 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9281 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9282 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 9283 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 9284 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9285 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9286 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 9287 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9288 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9289 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9290 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9291 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9292 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9293 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9294 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9295 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9296 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9297 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9298 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9299 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9300 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 9301 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9302 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9303 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9304 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 9305 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9306 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9307 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9308 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9309 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9310 // CHECK9: omp.precond.then: 9311 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 9312 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9313 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 9314 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9315 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 9316 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9317 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 9318 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 9319 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 9320 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9321 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9322 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9323 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 9324 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9325 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9326 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9327 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 9328 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9329 // CHECK9: cond.true: 9330 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9331 // CHECK9-NEXT: br label [[COND_END:%.*]] 9332 // CHECK9: cond.false: 9333 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9334 // CHECK9-NEXT: br label [[COND_END]] 9335 // CHECK9: cond.end: 9336 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 9337 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 9338 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9339 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 9340 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9341 // CHECK9: omp.inner.for.cond: 9342 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9343 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9344 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 9345 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9346 // CHECK9: omp.inner.for.body: 9347 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9348 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 9349 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 9350 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 9351 // CHECK9-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 9352 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 9353 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 9354 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 9355 // CHECK9-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 9356 // CHECK9-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 9357 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 9358 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 9359 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 9360 // CHECK9-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 9361 // CHECK9-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 9362 // CHECK9-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 9363 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 9364 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 9365 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 9366 // CHECK9-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 9367 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 9368 // CHECK9: omp.body.continue: 9369 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9370 // CHECK9: omp.inner.for.inc: 9371 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9372 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 9373 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 9374 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9375 // CHECK9: omp.inner.for.end: 9376 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9377 // CHECK9: omp.loop.exit: 9378 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9379 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 9380 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 9381 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9382 // CHECK9: omp.precond.end: 9383 // CHECK9-NEXT: ret void 9384 // 9385 // 9386 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506 9387 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 9388 // CHECK9-NEXT: entry: 9389 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 9390 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 9391 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 9392 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 9393 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 9394 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 9395 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 9396 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 9397 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 9398 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 9399 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 9400 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 9401 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 9402 // CHECK9-NEXT: ret void 9403 // 9404 // 9405 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..14 9406 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9407 // CHECK9-NEXT: entry: 9408 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9409 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9410 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 9411 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9412 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9413 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9414 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9415 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9416 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9417 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9418 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9419 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 9420 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9421 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 9422 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 9423 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9424 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9425 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 9426 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 9427 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9428 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9429 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 9430 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9431 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9432 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9433 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9434 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 9435 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9436 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 9437 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 9438 // CHECK9-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 9439 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 9440 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 9441 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 9442 // CHECK9-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9443 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9444 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 9445 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9446 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 9447 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 9448 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9449 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9450 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 9451 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9452 // CHECK9: omp.precond.then: 9453 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 9454 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9455 // CHECK9-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 9456 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9457 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9458 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9459 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 9460 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9461 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9462 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9463 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 9464 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9465 // CHECK9: cond.true: 9466 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9467 // CHECK9-NEXT: br label [[COND_END:%.*]] 9468 // CHECK9: cond.false: 9469 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9470 // CHECK9-NEXT: br label [[COND_END]] 9471 // CHECK9: cond.end: 9472 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 9473 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 9474 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9475 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 9476 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9477 // CHECK9: omp.inner.for.cond: 9478 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9479 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9480 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 9481 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9482 // CHECK9: omp.inner.for.body: 9483 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9484 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 9485 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9486 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 9487 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9488 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 9489 // CHECK9-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 9490 // CHECK9-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 9491 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 9492 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9493 // CHECK9: omp.inner.for.inc: 9494 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9495 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9496 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 9497 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 9498 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9499 // CHECK9: omp.inner.for.end: 9500 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9501 // CHECK9: omp.loop.exit: 9502 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9503 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 9504 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 9505 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9506 // CHECK9: omp.precond.end: 9507 // CHECK9-NEXT: ret void 9508 // 9509 // 9510 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..15 9511 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 9512 // CHECK9-NEXT: entry: 9513 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9514 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9515 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 9516 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 9517 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9518 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9519 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9520 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9521 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 9522 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9523 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9524 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9525 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 9526 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9527 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 9528 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 9529 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9530 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9531 // CHECK9-NEXT: [[I6:%.*]] = alloca i32, align 4 9532 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9533 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9534 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9535 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9536 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9537 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9538 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9539 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9540 // CHECK9-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 9541 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9542 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9543 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9544 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9545 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 9546 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9547 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9548 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9549 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9550 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9551 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 9552 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 9553 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9554 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9555 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9556 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9557 // CHECK9: omp.precond.then: 9558 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 9559 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9560 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 9561 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9562 // CHECK9-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 9563 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9564 // CHECK9-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 9565 // CHECK9-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 9566 // CHECK9-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 9567 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9568 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9569 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 9570 // CHECK9-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9571 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 9572 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 9573 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 9574 // CHECK9: omp.dispatch.cond: 9575 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9576 // CHECK9-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 9577 // CHECK9-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9578 // CHECK9-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 9579 // CHECK9-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9580 // CHECK9: cond.true: 9581 // CHECK9-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9582 // CHECK9-NEXT: br label [[COND_END:%.*]] 9583 // CHECK9: cond.false: 9584 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9585 // CHECK9-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 9586 // CHECK9-NEXT: br label [[COND_END]] 9587 // CHECK9: cond.end: 9588 // CHECK9-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 9589 // CHECK9-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 9590 // CHECK9-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 9591 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9592 // CHECK9-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 9593 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9594 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9595 // CHECK9-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 9596 // CHECK9-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 9597 // CHECK9: omp.dispatch.body: 9598 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9599 // CHECK9: omp.inner.for.cond: 9600 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9601 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9602 // CHECK9-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 9603 // CHECK9-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9604 // CHECK9: omp.inner.for.body: 9605 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9606 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 9607 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 9608 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 9609 // CHECK9-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 8 9610 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 9611 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 9612 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM]] 9613 // CHECK9-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 8 9614 // CHECK9-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 8 9615 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 9616 // CHECK9-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 9617 // CHECK9-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM13]] 9618 // CHECK9-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX14]], align 8 9619 // CHECK9-NEXT: [[ADD15:%.*]] = fadd double [[TMP25]], [[TMP28]] 9620 // CHECK9-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 8 9621 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 9622 // CHECK9-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 9623 // CHECK9-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds double, double* [[TMP29]], i64 [[IDXPROM16]] 9624 // CHECK9-NEXT: store double [[ADD15]], double* [[ARRAYIDX17]], align 8 9625 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 9626 // CHECK9: omp.body.continue: 9627 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9628 // CHECK9: omp.inner.for.inc: 9629 // CHECK9-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9630 // CHECK9-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP31]], 1 9631 // CHECK9-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 9632 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9633 // CHECK9: omp.inner.for.end: 9634 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 9635 // CHECK9: omp.dispatch.inc: 9636 // CHECK9-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9637 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9638 // CHECK9-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 9639 // CHECK9-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 9640 // CHECK9-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9641 // CHECK9-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9642 // CHECK9-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 9643 // CHECK9-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 9644 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 9645 // CHECK9: omp.dispatch.end: 9646 // CHECK9-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9647 // CHECK9-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 9648 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 9649 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9650 // CHECK9: omp.precond.end: 9651 // CHECK9-NEXT: ret void 9652 // 9653 // 9654 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536 9655 // CHECK9-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 9656 // CHECK9-NEXT: entry: 9657 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 9658 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 9659 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 9660 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 9661 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 9662 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 9663 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 9664 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 9665 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 9666 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 9667 // CHECK9-NEXT: ret void 9668 // 9669 // 9670 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..18 9671 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9672 // CHECK9-NEXT: entry: 9673 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9674 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9675 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9676 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9677 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9678 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9679 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9680 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9681 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9682 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9683 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9684 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 9685 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 9686 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9687 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9688 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 9689 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9690 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9691 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9692 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9693 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9694 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9695 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9696 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9697 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9698 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9699 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9700 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 9701 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9702 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9703 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9704 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 9705 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9706 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9707 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9708 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9709 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9710 // CHECK9: omp.precond.then: 9711 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 9712 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9713 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 9714 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9715 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9716 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9717 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 9718 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9719 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9720 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9721 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 9722 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9723 // CHECK9: cond.true: 9724 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9725 // CHECK9-NEXT: br label [[COND_END:%.*]] 9726 // CHECK9: cond.false: 9727 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9728 // CHECK9-NEXT: br label [[COND_END]] 9729 // CHECK9: cond.end: 9730 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 9731 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 9732 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9733 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 9734 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9735 // CHECK9: omp.inner.for.cond: 9736 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9737 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9738 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 9739 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9740 // CHECK9: omp.inner.for.body: 9741 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9742 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 9743 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9744 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 9745 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 9746 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9747 // CHECK9: omp.inner.for.inc: 9748 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9749 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9750 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 9751 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 9752 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9753 // CHECK9: omp.inner.for.end: 9754 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9755 // CHECK9: omp.loop.exit: 9756 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9757 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 9758 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 9759 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9760 // CHECK9: omp.precond.end: 9761 // CHECK9-NEXT: ret void 9762 // 9763 // 9764 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..19 9765 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9766 // CHECK9-NEXT: entry: 9767 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9768 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9769 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 9770 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 9771 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9772 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9773 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9774 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9775 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9776 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9777 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9778 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9779 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9780 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 9781 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 9782 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9783 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9784 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 9785 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9786 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9787 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9788 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9789 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9790 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9791 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9792 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9793 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9794 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 9795 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 9796 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 9797 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 9798 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 9799 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9800 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 9801 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9802 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 9803 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9804 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9805 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9806 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 9807 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9808 // CHECK9: omp.precond.then: 9809 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 9810 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9811 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 9812 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 9813 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 9814 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 9815 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 9816 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 9817 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 9818 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9819 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9820 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9821 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 9822 // CHECK9-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9823 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 9824 // CHECK9-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 9825 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 9826 // CHECK9: omp.dispatch.cond: 9827 // CHECK9-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9828 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 9829 // CHECK9-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 9830 // CHECK9-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 9831 // CHECK9-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 9832 // CHECK9: omp.dispatch.body: 9833 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 9834 // CHECK9-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 9835 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9836 // CHECK9: omp.inner.for.cond: 9837 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 9838 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !18 9839 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 9840 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9841 // CHECK9: omp.inner.for.body: 9842 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 9843 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 9844 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 9845 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !18 9846 // CHECK9-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !18 9847 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 9848 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 9849 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i64 [[IDXPROM]] 9850 // CHECK9-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !18 9851 // CHECK9-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !18 9852 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 9853 // CHECK9-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 9854 // CHECK9-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM6]] 9855 // CHECK9-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX7]], align 8, !llvm.access.group !18 9856 // CHECK9-NEXT: [[ADD8:%.*]] = fadd double [[TMP23]], [[TMP26]] 9857 // CHECK9-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !18 9858 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 9859 // CHECK9-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 9860 // CHECK9-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM9]] 9861 // CHECK9-NEXT: store double [[ADD8]], double* [[ARRAYIDX10]], align 8, !llvm.access.group !18 9862 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 9863 // CHECK9: omp.body.continue: 9864 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9865 // CHECK9: omp.inner.for.inc: 9866 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 9867 // CHECK9-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP29]], 1 9868 // CHECK9-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 9869 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP19:![0-9]+]] 9870 // CHECK9: omp.inner.for.end: 9871 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 9872 // CHECK9: omp.dispatch.inc: 9873 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 9874 // CHECK9: omp.dispatch.end: 9875 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 9876 // CHECK9: omp.precond.end: 9877 // CHECK9-NEXT: ret void 9878 // 9879 // 9880 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562 9881 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 9882 // CHECK9-NEXT: entry: 9883 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 9884 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 9885 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 9886 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 9887 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 9888 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 9889 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 9890 // CHECK9-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 9891 // CHECK9-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 9892 // CHECK9-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 9893 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 9894 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 9895 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 9896 // CHECK9-NEXT: ret void 9897 // 9898 // 9899 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..22 9900 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 9901 // CHECK9-NEXT: entry: 9902 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 9903 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 9904 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 9905 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 9906 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 9907 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 9908 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 9909 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 9910 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 9911 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 9912 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 9913 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 9914 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 9915 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 9916 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 9917 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 9918 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 9919 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 9920 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 9921 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 9922 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 9923 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 9924 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 9925 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 9926 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 9927 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 9928 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 9929 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 9930 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 9931 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 9932 // CHECK9-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 9933 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 9934 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 9935 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 9936 // CHECK9-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 9937 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9938 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 9939 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 9940 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 9941 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 9942 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 9943 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 9944 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 9945 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 9946 // CHECK9: omp.precond.then: 9947 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 9948 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9949 // CHECK9-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 9950 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 9951 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 9952 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9953 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 9954 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 9955 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9956 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9957 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 9958 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 9959 // CHECK9: cond.true: 9960 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 9961 // CHECK9-NEXT: br label [[COND_END:%.*]] 9962 // CHECK9: cond.false: 9963 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9964 // CHECK9-NEXT: br label [[COND_END]] 9965 // CHECK9: cond.end: 9966 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 9967 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 9968 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9969 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 9970 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 9971 // CHECK9: omp.inner.for.cond: 9972 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9973 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9974 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 9975 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 9976 // CHECK9: omp.inner.for.body: 9977 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 9978 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 9979 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 9980 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 9981 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 9982 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 9983 // CHECK9-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 9984 // CHECK9-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 9985 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 9986 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 9987 // CHECK9: omp.inner.for.inc: 9988 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 9989 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 9990 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 9991 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 9992 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 9993 // CHECK9: omp.inner.for.end: 9994 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 9995 // CHECK9: omp.loop.exit: 9996 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 9997 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 9998 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 9999 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 10000 // CHECK9: omp.precond.end: 10001 // CHECK9-NEXT: ret void 10002 // 10003 // 10004 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..23 10005 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 10006 // CHECK9-NEXT: entry: 10007 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 10008 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 10009 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 10010 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 10011 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 10012 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 10013 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 10014 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 10015 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 10016 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 10017 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 10018 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 10019 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 10020 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 10021 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 10022 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 10023 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 10024 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 10025 // CHECK9-NEXT: [[I6:%.*]] = alloca i32, align 4 10026 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 10027 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 10028 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 10029 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 10030 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 10031 // CHECK9-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 10032 // CHECK9-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 10033 // CHECK9-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 10034 // CHECK9-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 10035 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 10036 // CHECK9-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 10037 // CHECK9-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 10038 // CHECK9-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 10039 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 10040 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 10041 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 10042 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10043 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 10044 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 10045 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 10046 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 10047 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 10048 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10049 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 10050 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 10051 // CHECK9: omp.precond.then: 10052 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 10053 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 10054 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 10055 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 10056 // CHECK9-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 10057 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 10058 // CHECK9-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 10059 // CHECK9-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 10060 // CHECK9-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 10061 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 10062 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 10063 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 10064 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 10065 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 10066 // CHECK9-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10067 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 10068 // CHECK9-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 10069 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 10070 // CHECK9: omp.dispatch.cond: 10071 // CHECK9-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10072 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 10073 // CHECK9-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 10074 // CHECK9-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 10075 // CHECK9-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 10076 // CHECK9: omp.dispatch.body: 10077 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 10078 // CHECK9-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 10079 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 10080 // CHECK9: omp.inner.for.cond: 10081 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 10082 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !21 10083 // CHECK9-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 10084 // CHECK9-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 10085 // CHECK9: omp.inner.for.body: 10086 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 10087 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 10088 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 10089 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !21 10090 // CHECK9-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !21 10091 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 10092 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 10093 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i64 [[IDXPROM]] 10094 // CHECK9-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !21 10095 // CHECK9-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !21 10096 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 10097 // CHECK9-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 10098 // CHECK9-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds double, double* [[TMP25]], i64 [[IDXPROM8]] 10099 // CHECK9-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX9]], align 8, !llvm.access.group !21 10100 // CHECK9-NEXT: [[ADD10:%.*]] = fadd double [[TMP24]], [[TMP27]] 10101 // CHECK9-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !21 10102 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 10103 // CHECK9-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 10104 // CHECK9-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP28]], i64 [[IDXPROM11]] 10105 // CHECK9-NEXT: store double [[ADD10]], double* [[ARRAYIDX12]], align 8, !llvm.access.group !21 10106 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 10107 // CHECK9: omp.body.continue: 10108 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 10109 // CHECK9: omp.inner.for.inc: 10110 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 10111 // CHECK9-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP30]], 1 10112 // CHECK9-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 10113 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP22:![0-9]+]] 10114 // CHECK9: omp.inner.for.end: 10115 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 10116 // CHECK9: omp.dispatch.inc: 10117 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 10118 // CHECK9: omp.dispatch.end: 10119 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 10120 // CHECK9: omp.precond.end: 10121 // CHECK9-NEXT: ret void 10122 // 10123 // 10124 // CHECK9-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 10125 // CHECK9-SAME: () #[[ATTR3:[0-9]+]] comdat { 10126 // CHECK9-NEXT: entry: 10127 // CHECK9-NEXT: [[A:%.*]] = alloca i32*, align 8 10128 // CHECK9-NEXT: [[B:%.*]] = alloca i32*, align 8 10129 // CHECK9-NEXT: [[C:%.*]] = alloca i32*, align 8 10130 // CHECK9-NEXT: [[N:%.*]] = alloca i32, align 4 10131 // CHECK9-NEXT: [[CH:%.*]] = alloca i32, align 4 10132 // CHECK9-NEXT: [[N_CASTED:%.*]] = alloca i64, align 8 10133 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 8 10134 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 8 10135 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 8 10136 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 10137 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 10138 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 10139 // CHECK9-NEXT: [[N_CASTED3:%.*]] = alloca i64, align 8 10140 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS5:%.*]] = alloca [4 x i8*], align 8 10141 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS6:%.*]] = alloca [4 x i8*], align 8 10142 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS7:%.*]] = alloca [4 x i8*], align 8 10143 // CHECK9-NEXT: [[_TMP8:%.*]] = alloca i32, align 4 10144 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 10145 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_10:%.*]] = alloca i32, align 4 10146 // CHECK9-NEXT: [[CH_CASTED:%.*]] = alloca i64, align 8 10147 // CHECK9-NEXT: [[N_CASTED18:%.*]] = alloca i64, align 8 10148 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS20:%.*]] = alloca [5 x i8*], align 8 10149 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS21:%.*]] = alloca [5 x i8*], align 8 10150 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS22:%.*]] = alloca [5 x i8*], align 8 10151 // CHECK9-NEXT: [[_TMP23:%.*]] = alloca i32, align 4 10152 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_24:%.*]] = alloca i32, align 4 10153 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_25:%.*]] = alloca i32, align 4 10154 // CHECK9-NEXT: [[N_CASTED32:%.*]] = alloca i64, align 8 10155 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS34:%.*]] = alloca [4 x i8*], align 8 10156 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS35:%.*]] = alloca [4 x i8*], align 8 10157 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS36:%.*]] = alloca [4 x i8*], align 8 10158 // CHECK9-NEXT: [[_TMP37:%.*]] = alloca i32, align 4 10159 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_38:%.*]] = alloca i32, align 4 10160 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_39:%.*]] = alloca i32, align 4 10161 // CHECK9-NEXT: [[CH_CASTED46:%.*]] = alloca i64, align 8 10162 // CHECK9-NEXT: [[N_CASTED48:%.*]] = alloca i64, align 8 10163 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS50:%.*]] = alloca [5 x i8*], align 8 10164 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS51:%.*]] = alloca [5 x i8*], align 8 10165 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS52:%.*]] = alloca [5 x i8*], align 8 10166 // CHECK9-NEXT: [[_TMP53:%.*]] = alloca i32, align 4 10167 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_54:%.*]] = alloca i32, align 4 10168 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_55:%.*]] = alloca i32, align 4 10169 // CHECK9-NEXT: [[N_CASTED62:%.*]] = alloca i64, align 8 10170 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS64:%.*]] = alloca [4 x i8*], align 8 10171 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS65:%.*]] = alloca [4 x i8*], align 8 10172 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS66:%.*]] = alloca [4 x i8*], align 8 10173 // CHECK9-NEXT: [[_TMP67:%.*]] = alloca i32, align 4 10174 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_68:%.*]] = alloca i32, align 4 10175 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_69:%.*]] = alloca i32, align 4 10176 // CHECK9-NEXT: [[CH_CASTED76:%.*]] = alloca i64, align 8 10177 // CHECK9-NEXT: [[N_CASTED78:%.*]] = alloca i64, align 8 10178 // CHECK9-NEXT: [[DOTOFFLOAD_BASEPTRS80:%.*]] = alloca [5 x i8*], align 8 10179 // CHECK9-NEXT: [[DOTOFFLOAD_PTRS81:%.*]] = alloca [5 x i8*], align 8 10180 // CHECK9-NEXT: [[DOTOFFLOAD_MAPPERS82:%.*]] = alloca [5 x i8*], align 8 10181 // CHECK9-NEXT: [[_TMP83:%.*]] = alloca i32, align 4 10182 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_84:%.*]] = alloca i32, align 4 10183 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_85:%.*]] = alloca i32, align 4 10184 // CHECK9-NEXT: store i32 10000, i32* [[N]], align 4 10185 // CHECK9-NEXT: store i32 100, i32* [[CH]], align 4 10186 // CHECK9-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 10187 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_CASTED]] to i32* 10188 // CHECK9-NEXT: store i32 [[TMP0]], i32* [[CONV]], align 4 10189 // CHECK9-NEXT: [[TMP1:%.*]] = load i64, i64* [[N_CASTED]], align 8 10190 // CHECK9-NEXT: [[TMP2:%.*]] = load i32*, i32** [[A]], align 8 10191 // CHECK9-NEXT: [[TMP3:%.*]] = load i32*, i32** [[B]], align 8 10192 // CHECK9-NEXT: [[TMP4:%.*]] = load i32*, i32** [[C]], align 8 10193 // CHECK9-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 10194 // CHECK9-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i64* 10195 // CHECK9-NEXT: store i64 [[TMP1]], i64* [[TMP6]], align 8 10196 // CHECK9-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 10197 // CHECK9-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i64* 10198 // CHECK9-NEXT: store i64 [[TMP1]], i64* [[TMP8]], align 8 10199 // CHECK9-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0 10200 // CHECK9-NEXT: store i8* null, i8** [[TMP9]], align 8 10201 // CHECK9-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 10202 // CHECK9-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to i32** 10203 // CHECK9-NEXT: store i32* [[TMP2]], i32** [[TMP11]], align 8 10204 // CHECK9-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 10205 // CHECK9-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to i32** 10206 // CHECK9-NEXT: store i32* [[TMP2]], i32** [[TMP13]], align 8 10207 // CHECK9-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 1 10208 // CHECK9-NEXT: store i8* null, i8** [[TMP14]], align 8 10209 // CHECK9-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 10210 // CHECK9-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to i32** 10211 // CHECK9-NEXT: store i32* [[TMP3]], i32** [[TMP16]], align 8 10212 // CHECK9-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 10213 // CHECK9-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to i32** 10214 // CHECK9-NEXT: store i32* [[TMP3]], i32** [[TMP18]], align 8 10215 // CHECK9-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 2 10216 // CHECK9-NEXT: store i8* null, i8** [[TMP19]], align 8 10217 // CHECK9-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 10218 // CHECK9-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to i32** 10219 // CHECK9-NEXT: store i32* [[TMP4]], i32** [[TMP21]], align 8 10220 // CHECK9-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 10221 // CHECK9-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to i32** 10222 // CHECK9-NEXT: store i32* [[TMP4]], i32** [[TMP23]], align 8 10223 // CHECK9-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 3 10224 // CHECK9-NEXT: store i8* null, i8** [[TMP24]], align 8 10225 // CHECK9-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 10226 // CHECK9-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 10227 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 10228 // CHECK9-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 10229 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10230 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 10231 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 10232 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 10233 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 10234 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10235 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 10236 // CHECK9-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 10237 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP30]]) 10238 // CHECK9-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.28, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.29, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10239 // CHECK9-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 10240 // CHECK9-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 10241 // CHECK9: omp_offload.failed: 10242 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42(i64 [[TMP1]], i32* [[TMP2]], i32* [[TMP3]], i32* [[TMP4]]) #[[ATTR2]] 10243 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT]] 10244 // CHECK9: omp_offload.cont: 10245 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 10246 // CHECK9-NEXT: [[CONV4:%.*]] = bitcast i64* [[N_CASTED3]] to i32* 10247 // CHECK9-NEXT: store i32 [[TMP33]], i32* [[CONV4]], align 4 10248 // CHECK9-NEXT: [[TMP34:%.*]] = load i64, i64* [[N_CASTED3]], align 8 10249 // CHECK9-NEXT: [[TMP35:%.*]] = load i32*, i32** [[A]], align 8 10250 // CHECK9-NEXT: [[TMP36:%.*]] = load i32*, i32** [[B]], align 8 10251 // CHECK9-NEXT: [[TMP37:%.*]] = load i32*, i32** [[C]], align 8 10252 // CHECK9-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 10253 // CHECK9-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i64* 10254 // CHECK9-NEXT: store i64 [[TMP34]], i64* [[TMP39]], align 8 10255 // CHECK9-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 10256 // CHECK9-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i64* 10257 // CHECK9-NEXT: store i64 [[TMP34]], i64* [[TMP41]], align 8 10258 // CHECK9-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 0 10259 // CHECK9-NEXT: store i8* null, i8** [[TMP42]], align 8 10260 // CHECK9-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 1 10261 // CHECK9-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to i32** 10262 // CHECK9-NEXT: store i32* [[TMP35]], i32** [[TMP44]], align 8 10263 // CHECK9-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 1 10264 // CHECK9-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to i32** 10265 // CHECK9-NEXT: store i32* [[TMP35]], i32** [[TMP46]], align 8 10266 // CHECK9-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 1 10267 // CHECK9-NEXT: store i8* null, i8** [[TMP47]], align 8 10268 // CHECK9-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 2 10269 // CHECK9-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to i32** 10270 // CHECK9-NEXT: store i32* [[TMP36]], i32** [[TMP49]], align 8 10271 // CHECK9-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 2 10272 // CHECK9-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to i32** 10273 // CHECK9-NEXT: store i32* [[TMP36]], i32** [[TMP51]], align 8 10274 // CHECK9-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 2 10275 // CHECK9-NEXT: store i8* null, i8** [[TMP52]], align 8 10276 // CHECK9-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 3 10277 // CHECK9-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to i32** 10278 // CHECK9-NEXT: store i32* [[TMP37]], i32** [[TMP54]], align 8 10279 // CHECK9-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 3 10280 // CHECK9-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to i32** 10281 // CHECK9-NEXT: store i32* [[TMP37]], i32** [[TMP56]], align 8 10282 // CHECK9-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 3 10283 // CHECK9-NEXT: store i8* null, i8** [[TMP57]], align 8 10284 // CHECK9-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 10285 // CHECK9-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 10286 // CHECK9-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 10287 // CHECK9-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_9]], align 4 10288 // CHECK9-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 10289 // CHECK9-NEXT: [[SUB11:%.*]] = sub nsw i32 [[TMP61]], 0 10290 // CHECK9-NEXT: [[DIV12:%.*]] = sdiv i32 [[SUB11]], 1 10291 // CHECK9-NEXT: [[SUB13:%.*]] = sub nsw i32 [[DIV12]], 1 10292 // CHECK9-NEXT: store i32 [[SUB13]], i32* [[DOTCAPTURE_EXPR_10]], align 4 10293 // CHECK9-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_10]], align 4 10294 // CHECK9-NEXT: [[ADD14:%.*]] = add nsw i32 [[TMP62]], 1 10295 // CHECK9-NEXT: [[TMP63:%.*]] = zext i32 [[ADD14]] to i64 10296 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 10297 // CHECK9-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.32, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.33, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10298 // CHECK9-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 10299 // CHECK9-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED15:%.*]], label [[OMP_OFFLOAD_CONT16:%.*]] 10300 // CHECK9: omp_offload.failed15: 10301 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51(i64 [[TMP34]], i32* [[TMP35]], i32* [[TMP36]], i32* [[TMP37]]) #[[ATTR2]] 10302 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT16]] 10303 // CHECK9: omp_offload.cont16: 10304 // CHECK9-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 10305 // CHECK9-NEXT: [[CONV17:%.*]] = bitcast i64* [[CH_CASTED]] to i32* 10306 // CHECK9-NEXT: store i32 [[TMP66]], i32* [[CONV17]], align 4 10307 // CHECK9-NEXT: [[TMP67:%.*]] = load i64, i64* [[CH_CASTED]], align 8 10308 // CHECK9-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 10309 // CHECK9-NEXT: [[CONV19:%.*]] = bitcast i64* [[N_CASTED18]] to i32* 10310 // CHECK9-NEXT: store i32 [[TMP68]], i32* [[CONV19]], align 4 10311 // CHECK9-NEXT: [[TMP69:%.*]] = load i64, i64* [[N_CASTED18]], align 8 10312 // CHECK9-NEXT: [[TMP70:%.*]] = load i32*, i32** [[A]], align 8 10313 // CHECK9-NEXT: [[TMP71:%.*]] = load i32*, i32** [[B]], align 8 10314 // CHECK9-NEXT: [[TMP72:%.*]] = load i32*, i32** [[C]], align 8 10315 // CHECK9-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 10316 // CHECK9-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i64* 10317 // CHECK9-NEXT: store i64 [[TMP67]], i64* [[TMP74]], align 8 10318 // CHECK9-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 10319 // CHECK9-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i64* 10320 // CHECK9-NEXT: store i64 [[TMP67]], i64* [[TMP76]], align 8 10321 // CHECK9-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 0 10322 // CHECK9-NEXT: store i8* null, i8** [[TMP77]], align 8 10323 // CHECK9-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 1 10324 // CHECK9-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i64* 10325 // CHECK9-NEXT: store i64 [[TMP69]], i64* [[TMP79]], align 8 10326 // CHECK9-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 1 10327 // CHECK9-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i64* 10328 // CHECK9-NEXT: store i64 [[TMP69]], i64* [[TMP81]], align 8 10329 // CHECK9-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 1 10330 // CHECK9-NEXT: store i8* null, i8** [[TMP82]], align 8 10331 // CHECK9-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 2 10332 // CHECK9-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to i32** 10333 // CHECK9-NEXT: store i32* [[TMP70]], i32** [[TMP84]], align 8 10334 // CHECK9-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 2 10335 // CHECK9-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to i32** 10336 // CHECK9-NEXT: store i32* [[TMP70]], i32** [[TMP86]], align 8 10337 // CHECK9-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 2 10338 // CHECK9-NEXT: store i8* null, i8** [[TMP87]], align 8 10339 // CHECK9-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 3 10340 // CHECK9-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to i32** 10341 // CHECK9-NEXT: store i32* [[TMP71]], i32** [[TMP89]], align 8 10342 // CHECK9-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 3 10343 // CHECK9-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to i32** 10344 // CHECK9-NEXT: store i32* [[TMP71]], i32** [[TMP91]], align 8 10345 // CHECK9-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 3 10346 // CHECK9-NEXT: store i8* null, i8** [[TMP92]], align 8 10347 // CHECK9-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 4 10348 // CHECK9-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to i32** 10349 // CHECK9-NEXT: store i32* [[TMP72]], i32** [[TMP94]], align 8 10350 // CHECK9-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 4 10351 // CHECK9-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to i32** 10352 // CHECK9-NEXT: store i32* [[TMP72]], i32** [[TMP96]], align 8 10353 // CHECK9-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 4 10354 // CHECK9-NEXT: store i8* null, i8** [[TMP97]], align 8 10355 // CHECK9-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 10356 // CHECK9-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 10357 // CHECK9-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 10358 // CHECK9-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_24]], align 4 10359 // CHECK9-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_24]], align 4 10360 // CHECK9-NEXT: [[SUB26:%.*]] = sub nsw i32 [[TMP101]], 0 10361 // CHECK9-NEXT: [[DIV27:%.*]] = sdiv i32 [[SUB26]], 1 10362 // CHECK9-NEXT: [[SUB28:%.*]] = sub nsw i32 [[DIV27]], 1 10363 // CHECK9-NEXT: store i32 [[SUB28]], i32* [[DOTCAPTURE_EXPR_25]], align 4 10364 // CHECK9-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_25]], align 4 10365 // CHECK9-NEXT: [[ADD29:%.*]] = add nsw i32 [[TMP102]], 1 10366 // CHECK9-NEXT: [[TMP103:%.*]] = zext i32 [[ADD29]] to i64 10367 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 10368 // CHECK9-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.36, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.37, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10369 // CHECK9-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 10370 // CHECK9-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED30:%.*]], label [[OMP_OFFLOAD_CONT31:%.*]] 10371 // CHECK9: omp_offload.failed30: 10372 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59(i64 [[TMP67]], i64 [[TMP69]], i32* [[TMP70]], i32* [[TMP71]], i32* [[TMP72]]) #[[ATTR2]] 10373 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT31]] 10374 // CHECK9: omp_offload.cont31: 10375 // CHECK9-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 10376 // CHECK9-NEXT: [[CONV33:%.*]] = bitcast i64* [[N_CASTED32]] to i32* 10377 // CHECK9-NEXT: store i32 [[TMP106]], i32* [[CONV33]], align 4 10378 // CHECK9-NEXT: [[TMP107:%.*]] = load i64, i64* [[N_CASTED32]], align 8 10379 // CHECK9-NEXT: [[TMP108:%.*]] = load i32*, i32** [[A]], align 8 10380 // CHECK9-NEXT: [[TMP109:%.*]] = load i32*, i32** [[B]], align 8 10381 // CHECK9-NEXT: [[TMP110:%.*]] = load i32*, i32** [[C]], align 8 10382 // CHECK9-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 10383 // CHECK9-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i64* 10384 // CHECK9-NEXT: store i64 [[TMP107]], i64* [[TMP112]], align 8 10385 // CHECK9-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 10386 // CHECK9-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i64* 10387 // CHECK9-NEXT: store i64 [[TMP107]], i64* [[TMP114]], align 8 10388 // CHECK9-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 0 10389 // CHECK9-NEXT: store i8* null, i8** [[TMP115]], align 8 10390 // CHECK9-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 1 10391 // CHECK9-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to i32** 10392 // CHECK9-NEXT: store i32* [[TMP108]], i32** [[TMP117]], align 8 10393 // CHECK9-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 1 10394 // CHECK9-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to i32** 10395 // CHECK9-NEXT: store i32* [[TMP108]], i32** [[TMP119]], align 8 10396 // CHECK9-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 1 10397 // CHECK9-NEXT: store i8* null, i8** [[TMP120]], align 8 10398 // CHECK9-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 2 10399 // CHECK9-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to i32** 10400 // CHECK9-NEXT: store i32* [[TMP109]], i32** [[TMP122]], align 8 10401 // CHECK9-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 2 10402 // CHECK9-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to i32** 10403 // CHECK9-NEXT: store i32* [[TMP109]], i32** [[TMP124]], align 8 10404 // CHECK9-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 2 10405 // CHECK9-NEXT: store i8* null, i8** [[TMP125]], align 8 10406 // CHECK9-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 3 10407 // CHECK9-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to i32** 10408 // CHECK9-NEXT: store i32* [[TMP110]], i32** [[TMP127]], align 8 10409 // CHECK9-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 3 10410 // CHECK9-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to i32** 10411 // CHECK9-NEXT: store i32* [[TMP110]], i32** [[TMP129]], align 8 10412 // CHECK9-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 3 10413 // CHECK9-NEXT: store i8* null, i8** [[TMP130]], align 8 10414 // CHECK9-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 10415 // CHECK9-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 10416 // CHECK9-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 10417 // CHECK9-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_38]], align 4 10418 // CHECK9-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_38]], align 4 10419 // CHECK9-NEXT: [[SUB40:%.*]] = sub nsw i32 [[TMP134]], 0 10420 // CHECK9-NEXT: [[DIV41:%.*]] = sdiv i32 [[SUB40]], 1 10421 // CHECK9-NEXT: [[SUB42:%.*]] = sub nsw i32 [[DIV41]], 1 10422 // CHECK9-NEXT: store i32 [[SUB42]], i32* [[DOTCAPTURE_EXPR_39]], align 4 10423 // CHECK9-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_39]], align 4 10424 // CHECK9-NEXT: [[ADD43:%.*]] = add nsw i32 [[TMP135]], 1 10425 // CHECK9-NEXT: [[TMP136:%.*]] = zext i32 [[ADD43]] to i64 10426 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 10427 // CHECK9-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.40, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.41, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10428 // CHECK9-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 10429 // CHECK9-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED44:%.*]], label [[OMP_OFFLOAD_CONT45:%.*]] 10430 // CHECK9: omp_offload.failed44: 10431 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67(i64 [[TMP107]], i32* [[TMP108]], i32* [[TMP109]], i32* [[TMP110]]) #[[ATTR2]] 10432 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT45]] 10433 // CHECK9: omp_offload.cont45: 10434 // CHECK9-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 10435 // CHECK9-NEXT: [[CONV47:%.*]] = bitcast i64* [[CH_CASTED46]] to i32* 10436 // CHECK9-NEXT: store i32 [[TMP139]], i32* [[CONV47]], align 4 10437 // CHECK9-NEXT: [[TMP140:%.*]] = load i64, i64* [[CH_CASTED46]], align 8 10438 // CHECK9-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 10439 // CHECK9-NEXT: [[CONV49:%.*]] = bitcast i64* [[N_CASTED48]] to i32* 10440 // CHECK9-NEXT: store i32 [[TMP141]], i32* [[CONV49]], align 4 10441 // CHECK9-NEXT: [[TMP142:%.*]] = load i64, i64* [[N_CASTED48]], align 8 10442 // CHECK9-NEXT: [[TMP143:%.*]] = load i32*, i32** [[A]], align 8 10443 // CHECK9-NEXT: [[TMP144:%.*]] = load i32*, i32** [[B]], align 8 10444 // CHECK9-NEXT: [[TMP145:%.*]] = load i32*, i32** [[C]], align 8 10445 // CHECK9-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 10446 // CHECK9-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i64* 10447 // CHECK9-NEXT: store i64 [[TMP140]], i64* [[TMP147]], align 8 10448 // CHECK9-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 10449 // CHECK9-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i64* 10450 // CHECK9-NEXT: store i64 [[TMP140]], i64* [[TMP149]], align 8 10451 // CHECK9-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 0 10452 // CHECK9-NEXT: store i8* null, i8** [[TMP150]], align 8 10453 // CHECK9-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 1 10454 // CHECK9-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i64* 10455 // CHECK9-NEXT: store i64 [[TMP142]], i64* [[TMP152]], align 8 10456 // CHECK9-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 1 10457 // CHECK9-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i64* 10458 // CHECK9-NEXT: store i64 [[TMP142]], i64* [[TMP154]], align 8 10459 // CHECK9-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 1 10460 // CHECK9-NEXT: store i8* null, i8** [[TMP155]], align 8 10461 // CHECK9-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 2 10462 // CHECK9-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to i32** 10463 // CHECK9-NEXT: store i32* [[TMP143]], i32** [[TMP157]], align 8 10464 // CHECK9-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 2 10465 // CHECK9-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to i32** 10466 // CHECK9-NEXT: store i32* [[TMP143]], i32** [[TMP159]], align 8 10467 // CHECK9-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 2 10468 // CHECK9-NEXT: store i8* null, i8** [[TMP160]], align 8 10469 // CHECK9-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 3 10470 // CHECK9-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to i32** 10471 // CHECK9-NEXT: store i32* [[TMP144]], i32** [[TMP162]], align 8 10472 // CHECK9-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 3 10473 // CHECK9-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to i32** 10474 // CHECK9-NEXT: store i32* [[TMP144]], i32** [[TMP164]], align 8 10475 // CHECK9-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 3 10476 // CHECK9-NEXT: store i8* null, i8** [[TMP165]], align 8 10477 // CHECK9-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 4 10478 // CHECK9-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to i32** 10479 // CHECK9-NEXT: store i32* [[TMP145]], i32** [[TMP167]], align 8 10480 // CHECK9-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 4 10481 // CHECK9-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to i32** 10482 // CHECK9-NEXT: store i32* [[TMP145]], i32** [[TMP169]], align 8 10483 // CHECK9-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 4 10484 // CHECK9-NEXT: store i8* null, i8** [[TMP170]], align 8 10485 // CHECK9-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 10486 // CHECK9-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 10487 // CHECK9-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 10488 // CHECK9-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_54]], align 4 10489 // CHECK9-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_54]], align 4 10490 // CHECK9-NEXT: [[SUB56:%.*]] = sub nsw i32 [[TMP174]], 0 10491 // CHECK9-NEXT: [[DIV57:%.*]] = sdiv i32 [[SUB56]], 1 10492 // CHECK9-NEXT: [[SUB58:%.*]] = sub nsw i32 [[DIV57]], 1 10493 // CHECK9-NEXT: store i32 [[SUB58]], i32* [[DOTCAPTURE_EXPR_55]], align 4 10494 // CHECK9-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_55]], align 4 10495 // CHECK9-NEXT: [[ADD59:%.*]] = add nsw i32 [[TMP175]], 1 10496 // CHECK9-NEXT: [[TMP176:%.*]] = zext i32 [[ADD59]] to i64 10497 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 10498 // CHECK9-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.44, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.45, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10499 // CHECK9-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 10500 // CHECK9-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED60:%.*]], label [[OMP_OFFLOAD_CONT61:%.*]] 10501 // CHECK9: omp_offload.failed60: 10502 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75(i64 [[TMP140]], i64 [[TMP142]], i32* [[TMP143]], i32* [[TMP144]], i32* [[TMP145]]) #[[ATTR2]] 10503 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT61]] 10504 // CHECK9: omp_offload.cont61: 10505 // CHECK9-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 10506 // CHECK9-NEXT: [[CONV63:%.*]] = bitcast i64* [[N_CASTED62]] to i32* 10507 // CHECK9-NEXT: store i32 [[TMP179]], i32* [[CONV63]], align 4 10508 // CHECK9-NEXT: [[TMP180:%.*]] = load i64, i64* [[N_CASTED62]], align 8 10509 // CHECK9-NEXT: [[TMP181:%.*]] = load i32*, i32** [[A]], align 8 10510 // CHECK9-NEXT: [[TMP182:%.*]] = load i32*, i32** [[B]], align 8 10511 // CHECK9-NEXT: [[TMP183:%.*]] = load i32*, i32** [[C]], align 8 10512 // CHECK9-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 10513 // CHECK9-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i64* 10514 // CHECK9-NEXT: store i64 [[TMP180]], i64* [[TMP185]], align 8 10515 // CHECK9-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 10516 // CHECK9-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i64* 10517 // CHECK9-NEXT: store i64 [[TMP180]], i64* [[TMP187]], align 8 10518 // CHECK9-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 0 10519 // CHECK9-NEXT: store i8* null, i8** [[TMP188]], align 8 10520 // CHECK9-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 1 10521 // CHECK9-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to i32** 10522 // CHECK9-NEXT: store i32* [[TMP181]], i32** [[TMP190]], align 8 10523 // CHECK9-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 1 10524 // CHECK9-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to i32** 10525 // CHECK9-NEXT: store i32* [[TMP181]], i32** [[TMP192]], align 8 10526 // CHECK9-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 1 10527 // CHECK9-NEXT: store i8* null, i8** [[TMP193]], align 8 10528 // CHECK9-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 2 10529 // CHECK9-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to i32** 10530 // CHECK9-NEXT: store i32* [[TMP182]], i32** [[TMP195]], align 8 10531 // CHECK9-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 2 10532 // CHECK9-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to i32** 10533 // CHECK9-NEXT: store i32* [[TMP182]], i32** [[TMP197]], align 8 10534 // CHECK9-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 2 10535 // CHECK9-NEXT: store i8* null, i8** [[TMP198]], align 8 10536 // CHECK9-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 3 10537 // CHECK9-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to i32** 10538 // CHECK9-NEXT: store i32* [[TMP183]], i32** [[TMP200]], align 8 10539 // CHECK9-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 3 10540 // CHECK9-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to i32** 10541 // CHECK9-NEXT: store i32* [[TMP183]], i32** [[TMP202]], align 8 10542 // CHECK9-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 3 10543 // CHECK9-NEXT: store i8* null, i8** [[TMP203]], align 8 10544 // CHECK9-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 10545 // CHECK9-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 10546 // CHECK9-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 10547 // CHECK9-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_68]], align 4 10548 // CHECK9-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_68]], align 4 10549 // CHECK9-NEXT: [[SUB70:%.*]] = sub nsw i32 [[TMP207]], 0 10550 // CHECK9-NEXT: [[DIV71:%.*]] = sdiv i32 [[SUB70]], 1 10551 // CHECK9-NEXT: [[SUB72:%.*]] = sub nsw i32 [[DIV71]], 1 10552 // CHECK9-NEXT: store i32 [[SUB72]], i32* [[DOTCAPTURE_EXPR_69]], align 4 10553 // CHECK9-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_69]], align 4 10554 // CHECK9-NEXT: [[ADD73:%.*]] = add nsw i32 [[TMP208]], 1 10555 // CHECK9-NEXT: [[TMP209:%.*]] = zext i32 [[ADD73]] to i64 10556 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 10557 // CHECK9-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.48, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.49, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10558 // CHECK9-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 10559 // CHECK9-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED74:%.*]], label [[OMP_OFFLOAD_CONT75:%.*]] 10560 // CHECK9: omp_offload.failed74: 10561 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83(i64 [[TMP180]], i32* [[TMP181]], i32* [[TMP182]], i32* [[TMP183]]) #[[ATTR2]] 10562 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT75]] 10563 // CHECK9: omp_offload.cont75: 10564 // CHECK9-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 10565 // CHECK9-NEXT: [[CONV77:%.*]] = bitcast i64* [[CH_CASTED76]] to i32* 10566 // CHECK9-NEXT: store i32 [[TMP212]], i32* [[CONV77]], align 4 10567 // CHECK9-NEXT: [[TMP213:%.*]] = load i64, i64* [[CH_CASTED76]], align 8 10568 // CHECK9-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 10569 // CHECK9-NEXT: [[CONV79:%.*]] = bitcast i64* [[N_CASTED78]] to i32* 10570 // CHECK9-NEXT: store i32 [[TMP214]], i32* [[CONV79]], align 4 10571 // CHECK9-NEXT: [[TMP215:%.*]] = load i64, i64* [[N_CASTED78]], align 8 10572 // CHECK9-NEXT: [[TMP216:%.*]] = load i32*, i32** [[A]], align 8 10573 // CHECK9-NEXT: [[TMP217:%.*]] = load i32*, i32** [[B]], align 8 10574 // CHECK9-NEXT: [[TMP218:%.*]] = load i32*, i32** [[C]], align 8 10575 // CHECK9-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 10576 // CHECK9-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i64* 10577 // CHECK9-NEXT: store i64 [[TMP213]], i64* [[TMP220]], align 8 10578 // CHECK9-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 10579 // CHECK9-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i64* 10580 // CHECK9-NEXT: store i64 [[TMP213]], i64* [[TMP222]], align 8 10581 // CHECK9-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 0 10582 // CHECK9-NEXT: store i8* null, i8** [[TMP223]], align 8 10583 // CHECK9-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 1 10584 // CHECK9-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i64* 10585 // CHECK9-NEXT: store i64 [[TMP215]], i64* [[TMP225]], align 8 10586 // CHECK9-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 1 10587 // CHECK9-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i64* 10588 // CHECK9-NEXT: store i64 [[TMP215]], i64* [[TMP227]], align 8 10589 // CHECK9-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 1 10590 // CHECK9-NEXT: store i8* null, i8** [[TMP228]], align 8 10591 // CHECK9-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 2 10592 // CHECK9-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to i32** 10593 // CHECK9-NEXT: store i32* [[TMP216]], i32** [[TMP230]], align 8 10594 // CHECK9-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 2 10595 // CHECK9-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to i32** 10596 // CHECK9-NEXT: store i32* [[TMP216]], i32** [[TMP232]], align 8 10597 // CHECK9-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 2 10598 // CHECK9-NEXT: store i8* null, i8** [[TMP233]], align 8 10599 // CHECK9-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 3 10600 // CHECK9-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to i32** 10601 // CHECK9-NEXT: store i32* [[TMP217]], i32** [[TMP235]], align 8 10602 // CHECK9-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 3 10603 // CHECK9-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to i32** 10604 // CHECK9-NEXT: store i32* [[TMP217]], i32** [[TMP237]], align 8 10605 // CHECK9-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 3 10606 // CHECK9-NEXT: store i8* null, i8** [[TMP238]], align 8 10607 // CHECK9-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 4 10608 // CHECK9-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to i32** 10609 // CHECK9-NEXT: store i32* [[TMP218]], i32** [[TMP240]], align 8 10610 // CHECK9-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 4 10611 // CHECK9-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to i32** 10612 // CHECK9-NEXT: store i32* [[TMP218]], i32** [[TMP242]], align 8 10613 // CHECK9-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 4 10614 // CHECK9-NEXT: store i8* null, i8** [[TMP243]], align 8 10615 // CHECK9-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 10616 // CHECK9-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 10617 // CHECK9-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 10618 // CHECK9-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_84]], align 4 10619 // CHECK9-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_84]], align 4 10620 // CHECK9-NEXT: [[SUB86:%.*]] = sub nsw i32 [[TMP247]], 0 10621 // CHECK9-NEXT: [[DIV87:%.*]] = sdiv i32 [[SUB86]], 1 10622 // CHECK9-NEXT: [[SUB88:%.*]] = sub nsw i32 [[DIV87]], 1 10623 // CHECK9-NEXT: store i32 [[SUB88]], i32* [[DOTCAPTURE_EXPR_85]], align 4 10624 // CHECK9-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_85]], align 4 10625 // CHECK9-NEXT: [[ADD89:%.*]] = add nsw i32 [[TMP248]], 1 10626 // CHECK9-NEXT: [[TMP249:%.*]] = zext i32 [[ADD89]] to i64 10627 // CHECK9-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 10628 // CHECK9-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.52, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.53, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 10629 // CHECK9-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 10630 // CHECK9-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED90:%.*]], label [[OMP_OFFLOAD_CONT91:%.*]] 10631 // CHECK9: omp_offload.failed90: 10632 // CHECK9-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91(i64 [[TMP213]], i64 [[TMP215]], i32* [[TMP216]], i32* [[TMP217]], i32* [[TMP218]]) #[[ATTR2]] 10633 // CHECK9-NEXT: br label [[OMP_OFFLOAD_CONT91]] 10634 // CHECK9: omp_offload.cont91: 10635 // CHECK9-NEXT: ret i32 0 10636 // 10637 // 10638 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42 10639 // CHECK9-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 10640 // CHECK9-NEXT: entry: 10641 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 10642 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 10643 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 10644 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 10645 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 10646 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 10647 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 10648 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 10649 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 10650 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..26 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 10651 // CHECK9-NEXT: ret void 10652 // 10653 // 10654 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..26 10655 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 10656 // CHECK9-NEXT: entry: 10657 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 10658 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 10659 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 10660 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 10661 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 10662 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 10663 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 10664 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 10665 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 10666 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 10667 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 10668 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 10669 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 10670 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 10671 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 10672 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 10673 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 10674 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 10675 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 10676 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 10677 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 10678 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 10679 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 10680 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 10681 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 10682 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 10683 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 10684 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 10685 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10686 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 10687 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 10688 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 10689 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 10690 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 10691 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10692 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 10693 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 10694 // CHECK9: omp.precond.then: 10695 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 10696 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10697 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 10698 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 10699 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 10700 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10701 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 10702 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 10703 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10704 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10705 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 10706 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 10707 // CHECK9: cond.true: 10708 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10709 // CHECK9-NEXT: br label [[COND_END:%.*]] 10710 // CHECK9: cond.false: 10711 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10712 // CHECK9-NEXT: br label [[COND_END]] 10713 // CHECK9: cond.end: 10714 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 10715 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 10716 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 10717 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 10718 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 10719 // CHECK9: omp.inner.for.cond: 10720 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10721 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10722 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 10723 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 10724 // CHECK9: omp.inner.for.body: 10725 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 10726 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 10727 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10728 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 10729 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..27 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 10730 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 10731 // CHECK9: omp.inner.for.inc: 10732 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10733 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 10734 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 10735 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 10736 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 10737 // CHECK9: omp.inner.for.end: 10738 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 10739 // CHECK9: omp.loop.exit: 10740 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10741 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 10742 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 10743 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 10744 // CHECK9: omp.precond.end: 10745 // CHECK9-NEXT: ret void 10746 // 10747 // 10748 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..27 10749 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 10750 // CHECK9-NEXT: entry: 10751 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 10752 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 10753 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 10754 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 10755 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 10756 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 10757 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 10758 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 10759 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 10760 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 10761 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 10762 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 10763 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 10764 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 10765 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 10766 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 10767 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 10768 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 10769 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 10770 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 10771 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 10772 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 10773 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 10774 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 10775 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 10776 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 10777 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 10778 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 10779 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 10780 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 10781 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 10782 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 10783 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10784 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 10785 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 10786 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 10787 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 10788 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 10789 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10790 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 10791 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 10792 // CHECK9: omp.precond.then: 10793 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 10794 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10795 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 10796 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 10797 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 10798 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 10799 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 10800 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 10801 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 10802 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 10803 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 10804 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10805 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 10806 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 10807 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 10808 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10809 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 10810 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 10811 // CHECK9: cond.true: 10812 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10813 // CHECK9-NEXT: br label [[COND_END:%.*]] 10814 // CHECK9: cond.false: 10815 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 10816 // CHECK9-NEXT: br label [[COND_END]] 10817 // CHECK9: cond.end: 10818 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 10819 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 10820 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 10821 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 10822 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 10823 // CHECK9: omp.inner.for.cond: 10824 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10825 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 10826 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 10827 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 10828 // CHECK9: omp.inner.for.body: 10829 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10830 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 10831 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 10832 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 10833 // CHECK9-NEXT: [[TMP20:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10834 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[TMP20]], align 4 10835 // CHECK9-NEXT: [[TMP22:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* @[[GLOB3]], i32 [[TMP21]], i32 2) 10836 // CHECK9-NEXT: [[TMP23:%.*]] = icmp ne i32 [[TMP22]], 0 10837 // CHECK9-NEXT: br i1 [[TMP23]], label [[DOTCANCEL_EXIT:%.*]], label [[DOTCANCEL_CONTINUE:%.*]] 10838 // CHECK9: .cancel.exit: 10839 // CHECK9-NEXT: br label [[CANCEL_EXIT:%.*]] 10840 // CHECK9: .cancel.continue: 10841 // CHECK9-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP2]], align 8 10842 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4 10843 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP25]] to i64 10844 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM]] 10845 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 10846 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP3]], align 8 10847 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4 10848 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP28]] to i64 10849 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM7]] 10850 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 10851 // CHECK9-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 10852 // CHECK9-NEXT: [[TMP30:%.*]] = load i32*, i32** [[TMP1]], align 8 10853 // CHECK9-NEXT: [[TMP31:%.*]] = load i32, i32* [[I4]], align 4 10854 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP31]] to i64 10855 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i64 [[IDXPROM10]] 10856 // CHECK9-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 10857 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 10858 // CHECK9: omp.body.continue: 10859 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 10860 // CHECK9: omp.inner.for.inc: 10861 // CHECK9-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10862 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 10863 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 10864 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 10865 // CHECK9: omp.inner.for.end: 10866 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 10867 // CHECK9: omp.loop.exit: 10868 // CHECK9-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10869 // CHECK9-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 10870 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 10871 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 10872 // CHECK9: cancel.exit: 10873 // CHECK9-NEXT: [[TMP35:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10874 // CHECK9-NEXT: [[TMP36:%.*]] = load i32, i32* [[TMP35]], align 4 10875 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP36]]) 10876 // CHECK9-NEXT: br label [[CANCEL_CONT:%.*]] 10877 // CHECK9: omp.precond.end: 10878 // CHECK9-NEXT: br label [[CANCEL_CONT]] 10879 // CHECK9: cancel.cont: 10880 // CHECK9-NEXT: ret void 10881 // 10882 // 10883 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51 10884 // CHECK9-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 10885 // CHECK9-NEXT: entry: 10886 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 10887 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 10888 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 10889 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 10890 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 10891 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 10892 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 10893 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 10894 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 10895 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 10896 // CHECK9-NEXT: ret void 10897 // 10898 // 10899 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..30 10900 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 10901 // CHECK9-NEXT: entry: 10902 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 10903 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 10904 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 10905 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 10906 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 10907 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 10908 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 10909 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 10910 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 10911 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 10912 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 10913 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 10914 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 10915 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 10916 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 10917 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 10918 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 10919 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 10920 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 10921 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 10922 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 10923 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 10924 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 10925 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 10926 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 10927 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 10928 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 10929 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 10930 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10931 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 10932 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 10933 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 10934 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 10935 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 10936 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 10937 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 10938 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 10939 // CHECK9: omp.precond.then: 10940 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 10941 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10942 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 10943 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 10944 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 10945 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10946 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 10947 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 10948 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10949 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10950 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 10951 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 10952 // CHECK9: cond.true: 10953 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 10954 // CHECK9-NEXT: br label [[COND_END:%.*]] 10955 // CHECK9: cond.false: 10956 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10957 // CHECK9-NEXT: br label [[COND_END]] 10958 // CHECK9: cond.end: 10959 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 10960 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 10961 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 10962 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 10963 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 10964 // CHECK9: omp.inner.for.cond: 10965 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10966 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10967 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 10968 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 10969 // CHECK9: omp.inner.for.body: 10970 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 10971 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 10972 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 10973 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 10974 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 10975 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 10976 // CHECK9: omp.inner.for.inc: 10977 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 10978 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 10979 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 10980 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 10981 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 10982 // CHECK9: omp.inner.for.end: 10983 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 10984 // CHECK9: omp.loop.exit: 10985 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 10986 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 10987 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 10988 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 10989 // CHECK9: omp.precond.end: 10990 // CHECK9-NEXT: ret void 10991 // 10992 // 10993 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..31 10994 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 10995 // CHECK9-NEXT: entry: 10996 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 10997 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 10998 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 10999 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 11000 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11001 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11002 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11003 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11004 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11005 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11006 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11007 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11008 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11009 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 11010 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 11011 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11012 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11013 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 11014 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11015 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11016 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11017 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11018 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11019 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11020 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11021 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11022 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11023 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11024 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11025 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11026 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11027 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 11028 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11029 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11030 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11031 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11032 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11033 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11034 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11035 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11036 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11037 // CHECK9: omp.precond.then: 11038 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 11039 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11040 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 11041 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11042 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 11043 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11044 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 11045 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 11046 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 11047 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11048 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11049 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11050 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 11051 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11052 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11053 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11054 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 11055 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11056 // CHECK9: cond.true: 11057 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11058 // CHECK9-NEXT: br label [[COND_END:%.*]] 11059 // CHECK9: cond.false: 11060 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11061 // CHECK9-NEXT: br label [[COND_END]] 11062 // CHECK9: cond.end: 11063 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 11064 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 11065 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 11066 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 11067 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11068 // CHECK9: omp.inner.for.cond: 11069 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11070 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11071 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 11072 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11073 // CHECK9: omp.inner.for.body: 11074 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11075 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 11076 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 11077 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 11078 // CHECK9-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 11079 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 11080 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 11081 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 11082 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 11083 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 11084 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 11085 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 11086 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 11087 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 11088 // CHECK9-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 11089 // CHECK9-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 11090 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 11091 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 11092 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 11093 // CHECK9-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 11094 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 11095 // CHECK9: omp.body.continue: 11096 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11097 // CHECK9: omp.inner.for.inc: 11098 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11099 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 11100 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 11101 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11102 // CHECK9: omp.inner.for.end: 11103 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11104 // CHECK9: omp.loop.exit: 11105 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11106 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 11107 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 11108 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11109 // CHECK9: omp.precond.end: 11110 // CHECK9-NEXT: ret void 11111 // 11112 // 11113 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59 11114 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 11115 // CHECK9-NEXT: entry: 11116 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 11117 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 11118 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 11119 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 11120 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 11121 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 11122 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 11123 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 11124 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 11125 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 11126 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 11127 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 11128 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 11129 // CHECK9-NEXT: ret void 11130 // 11131 // 11132 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..34 11133 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11134 // CHECK9-NEXT: entry: 11135 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11136 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11137 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 11138 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11139 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11140 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11141 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11142 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11143 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11144 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11145 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11146 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11147 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 11148 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 11149 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11150 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11151 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 11152 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11153 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11154 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 11155 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11156 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11157 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11158 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11159 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 11160 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11161 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11162 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11163 // CHECK9-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11164 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 11165 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 11166 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11167 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 11168 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11169 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11170 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11171 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11172 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11173 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 11174 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11175 // CHECK9: omp.precond.then: 11176 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 11177 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11178 // CHECK9-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 11179 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11180 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11181 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 11182 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11183 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 11184 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 11185 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11186 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11187 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 11188 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11189 // CHECK9: cond.true: 11190 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11191 // CHECK9-NEXT: br label [[COND_END:%.*]] 11192 // CHECK9: cond.false: 11193 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11194 // CHECK9-NEXT: br label [[COND_END]] 11195 // CHECK9: cond.end: 11196 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 11197 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 11198 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11199 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 11200 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11201 // CHECK9: omp.inner.for.cond: 11202 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11203 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11204 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 11205 // CHECK9-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 11206 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11207 // CHECK9: omp.inner.for.body: 11208 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11209 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 11210 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11211 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 11212 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]]) 11213 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11214 // CHECK9: omp.inner.for.inc: 11215 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11216 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11217 // CHECK9-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 11218 // CHECK9-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 11219 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11220 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11221 // CHECK9-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 11222 // CHECK9-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 11223 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11224 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11225 // CHECK9-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 11226 // CHECK9-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 11227 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11228 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11229 // CHECK9-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 11230 // CHECK9-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 11231 // CHECK9: cond.true10: 11232 // CHECK9-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11233 // CHECK9-NEXT: br label [[COND_END12:%.*]] 11234 // CHECK9: cond.false11: 11235 // CHECK9-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11236 // CHECK9-NEXT: br label [[COND_END12]] 11237 // CHECK9: cond.end12: 11238 // CHECK9-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 11239 // CHECK9-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 11240 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11241 // CHECK9-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 11242 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11243 // CHECK9: omp.inner.for.end: 11244 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11245 // CHECK9: omp.loop.exit: 11246 // CHECK9-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11247 // CHECK9-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 11248 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 11249 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11250 // CHECK9: omp.precond.end: 11251 // CHECK9-NEXT: ret void 11252 // 11253 // 11254 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..35 11255 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11256 // CHECK9-NEXT: entry: 11257 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11258 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11259 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 11260 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 11261 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11262 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11263 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11264 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11265 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11266 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11267 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11268 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11269 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11270 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 11271 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 11272 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11273 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11274 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 11275 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11276 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11277 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11278 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11279 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11280 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11281 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11282 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11283 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11284 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11285 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11286 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11287 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11288 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 11289 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11290 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11291 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11292 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11293 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11294 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11295 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11296 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11297 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11298 // CHECK9: omp.precond.then: 11299 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 11300 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11301 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 11302 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11303 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 11304 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11305 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 11306 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 11307 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 11308 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11309 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11310 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11311 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 11312 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11313 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11314 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11315 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 11316 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11317 // CHECK9: cond.true: 11318 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11319 // CHECK9-NEXT: br label [[COND_END:%.*]] 11320 // CHECK9: cond.false: 11321 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11322 // CHECK9-NEXT: br label [[COND_END]] 11323 // CHECK9: cond.end: 11324 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 11325 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 11326 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 11327 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 11328 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11329 // CHECK9: omp.inner.for.cond: 11330 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11331 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11332 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 11333 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11334 // CHECK9: omp.inner.for.body: 11335 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11336 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 11337 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 11338 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 11339 // CHECK9-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 11340 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 11341 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 11342 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 11343 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 11344 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 11345 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 11346 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 11347 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 11348 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 11349 // CHECK9-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 11350 // CHECK9-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 11351 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 11352 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 11353 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 11354 // CHECK9-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 11355 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 11356 // CHECK9: omp.body.continue: 11357 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11358 // CHECK9: omp.inner.for.inc: 11359 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11360 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 11361 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 11362 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11363 // CHECK9: omp.inner.for.end: 11364 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11365 // CHECK9: omp.loop.exit: 11366 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11367 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 11368 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 11369 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11370 // CHECK9: omp.precond.end: 11371 // CHECK9-NEXT: ret void 11372 // 11373 // 11374 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67 11375 // CHECK9-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 11376 // CHECK9-NEXT: entry: 11377 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 11378 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 11379 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 11380 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 11381 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 11382 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 11383 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 11384 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 11385 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 11386 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..38 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 11387 // CHECK9-NEXT: ret void 11388 // 11389 // 11390 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..38 11391 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11392 // CHECK9-NEXT: entry: 11393 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11394 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11395 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11396 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11397 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11398 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11399 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11400 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11401 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11402 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11403 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11404 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 11405 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 11406 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11407 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11408 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 11409 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11410 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11411 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11412 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11413 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11414 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11415 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11416 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11417 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11418 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11419 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11420 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 11421 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11422 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11423 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11424 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11425 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11426 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11427 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11428 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11429 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11430 // CHECK9: omp.precond.then: 11431 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 11432 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11433 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 11434 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11435 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11436 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11437 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 11438 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11439 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11440 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11441 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 11442 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11443 // CHECK9: cond.true: 11444 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11445 // CHECK9-NEXT: br label [[COND_END:%.*]] 11446 // CHECK9: cond.false: 11447 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11448 // CHECK9-NEXT: br label [[COND_END]] 11449 // CHECK9: cond.end: 11450 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 11451 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 11452 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11453 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 11454 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11455 // CHECK9: omp.inner.for.cond: 11456 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11457 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11458 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 11459 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11460 // CHECK9: omp.inner.for.body: 11461 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11462 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 11463 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11464 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 11465 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 11466 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11467 // CHECK9: omp.inner.for.inc: 11468 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11469 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11470 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 11471 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 11472 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11473 // CHECK9: omp.inner.for.end: 11474 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11475 // CHECK9: omp.loop.exit: 11476 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11477 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 11478 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 11479 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11480 // CHECK9: omp.precond.end: 11481 // CHECK9-NEXT: ret void 11482 // 11483 // 11484 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..39 11485 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11486 // CHECK9-NEXT: entry: 11487 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11488 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11489 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 11490 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 11491 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11492 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11493 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11494 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11495 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11496 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11497 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11498 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11499 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11500 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 11501 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 11502 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11503 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11504 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 11505 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11506 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11507 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11508 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11509 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11510 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11511 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11512 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11513 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11514 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11515 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11516 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11517 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11518 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 11519 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11520 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11521 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11522 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11523 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11524 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11525 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11526 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11527 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11528 // CHECK9: omp.precond.then: 11529 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 11530 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11531 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 11532 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11533 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 11534 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11535 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 11536 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 11537 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 11538 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11539 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11540 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11541 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 11542 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11543 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11544 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11545 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 11546 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11547 // CHECK9: cond.true: 11548 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11549 // CHECK9-NEXT: br label [[COND_END:%.*]] 11550 // CHECK9: cond.false: 11551 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11552 // CHECK9-NEXT: br label [[COND_END]] 11553 // CHECK9: cond.end: 11554 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 11555 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 11556 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 11557 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 11558 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11559 // CHECK9: omp.inner.for.cond: 11560 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11561 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11562 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 11563 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11564 // CHECK9: omp.inner.for.body: 11565 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11566 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 11567 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 11568 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 11569 // CHECK9-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 11570 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 11571 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 11572 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 11573 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 11574 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 11575 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 11576 // CHECK9-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 11577 // CHECK9-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 11578 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 11579 // CHECK9-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 11580 // CHECK9-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 11581 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 11582 // CHECK9-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 11583 // CHECK9-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 11584 // CHECK9-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 11585 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 11586 // CHECK9: omp.body.continue: 11587 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11588 // CHECK9: omp.inner.for.inc: 11589 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11590 // CHECK9-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 11591 // CHECK9-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 11592 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11593 // CHECK9: omp.inner.for.end: 11594 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11595 // CHECK9: omp.loop.exit: 11596 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11597 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 11598 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 11599 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11600 // CHECK9: omp.precond.end: 11601 // CHECK9-NEXT: ret void 11602 // 11603 // 11604 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75 11605 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 11606 // CHECK9-NEXT: entry: 11607 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 11608 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 11609 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 11610 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 11611 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 11612 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 11613 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 11614 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 11615 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 11616 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 11617 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 11618 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 11619 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..42 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 11620 // CHECK9-NEXT: ret void 11621 // 11622 // 11623 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..42 11624 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11625 // CHECK9-NEXT: entry: 11626 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11627 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11628 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 11629 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11630 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11631 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11632 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11633 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11634 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11635 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11636 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11637 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 11638 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11639 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 11640 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 11641 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11642 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11643 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 11644 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 11645 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11646 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11647 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 11648 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11649 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11650 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11651 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11652 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 11653 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11654 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11655 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11656 // CHECK9-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11657 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 11658 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 11659 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 11660 // CHECK9-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11661 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11662 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 11663 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11664 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 11665 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 11666 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11667 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11668 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 11669 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11670 // CHECK9: omp.precond.then: 11671 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 11672 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 11673 // CHECK9-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 11674 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11675 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11676 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11677 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 11678 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11679 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11680 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 11681 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 11682 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11683 // CHECK9: cond.true: 11684 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 11685 // CHECK9-NEXT: br label [[COND_END:%.*]] 11686 // CHECK9: cond.false: 11687 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11688 // CHECK9-NEXT: br label [[COND_END]] 11689 // CHECK9: cond.end: 11690 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 11691 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 11692 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11693 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 11694 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11695 // CHECK9: omp.inner.for.cond: 11696 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11697 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11698 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 11699 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11700 // CHECK9: omp.inner.for.body: 11701 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11702 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 11703 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11704 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 11705 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11706 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 11707 // CHECK9-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 11708 // CHECK9-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 11709 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**, i64)* @.omp_outlined..43 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i64 [[TMP24]]) 11710 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11711 // CHECK9: omp.inner.for.inc: 11712 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11713 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11714 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 11715 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 11716 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11717 // CHECK9: omp.inner.for.end: 11718 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11719 // CHECK9: omp.loop.exit: 11720 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11721 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 11722 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 11723 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11724 // CHECK9: omp.precond.end: 11725 // CHECK9-NEXT: ret void 11726 // 11727 // 11728 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..43 11729 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 11730 // CHECK9-NEXT: entry: 11731 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11732 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11733 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 11734 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 11735 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11736 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11737 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11738 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11739 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 11740 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11741 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11742 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11743 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 11744 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11745 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 11746 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 11747 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11748 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11749 // CHECK9-NEXT: [[I6:%.*]] = alloca i32, align 4 11750 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11751 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11752 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11753 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11754 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11755 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11756 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11757 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11758 // CHECK9-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 11759 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11760 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11761 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11762 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11763 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 11764 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11765 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11766 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11767 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11768 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11769 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 11770 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 11771 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11772 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11773 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11774 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11775 // CHECK9: omp.precond.then: 11776 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 11777 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 11778 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 11779 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 11780 // CHECK9-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 11781 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11782 // CHECK9-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 11783 // CHECK9-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 11784 // CHECK9-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 11785 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11786 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11787 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 11788 // CHECK9-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11789 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 11790 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 11791 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 11792 // CHECK9: omp.dispatch.cond: 11793 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11794 // CHECK9-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 11795 // CHECK9-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11796 // CHECK9-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 11797 // CHECK9-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11798 // CHECK9: cond.true: 11799 // CHECK9-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 11800 // CHECK9-NEXT: br label [[COND_END:%.*]] 11801 // CHECK9: cond.false: 11802 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11803 // CHECK9-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 11804 // CHECK9-NEXT: br label [[COND_END]] 11805 // CHECK9: cond.end: 11806 // CHECK9-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 11807 // CHECK9-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 11808 // CHECK9-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 11809 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 11810 // CHECK9-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 11811 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11812 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11813 // CHECK9-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 11814 // CHECK9-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 11815 // CHECK9: omp.dispatch.body: 11816 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11817 // CHECK9: omp.inner.for.cond: 11818 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11819 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11820 // CHECK9-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 11821 // CHECK9-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11822 // CHECK9: omp.inner.for.body: 11823 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11824 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 11825 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 11826 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 11827 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP2]], align 8 11828 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 11829 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 11830 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM]] 11831 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 11832 // CHECK9-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP3]], align 8 11833 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 11834 // CHECK9-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 11835 // CHECK9-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM13]] 11836 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[ARRAYIDX14]], align 4 11837 // CHECK9-NEXT: [[ADD15:%.*]] = add nsw i32 [[TMP25]], [[TMP28]] 11838 // CHECK9-NEXT: [[TMP29:%.*]] = load i32*, i32** [[TMP1]], align 8 11839 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 11840 // CHECK9-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 11841 // CHECK9-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds i32, i32* [[TMP29]], i64 [[IDXPROM16]] 11842 // CHECK9-NEXT: store i32 [[ADD15]], i32* [[ARRAYIDX17]], align 4 11843 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 11844 // CHECK9: omp.body.continue: 11845 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11846 // CHECK9: omp.inner.for.inc: 11847 // CHECK9-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11848 // CHECK9-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP31]], 1 11849 // CHECK9-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 11850 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11851 // CHECK9: omp.inner.for.end: 11852 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 11853 // CHECK9: omp.dispatch.inc: 11854 // CHECK9-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 11855 // CHECK9-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11856 // CHECK9-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 11857 // CHECK9-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 11858 // CHECK9-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 11859 // CHECK9-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11860 // CHECK9-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 11861 // CHECK9-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 11862 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 11863 // CHECK9: omp.dispatch.end: 11864 // CHECK9-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11865 // CHECK9-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 11866 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 11867 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11868 // CHECK9: omp.precond.end: 11869 // CHECK9-NEXT: ret void 11870 // 11871 // 11872 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83 11873 // CHECK9-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 11874 // CHECK9-NEXT: entry: 11875 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 11876 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 11877 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 11878 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 11879 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 11880 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 11881 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 11882 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 11883 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 11884 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..46 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 11885 // CHECK9-NEXT: ret void 11886 // 11887 // 11888 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..46 11889 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11890 // CHECK9-NEXT: entry: 11891 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11892 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11893 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11894 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11895 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11896 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11897 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11898 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11899 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11900 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11901 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11902 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 11903 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 11904 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 11905 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 11906 // CHECK9-NEXT: [[I3:%.*]] = alloca i32, align 4 11907 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 11908 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 11909 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 11910 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 11911 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 11912 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 11913 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 11914 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 11915 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 11916 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 11917 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 11918 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 11919 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11920 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 11921 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 11922 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 11923 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 11924 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 11925 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 11926 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 11927 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 11928 // CHECK9: omp.precond.then: 11929 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 11930 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11931 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 11932 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 11933 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 11934 // CHECK9-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11935 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 11936 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 11937 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11938 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11939 // CHECK9-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 11940 // CHECK9-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 11941 // CHECK9: cond.true: 11942 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 11943 // CHECK9-NEXT: br label [[COND_END:%.*]] 11944 // CHECK9: cond.false: 11945 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11946 // CHECK9-NEXT: br label [[COND_END]] 11947 // CHECK9: cond.end: 11948 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 11949 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 11950 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11951 // CHECK9-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 11952 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 11953 // CHECK9: omp.inner.for.cond: 11954 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11955 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11956 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 11957 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 11958 // CHECK9: omp.inner.for.body: 11959 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 11960 // CHECK9-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 11961 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 11962 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 11963 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..47 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 11964 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 11965 // CHECK9: omp.inner.for.inc: 11966 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 11967 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 11968 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 11969 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 11970 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 11971 // CHECK9: omp.inner.for.end: 11972 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 11973 // CHECK9: omp.loop.exit: 11974 // CHECK9-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 11975 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 11976 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 11977 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 11978 // CHECK9: omp.precond.end: 11979 // CHECK9-NEXT: ret void 11980 // 11981 // 11982 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..47 11983 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 11984 // CHECK9-NEXT: entry: 11985 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 11986 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 11987 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 11988 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 11989 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 11990 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 11991 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 11992 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 11993 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 11994 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 11995 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 11996 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 11997 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 11998 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 11999 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 12000 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 12001 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 12002 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 12003 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 12004 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 12005 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 12006 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 12007 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 12008 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 12009 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 12010 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 12011 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 12012 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 12013 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 12014 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 12015 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 12016 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 12017 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12018 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 12019 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 12020 // CHECK9-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 12021 // CHECK9-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 12022 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 12023 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12024 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 12025 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 12026 // CHECK9: omp.precond.then: 12027 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 12028 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12029 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 12030 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 12031 // CHECK9-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 12032 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 12033 // CHECK9-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 12034 // CHECK9-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 12035 // CHECK9-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 12036 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 12037 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 12038 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 12039 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 12040 // CHECK9-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12041 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 12042 // CHECK9-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 12043 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 12044 // CHECK9: omp.dispatch.cond: 12045 // CHECK9-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12046 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 12047 // CHECK9-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 12048 // CHECK9-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 12049 // CHECK9-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 12050 // CHECK9: omp.dispatch.body: 12051 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 12052 // CHECK9-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 12053 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 12054 // CHECK9: omp.inner.for.cond: 12055 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 12056 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !24 12057 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 12058 // CHECK9-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 12059 // CHECK9: omp.inner.for.body: 12060 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 12061 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 12062 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 12063 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !24 12064 // CHECK9-NEXT: [[TMP21:%.*]] = load i32*, i32** [[TMP2]], align 8, !llvm.access.group !24 12065 // CHECK9-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 12066 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 12067 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP21]], i64 [[IDXPROM]] 12068 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !24 12069 // CHECK9-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP3]], align 8, !llvm.access.group !24 12070 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 12071 // CHECK9-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 12072 // CHECK9-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM6]] 12073 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX7]], align 4, !llvm.access.group !24 12074 // CHECK9-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP23]], [[TMP26]] 12075 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP1]], align 8, !llvm.access.group !24 12076 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 12077 // CHECK9-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 12078 // CHECK9-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM9]] 12079 // CHECK9-NEXT: store i32 [[ADD8]], i32* [[ARRAYIDX10]], align 4, !llvm.access.group !24 12080 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 12081 // CHECK9: omp.body.continue: 12082 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 12083 // CHECK9: omp.inner.for.inc: 12084 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 12085 // CHECK9-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP29]], 1 12086 // CHECK9-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 12087 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP25:![0-9]+]] 12088 // CHECK9: omp.inner.for.end: 12089 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 12090 // CHECK9: omp.dispatch.inc: 12091 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 12092 // CHECK9: omp.dispatch.end: 12093 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 12094 // CHECK9: omp.precond.end: 12095 // CHECK9-NEXT: ret void 12096 // 12097 // 12098 // CHECK9-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91 12099 // CHECK9-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 12100 // CHECK9-NEXT: entry: 12101 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 12102 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 12103 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 12104 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 12105 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 12106 // CHECK9-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 12107 // CHECK9-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 12108 // CHECK9-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 12109 // CHECK9-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 12110 // CHECK9-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 12111 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 12112 // CHECK9-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 12113 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..50 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 12114 // CHECK9-NEXT: ret void 12115 // 12116 // 12117 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..50 12118 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 12119 // CHECK9-NEXT: entry: 12120 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 12121 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 12122 // CHECK9-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 12123 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 12124 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 12125 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 12126 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 12127 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 12128 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 12129 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 12130 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 12131 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 12132 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 12133 // CHECK9-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 12134 // CHECK9-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 12135 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 12136 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 12137 // CHECK9-NEXT: [[I4:%.*]] = alloca i32, align 4 12138 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 12139 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 12140 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 12141 // CHECK9-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 12142 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 12143 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 12144 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 12145 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 12146 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 12147 // CHECK9-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 12148 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 12149 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 12150 // CHECK9-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 12151 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 12152 // CHECK9-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 12153 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 12154 // CHECK9-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 12155 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12156 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 12157 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 12158 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 12159 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 12160 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 12161 // CHECK9-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12162 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 12163 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 12164 // CHECK9: omp.precond.then: 12165 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 12166 // CHECK9-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 12167 // CHECK9-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 12168 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 12169 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 12170 // CHECK9-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12171 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 12172 // CHECK9-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 12173 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12174 // CHECK9-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 12175 // CHECK9-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 12176 // CHECK9-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 12177 // CHECK9: cond.true: 12178 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 12179 // CHECK9-NEXT: br label [[COND_END:%.*]] 12180 // CHECK9: cond.false: 12181 // CHECK9-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12182 // CHECK9-NEXT: br label [[COND_END]] 12183 // CHECK9: cond.end: 12184 // CHECK9-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 12185 // CHECK9-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 12186 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 12187 // CHECK9-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 12188 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 12189 // CHECK9: omp.inner.for.cond: 12190 // CHECK9-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 12191 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12192 // CHECK9-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 12193 // CHECK9-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 12194 // CHECK9: omp.inner.for.body: 12195 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 12196 // CHECK9-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 12197 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12198 // CHECK9-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 12199 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12200 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 12201 // CHECK9-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 12202 // CHECK9-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 12203 // CHECK9-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**, i64)* @.omp_outlined..51 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i64 [[TMP24]]) 12204 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 12205 // CHECK9: omp.inner.for.inc: 12206 // CHECK9-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 12207 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 12208 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 12209 // CHECK9-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 12210 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]] 12211 // CHECK9: omp.inner.for.end: 12212 // CHECK9-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 12213 // CHECK9: omp.loop.exit: 12214 // CHECK9-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12215 // CHECK9-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 12216 // CHECK9-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 12217 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 12218 // CHECK9: omp.precond.end: 12219 // CHECK9-NEXT: ret void 12220 // 12221 // 12222 // CHECK9-LABEL: define {{[^@]+}}@.omp_outlined..51 12223 // CHECK9-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 12224 // CHECK9-NEXT: entry: 12225 // CHECK9-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 12226 // CHECK9-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 12227 // CHECK9-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 12228 // CHECK9-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 12229 // CHECK9-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 12230 // CHECK9-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 12231 // CHECK9-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 12232 // CHECK9-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 12233 // CHECK9-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 12234 // CHECK9-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 12235 // CHECK9-NEXT: [[TMP:%.*]] = alloca i32, align 4 12236 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 12237 // CHECK9-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 12238 // CHECK9-NEXT: [[I:%.*]] = alloca i32, align 4 12239 // CHECK9-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 12240 // CHECK9-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 12241 // CHECK9-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 12242 // CHECK9-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 12243 // CHECK9-NEXT: [[I6:%.*]] = alloca i32, align 4 12244 // CHECK9-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 12245 // CHECK9-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 12246 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 12247 // CHECK9-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 12248 // CHECK9-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 12249 // CHECK9-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 12250 // CHECK9-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 12251 // CHECK9-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 12252 // CHECK9-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 12253 // CHECK9-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 12254 // CHECK9-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 12255 // CHECK9-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 12256 // CHECK9-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 12257 // CHECK9-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 12258 // CHECK9-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 12259 // CHECK9-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 12260 // CHECK9-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12261 // CHECK9-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 12262 // CHECK9-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 12263 // CHECK9-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 12264 // CHECK9-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 12265 // CHECK9-NEXT: store i32 0, i32* [[I]], align 4 12266 // CHECK9-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12267 // CHECK9-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 12268 // CHECK9-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 12269 // CHECK9: omp.precond.then: 12270 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 12271 // CHECK9-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 12272 // CHECK9-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 12273 // CHECK9-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 12274 // CHECK9-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 12275 // CHECK9-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 12276 // CHECK9-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 12277 // CHECK9-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 12278 // CHECK9-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 12279 // CHECK9-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 12280 // CHECK9-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 12281 // CHECK9-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 12282 // CHECK9-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 12283 // CHECK9-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 12284 // CHECK9-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12285 // CHECK9-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 12286 // CHECK9-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 12287 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 12288 // CHECK9: omp.dispatch.cond: 12289 // CHECK9-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12290 // CHECK9-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 12291 // CHECK9-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 12292 // CHECK9-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 12293 // CHECK9-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 12294 // CHECK9: omp.dispatch.body: 12295 // CHECK9-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 12296 // CHECK9-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 12297 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 12298 // CHECK9: omp.inner.for.cond: 12299 // CHECK9-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 12300 // CHECK9-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !27 12301 // CHECK9-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 12302 // CHECK9-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 12303 // CHECK9: omp.inner.for.body: 12304 // CHECK9-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 12305 // CHECK9-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 12306 // CHECK9-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 12307 // CHECK9-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !27 12308 // CHECK9-NEXT: [[TMP22:%.*]] = load i32*, i32** [[TMP2]], align 8, !llvm.access.group !27 12309 // CHECK9-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 12310 // CHECK9-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 12311 // CHECK9-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP22]], i64 [[IDXPROM]] 12312 // CHECK9-NEXT: [[TMP24:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !27 12313 // CHECK9-NEXT: [[TMP25:%.*]] = load i32*, i32** [[TMP3]], align 8, !llvm.access.group !27 12314 // CHECK9-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 12315 // CHECK9-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 12316 // CHECK9-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds i32, i32* [[TMP25]], i64 [[IDXPROM8]] 12317 // CHECK9-NEXT: [[TMP27:%.*]] = load i32, i32* [[ARRAYIDX9]], align 4, !llvm.access.group !27 12318 // CHECK9-NEXT: [[ADD10:%.*]] = add nsw i32 [[TMP24]], [[TMP27]] 12319 // CHECK9-NEXT: [[TMP28:%.*]] = load i32*, i32** [[TMP1]], align 8, !llvm.access.group !27 12320 // CHECK9-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 12321 // CHECK9-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 12322 // CHECK9-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds i32, i32* [[TMP28]], i64 [[IDXPROM11]] 12323 // CHECK9-NEXT: store i32 [[ADD10]], i32* [[ARRAYIDX12]], align 4, !llvm.access.group !27 12324 // CHECK9-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 12325 // CHECK9: omp.body.continue: 12326 // CHECK9-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 12327 // CHECK9: omp.inner.for.inc: 12328 // CHECK9-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 12329 // CHECK9-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP30]], 1 12330 // CHECK9-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 12331 // CHECK9-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP28:![0-9]+]] 12332 // CHECK9: omp.inner.for.end: 12333 // CHECK9-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 12334 // CHECK9: omp.dispatch.inc: 12335 // CHECK9-NEXT: br label [[OMP_DISPATCH_COND]] 12336 // CHECK9: omp.dispatch.end: 12337 // CHECK9-NEXT: br label [[OMP_PRECOND_END]] 12338 // CHECK9: omp.precond.end: 12339 // CHECK9-NEXT: ret void 12340 // 12341 // 12342 // CHECK9-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 12343 // CHECK9-SAME: () #[[ATTR4:[0-9]+]] { 12344 // CHECK9-NEXT: entry: 12345 // CHECK9-NEXT: call void @__tgt_register_requires(i64 1) 12346 // CHECK9-NEXT: ret void 12347 // 12348 // 12349 // CHECK10-LABEL: define {{[^@]+}}@main 12350 // CHECK10-SAME: () #[[ATTR0:[0-9]+]] { 12351 // CHECK10-NEXT: entry: 12352 // CHECK10-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 12353 // CHECK10-NEXT: [[A:%.*]] = alloca double*, align 8 12354 // CHECK10-NEXT: [[B:%.*]] = alloca double*, align 8 12355 // CHECK10-NEXT: [[C:%.*]] = alloca double*, align 8 12356 // CHECK10-NEXT: [[N:%.*]] = alloca i32, align 4 12357 // CHECK10-NEXT: [[CH:%.*]] = alloca i32, align 4 12358 // CHECK10-NEXT: [[N_CASTED:%.*]] = alloca i64, align 8 12359 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 8 12360 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 8 12361 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 8 12362 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 12363 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 12364 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 12365 // CHECK10-NEXT: [[N_CASTED3:%.*]] = alloca i64, align 8 12366 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS5:%.*]] = alloca [4 x i8*], align 8 12367 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS6:%.*]] = alloca [4 x i8*], align 8 12368 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS7:%.*]] = alloca [4 x i8*], align 8 12369 // CHECK10-NEXT: [[_TMP8:%.*]] = alloca i32, align 4 12370 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 12371 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_10:%.*]] = alloca i32, align 4 12372 // CHECK10-NEXT: [[CH_CASTED:%.*]] = alloca i64, align 8 12373 // CHECK10-NEXT: [[N_CASTED18:%.*]] = alloca i64, align 8 12374 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS20:%.*]] = alloca [5 x i8*], align 8 12375 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS21:%.*]] = alloca [5 x i8*], align 8 12376 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS22:%.*]] = alloca [5 x i8*], align 8 12377 // CHECK10-NEXT: [[_TMP23:%.*]] = alloca i32, align 4 12378 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_24:%.*]] = alloca i32, align 4 12379 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_25:%.*]] = alloca i32, align 4 12380 // CHECK10-NEXT: [[N_CASTED32:%.*]] = alloca i64, align 8 12381 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS34:%.*]] = alloca [4 x i8*], align 8 12382 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS35:%.*]] = alloca [4 x i8*], align 8 12383 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS36:%.*]] = alloca [4 x i8*], align 8 12384 // CHECK10-NEXT: [[_TMP37:%.*]] = alloca i32, align 4 12385 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_38:%.*]] = alloca i32, align 4 12386 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_39:%.*]] = alloca i32, align 4 12387 // CHECK10-NEXT: [[CH_CASTED46:%.*]] = alloca i64, align 8 12388 // CHECK10-NEXT: [[N_CASTED48:%.*]] = alloca i64, align 8 12389 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS50:%.*]] = alloca [5 x i8*], align 8 12390 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS51:%.*]] = alloca [5 x i8*], align 8 12391 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS52:%.*]] = alloca [5 x i8*], align 8 12392 // CHECK10-NEXT: [[_TMP53:%.*]] = alloca i32, align 4 12393 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_54:%.*]] = alloca i32, align 4 12394 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_55:%.*]] = alloca i32, align 4 12395 // CHECK10-NEXT: [[N_CASTED62:%.*]] = alloca i64, align 8 12396 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS64:%.*]] = alloca [4 x i8*], align 8 12397 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS65:%.*]] = alloca [4 x i8*], align 8 12398 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS66:%.*]] = alloca [4 x i8*], align 8 12399 // CHECK10-NEXT: [[_TMP67:%.*]] = alloca i32, align 4 12400 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_68:%.*]] = alloca i32, align 4 12401 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_69:%.*]] = alloca i32, align 4 12402 // CHECK10-NEXT: [[CH_CASTED76:%.*]] = alloca i64, align 8 12403 // CHECK10-NEXT: [[N_CASTED78:%.*]] = alloca i64, align 8 12404 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS80:%.*]] = alloca [5 x i8*], align 8 12405 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS81:%.*]] = alloca [5 x i8*], align 8 12406 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS82:%.*]] = alloca [5 x i8*], align 8 12407 // CHECK10-NEXT: [[_TMP83:%.*]] = alloca i32, align 4 12408 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_84:%.*]] = alloca i32, align 4 12409 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_85:%.*]] = alloca i32, align 4 12410 // CHECK10-NEXT: store i32 0, i32* [[RETVAL]], align 4 12411 // CHECK10-NEXT: store i32 10000, i32* [[N]], align 4 12412 // CHECK10-NEXT: store i32 100, i32* [[CH]], align 4 12413 // CHECK10-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 12414 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_CASTED]] to i32* 12415 // CHECK10-NEXT: store i32 [[TMP0]], i32* [[CONV]], align 4 12416 // CHECK10-NEXT: [[TMP1:%.*]] = load i64, i64* [[N_CASTED]], align 8 12417 // CHECK10-NEXT: [[TMP2:%.*]] = load double*, double** [[A]], align 8 12418 // CHECK10-NEXT: [[TMP3:%.*]] = load double*, double** [[B]], align 8 12419 // CHECK10-NEXT: [[TMP4:%.*]] = load double*, double** [[C]], align 8 12420 // CHECK10-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 12421 // CHECK10-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i64* 12422 // CHECK10-NEXT: store i64 [[TMP1]], i64* [[TMP6]], align 8 12423 // CHECK10-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 12424 // CHECK10-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i64* 12425 // CHECK10-NEXT: store i64 [[TMP1]], i64* [[TMP8]], align 8 12426 // CHECK10-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0 12427 // CHECK10-NEXT: store i8* null, i8** [[TMP9]], align 8 12428 // CHECK10-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 12429 // CHECK10-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to double** 12430 // CHECK10-NEXT: store double* [[TMP2]], double** [[TMP11]], align 8 12431 // CHECK10-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 12432 // CHECK10-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to double** 12433 // CHECK10-NEXT: store double* [[TMP2]], double** [[TMP13]], align 8 12434 // CHECK10-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 1 12435 // CHECK10-NEXT: store i8* null, i8** [[TMP14]], align 8 12436 // CHECK10-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 12437 // CHECK10-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to double** 12438 // CHECK10-NEXT: store double* [[TMP3]], double** [[TMP16]], align 8 12439 // CHECK10-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 12440 // CHECK10-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to double** 12441 // CHECK10-NEXT: store double* [[TMP3]], double** [[TMP18]], align 8 12442 // CHECK10-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 2 12443 // CHECK10-NEXT: store i8* null, i8** [[TMP19]], align 8 12444 // CHECK10-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 12445 // CHECK10-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to double** 12446 // CHECK10-NEXT: store double* [[TMP4]], double** [[TMP21]], align 8 12447 // CHECK10-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 12448 // CHECK10-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to double** 12449 // CHECK10-NEXT: store double* [[TMP4]], double** [[TMP23]], align 8 12450 // CHECK10-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 3 12451 // CHECK10-NEXT: store i8* null, i8** [[TMP24]], align 8 12452 // CHECK10-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 12453 // CHECK10-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 12454 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 12455 // CHECK10-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 12456 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12457 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 12458 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 12459 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 12460 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 12461 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12462 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 12463 // CHECK10-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 12464 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3:[0-9]+]], i64 -1, i64 [[TMP30]]) 12465 // CHECK10-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12466 // CHECK10-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 12467 // CHECK10-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 12468 // CHECK10: omp_offload.failed: 12469 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369(i64 [[TMP1]], double* [[TMP2]], double* [[TMP3]], double* [[TMP4]]) #[[ATTR2:[0-9]+]] 12470 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT]] 12471 // CHECK10: omp_offload.cont: 12472 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 12473 // CHECK10-NEXT: [[CONV4:%.*]] = bitcast i64* [[N_CASTED3]] to i32* 12474 // CHECK10-NEXT: store i32 [[TMP33]], i32* [[CONV4]], align 4 12475 // CHECK10-NEXT: [[TMP34:%.*]] = load i64, i64* [[N_CASTED3]], align 8 12476 // CHECK10-NEXT: [[TMP35:%.*]] = load double*, double** [[A]], align 8 12477 // CHECK10-NEXT: [[TMP36:%.*]] = load double*, double** [[B]], align 8 12478 // CHECK10-NEXT: [[TMP37:%.*]] = load double*, double** [[C]], align 8 12479 // CHECK10-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 12480 // CHECK10-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i64* 12481 // CHECK10-NEXT: store i64 [[TMP34]], i64* [[TMP39]], align 8 12482 // CHECK10-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 12483 // CHECK10-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i64* 12484 // CHECK10-NEXT: store i64 [[TMP34]], i64* [[TMP41]], align 8 12485 // CHECK10-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 0 12486 // CHECK10-NEXT: store i8* null, i8** [[TMP42]], align 8 12487 // CHECK10-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 1 12488 // CHECK10-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to double** 12489 // CHECK10-NEXT: store double* [[TMP35]], double** [[TMP44]], align 8 12490 // CHECK10-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 1 12491 // CHECK10-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to double** 12492 // CHECK10-NEXT: store double* [[TMP35]], double** [[TMP46]], align 8 12493 // CHECK10-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 1 12494 // CHECK10-NEXT: store i8* null, i8** [[TMP47]], align 8 12495 // CHECK10-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 2 12496 // CHECK10-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to double** 12497 // CHECK10-NEXT: store double* [[TMP36]], double** [[TMP49]], align 8 12498 // CHECK10-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 2 12499 // CHECK10-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to double** 12500 // CHECK10-NEXT: store double* [[TMP36]], double** [[TMP51]], align 8 12501 // CHECK10-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 2 12502 // CHECK10-NEXT: store i8* null, i8** [[TMP52]], align 8 12503 // CHECK10-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 3 12504 // CHECK10-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to double** 12505 // CHECK10-NEXT: store double* [[TMP37]], double** [[TMP54]], align 8 12506 // CHECK10-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 3 12507 // CHECK10-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to double** 12508 // CHECK10-NEXT: store double* [[TMP37]], double** [[TMP56]], align 8 12509 // CHECK10-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 3 12510 // CHECK10-NEXT: store i8* null, i8** [[TMP57]], align 8 12511 // CHECK10-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 12512 // CHECK10-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 12513 // CHECK10-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 12514 // CHECK10-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_9]], align 4 12515 // CHECK10-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 12516 // CHECK10-NEXT: [[SUB11:%.*]] = sub nsw i32 [[TMP61]], 0 12517 // CHECK10-NEXT: [[DIV12:%.*]] = sdiv i32 [[SUB11]], 1 12518 // CHECK10-NEXT: [[SUB13:%.*]] = sub nsw i32 [[DIV12]], 1 12519 // CHECK10-NEXT: store i32 [[SUB13]], i32* [[DOTCAPTURE_EXPR_10]], align 4 12520 // CHECK10-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_10]], align 4 12521 // CHECK10-NEXT: [[ADD14:%.*]] = add nsw i32 [[TMP62]], 1 12522 // CHECK10-NEXT: [[TMP63:%.*]] = zext i32 [[ADD14]] to i64 12523 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 12524 // CHECK10-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.4, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.5, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12525 // CHECK10-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 12526 // CHECK10-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED15:%.*]], label [[OMP_OFFLOAD_CONT16:%.*]] 12527 // CHECK10: omp_offload.failed15: 12528 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408(i64 [[TMP34]], double* [[TMP35]], double* [[TMP36]], double* [[TMP37]]) #[[ATTR2]] 12529 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT16]] 12530 // CHECK10: omp_offload.cont16: 12531 // CHECK10-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 12532 // CHECK10-NEXT: [[CONV17:%.*]] = bitcast i64* [[CH_CASTED]] to i32* 12533 // CHECK10-NEXT: store i32 [[TMP66]], i32* [[CONV17]], align 4 12534 // CHECK10-NEXT: [[TMP67:%.*]] = load i64, i64* [[CH_CASTED]], align 8 12535 // CHECK10-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 12536 // CHECK10-NEXT: [[CONV19:%.*]] = bitcast i64* [[N_CASTED18]] to i32* 12537 // CHECK10-NEXT: store i32 [[TMP68]], i32* [[CONV19]], align 4 12538 // CHECK10-NEXT: [[TMP69:%.*]] = load i64, i64* [[N_CASTED18]], align 8 12539 // CHECK10-NEXT: [[TMP70:%.*]] = load double*, double** [[A]], align 8 12540 // CHECK10-NEXT: [[TMP71:%.*]] = load double*, double** [[B]], align 8 12541 // CHECK10-NEXT: [[TMP72:%.*]] = load double*, double** [[C]], align 8 12542 // CHECK10-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 12543 // CHECK10-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i64* 12544 // CHECK10-NEXT: store i64 [[TMP67]], i64* [[TMP74]], align 8 12545 // CHECK10-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 12546 // CHECK10-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i64* 12547 // CHECK10-NEXT: store i64 [[TMP67]], i64* [[TMP76]], align 8 12548 // CHECK10-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 0 12549 // CHECK10-NEXT: store i8* null, i8** [[TMP77]], align 8 12550 // CHECK10-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 1 12551 // CHECK10-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i64* 12552 // CHECK10-NEXT: store i64 [[TMP69]], i64* [[TMP79]], align 8 12553 // CHECK10-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 1 12554 // CHECK10-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i64* 12555 // CHECK10-NEXT: store i64 [[TMP69]], i64* [[TMP81]], align 8 12556 // CHECK10-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 1 12557 // CHECK10-NEXT: store i8* null, i8** [[TMP82]], align 8 12558 // CHECK10-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 2 12559 // CHECK10-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to double** 12560 // CHECK10-NEXT: store double* [[TMP70]], double** [[TMP84]], align 8 12561 // CHECK10-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 2 12562 // CHECK10-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to double** 12563 // CHECK10-NEXT: store double* [[TMP70]], double** [[TMP86]], align 8 12564 // CHECK10-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 2 12565 // CHECK10-NEXT: store i8* null, i8** [[TMP87]], align 8 12566 // CHECK10-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 3 12567 // CHECK10-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to double** 12568 // CHECK10-NEXT: store double* [[TMP71]], double** [[TMP89]], align 8 12569 // CHECK10-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 3 12570 // CHECK10-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to double** 12571 // CHECK10-NEXT: store double* [[TMP71]], double** [[TMP91]], align 8 12572 // CHECK10-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 3 12573 // CHECK10-NEXT: store i8* null, i8** [[TMP92]], align 8 12574 // CHECK10-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 4 12575 // CHECK10-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to double** 12576 // CHECK10-NEXT: store double* [[TMP72]], double** [[TMP94]], align 8 12577 // CHECK10-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 4 12578 // CHECK10-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to double** 12579 // CHECK10-NEXT: store double* [[TMP72]], double** [[TMP96]], align 8 12580 // CHECK10-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 4 12581 // CHECK10-NEXT: store i8* null, i8** [[TMP97]], align 8 12582 // CHECK10-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 12583 // CHECK10-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 12584 // CHECK10-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 12585 // CHECK10-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_24]], align 4 12586 // CHECK10-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_24]], align 4 12587 // CHECK10-NEXT: [[SUB26:%.*]] = sub nsw i32 [[TMP101]], 0 12588 // CHECK10-NEXT: [[DIV27:%.*]] = sdiv i32 [[SUB26]], 1 12589 // CHECK10-NEXT: [[SUB28:%.*]] = sub nsw i32 [[DIV27]], 1 12590 // CHECK10-NEXT: store i32 [[SUB28]], i32* [[DOTCAPTURE_EXPR_25]], align 4 12591 // CHECK10-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_25]], align 4 12592 // CHECK10-NEXT: [[ADD29:%.*]] = add nsw i32 [[TMP102]], 1 12593 // CHECK10-NEXT: [[TMP103:%.*]] = zext i32 [[ADD29]] to i64 12594 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 12595 // CHECK10-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.8, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.9, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12596 // CHECK10-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 12597 // CHECK10-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED30:%.*]], label [[OMP_OFFLOAD_CONT31:%.*]] 12598 // CHECK10: omp_offload.failed30: 12599 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447(i64 [[TMP67]], i64 [[TMP69]], double* [[TMP70]], double* [[TMP71]], double* [[TMP72]]) #[[ATTR2]] 12600 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT31]] 12601 // CHECK10: omp_offload.cont31: 12602 // CHECK10-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 12603 // CHECK10-NEXT: [[CONV33:%.*]] = bitcast i64* [[N_CASTED32]] to i32* 12604 // CHECK10-NEXT: store i32 [[TMP106]], i32* [[CONV33]], align 4 12605 // CHECK10-NEXT: [[TMP107:%.*]] = load i64, i64* [[N_CASTED32]], align 8 12606 // CHECK10-NEXT: [[TMP108:%.*]] = load double*, double** [[A]], align 8 12607 // CHECK10-NEXT: [[TMP109:%.*]] = load double*, double** [[B]], align 8 12608 // CHECK10-NEXT: [[TMP110:%.*]] = load double*, double** [[C]], align 8 12609 // CHECK10-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 12610 // CHECK10-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i64* 12611 // CHECK10-NEXT: store i64 [[TMP107]], i64* [[TMP112]], align 8 12612 // CHECK10-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 12613 // CHECK10-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i64* 12614 // CHECK10-NEXT: store i64 [[TMP107]], i64* [[TMP114]], align 8 12615 // CHECK10-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 0 12616 // CHECK10-NEXT: store i8* null, i8** [[TMP115]], align 8 12617 // CHECK10-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 1 12618 // CHECK10-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to double** 12619 // CHECK10-NEXT: store double* [[TMP108]], double** [[TMP117]], align 8 12620 // CHECK10-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 1 12621 // CHECK10-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to double** 12622 // CHECK10-NEXT: store double* [[TMP108]], double** [[TMP119]], align 8 12623 // CHECK10-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 1 12624 // CHECK10-NEXT: store i8* null, i8** [[TMP120]], align 8 12625 // CHECK10-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 2 12626 // CHECK10-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to double** 12627 // CHECK10-NEXT: store double* [[TMP109]], double** [[TMP122]], align 8 12628 // CHECK10-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 2 12629 // CHECK10-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to double** 12630 // CHECK10-NEXT: store double* [[TMP109]], double** [[TMP124]], align 8 12631 // CHECK10-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 2 12632 // CHECK10-NEXT: store i8* null, i8** [[TMP125]], align 8 12633 // CHECK10-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 3 12634 // CHECK10-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to double** 12635 // CHECK10-NEXT: store double* [[TMP110]], double** [[TMP127]], align 8 12636 // CHECK10-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 3 12637 // CHECK10-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to double** 12638 // CHECK10-NEXT: store double* [[TMP110]], double** [[TMP129]], align 8 12639 // CHECK10-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 3 12640 // CHECK10-NEXT: store i8* null, i8** [[TMP130]], align 8 12641 // CHECK10-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 12642 // CHECK10-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 12643 // CHECK10-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 12644 // CHECK10-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_38]], align 4 12645 // CHECK10-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_38]], align 4 12646 // CHECK10-NEXT: [[SUB40:%.*]] = sub nsw i32 [[TMP134]], 0 12647 // CHECK10-NEXT: [[DIV41:%.*]] = sdiv i32 [[SUB40]], 1 12648 // CHECK10-NEXT: [[SUB42:%.*]] = sub nsw i32 [[DIV41]], 1 12649 // CHECK10-NEXT: store i32 [[SUB42]], i32* [[DOTCAPTURE_EXPR_39]], align 4 12650 // CHECK10-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_39]], align 4 12651 // CHECK10-NEXT: [[ADD43:%.*]] = add nsw i32 [[TMP135]], 1 12652 // CHECK10-NEXT: [[TMP136:%.*]] = zext i32 [[ADD43]] to i64 12653 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 12654 // CHECK10-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.12, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.13, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12655 // CHECK10-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 12656 // CHECK10-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED44:%.*]], label [[OMP_OFFLOAD_CONT45:%.*]] 12657 // CHECK10: omp_offload.failed44: 12658 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478(i64 [[TMP107]], double* [[TMP108]], double* [[TMP109]], double* [[TMP110]]) #[[ATTR2]] 12659 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT45]] 12660 // CHECK10: omp_offload.cont45: 12661 // CHECK10-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 12662 // CHECK10-NEXT: [[CONV47:%.*]] = bitcast i64* [[CH_CASTED46]] to i32* 12663 // CHECK10-NEXT: store i32 [[TMP139]], i32* [[CONV47]], align 4 12664 // CHECK10-NEXT: [[TMP140:%.*]] = load i64, i64* [[CH_CASTED46]], align 8 12665 // CHECK10-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 12666 // CHECK10-NEXT: [[CONV49:%.*]] = bitcast i64* [[N_CASTED48]] to i32* 12667 // CHECK10-NEXT: store i32 [[TMP141]], i32* [[CONV49]], align 4 12668 // CHECK10-NEXT: [[TMP142:%.*]] = load i64, i64* [[N_CASTED48]], align 8 12669 // CHECK10-NEXT: [[TMP143:%.*]] = load double*, double** [[A]], align 8 12670 // CHECK10-NEXT: [[TMP144:%.*]] = load double*, double** [[B]], align 8 12671 // CHECK10-NEXT: [[TMP145:%.*]] = load double*, double** [[C]], align 8 12672 // CHECK10-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 12673 // CHECK10-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i64* 12674 // CHECK10-NEXT: store i64 [[TMP140]], i64* [[TMP147]], align 8 12675 // CHECK10-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 12676 // CHECK10-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i64* 12677 // CHECK10-NEXT: store i64 [[TMP140]], i64* [[TMP149]], align 8 12678 // CHECK10-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 0 12679 // CHECK10-NEXT: store i8* null, i8** [[TMP150]], align 8 12680 // CHECK10-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 1 12681 // CHECK10-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i64* 12682 // CHECK10-NEXT: store i64 [[TMP142]], i64* [[TMP152]], align 8 12683 // CHECK10-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 1 12684 // CHECK10-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i64* 12685 // CHECK10-NEXT: store i64 [[TMP142]], i64* [[TMP154]], align 8 12686 // CHECK10-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 1 12687 // CHECK10-NEXT: store i8* null, i8** [[TMP155]], align 8 12688 // CHECK10-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 2 12689 // CHECK10-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to double** 12690 // CHECK10-NEXT: store double* [[TMP143]], double** [[TMP157]], align 8 12691 // CHECK10-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 2 12692 // CHECK10-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to double** 12693 // CHECK10-NEXT: store double* [[TMP143]], double** [[TMP159]], align 8 12694 // CHECK10-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 2 12695 // CHECK10-NEXT: store i8* null, i8** [[TMP160]], align 8 12696 // CHECK10-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 3 12697 // CHECK10-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to double** 12698 // CHECK10-NEXT: store double* [[TMP144]], double** [[TMP162]], align 8 12699 // CHECK10-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 3 12700 // CHECK10-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to double** 12701 // CHECK10-NEXT: store double* [[TMP144]], double** [[TMP164]], align 8 12702 // CHECK10-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 3 12703 // CHECK10-NEXT: store i8* null, i8** [[TMP165]], align 8 12704 // CHECK10-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 4 12705 // CHECK10-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to double** 12706 // CHECK10-NEXT: store double* [[TMP145]], double** [[TMP167]], align 8 12707 // CHECK10-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 4 12708 // CHECK10-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to double** 12709 // CHECK10-NEXT: store double* [[TMP145]], double** [[TMP169]], align 8 12710 // CHECK10-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 4 12711 // CHECK10-NEXT: store i8* null, i8** [[TMP170]], align 8 12712 // CHECK10-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 12713 // CHECK10-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 12714 // CHECK10-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 12715 // CHECK10-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_54]], align 4 12716 // CHECK10-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_54]], align 4 12717 // CHECK10-NEXT: [[SUB56:%.*]] = sub nsw i32 [[TMP174]], 0 12718 // CHECK10-NEXT: [[DIV57:%.*]] = sdiv i32 [[SUB56]], 1 12719 // CHECK10-NEXT: [[SUB58:%.*]] = sub nsw i32 [[DIV57]], 1 12720 // CHECK10-NEXT: store i32 [[SUB58]], i32* [[DOTCAPTURE_EXPR_55]], align 4 12721 // CHECK10-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_55]], align 4 12722 // CHECK10-NEXT: [[ADD59:%.*]] = add nsw i32 [[TMP175]], 1 12723 // CHECK10-NEXT: [[TMP176:%.*]] = zext i32 [[ADD59]] to i64 12724 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 12725 // CHECK10-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.16, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.17, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12726 // CHECK10-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 12727 // CHECK10-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED60:%.*]], label [[OMP_OFFLOAD_CONT61:%.*]] 12728 // CHECK10: omp_offload.failed60: 12729 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506(i64 [[TMP140]], i64 [[TMP142]], double* [[TMP143]], double* [[TMP144]], double* [[TMP145]]) #[[ATTR2]] 12730 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT61]] 12731 // CHECK10: omp_offload.cont61: 12732 // CHECK10-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 12733 // CHECK10-NEXT: [[CONV63:%.*]] = bitcast i64* [[N_CASTED62]] to i32* 12734 // CHECK10-NEXT: store i32 [[TMP179]], i32* [[CONV63]], align 4 12735 // CHECK10-NEXT: [[TMP180:%.*]] = load i64, i64* [[N_CASTED62]], align 8 12736 // CHECK10-NEXT: [[TMP181:%.*]] = load double*, double** [[A]], align 8 12737 // CHECK10-NEXT: [[TMP182:%.*]] = load double*, double** [[B]], align 8 12738 // CHECK10-NEXT: [[TMP183:%.*]] = load double*, double** [[C]], align 8 12739 // CHECK10-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 12740 // CHECK10-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i64* 12741 // CHECK10-NEXT: store i64 [[TMP180]], i64* [[TMP185]], align 8 12742 // CHECK10-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 12743 // CHECK10-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i64* 12744 // CHECK10-NEXT: store i64 [[TMP180]], i64* [[TMP187]], align 8 12745 // CHECK10-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 0 12746 // CHECK10-NEXT: store i8* null, i8** [[TMP188]], align 8 12747 // CHECK10-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 1 12748 // CHECK10-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to double** 12749 // CHECK10-NEXT: store double* [[TMP181]], double** [[TMP190]], align 8 12750 // CHECK10-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 1 12751 // CHECK10-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to double** 12752 // CHECK10-NEXT: store double* [[TMP181]], double** [[TMP192]], align 8 12753 // CHECK10-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 1 12754 // CHECK10-NEXT: store i8* null, i8** [[TMP193]], align 8 12755 // CHECK10-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 2 12756 // CHECK10-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to double** 12757 // CHECK10-NEXT: store double* [[TMP182]], double** [[TMP195]], align 8 12758 // CHECK10-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 2 12759 // CHECK10-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to double** 12760 // CHECK10-NEXT: store double* [[TMP182]], double** [[TMP197]], align 8 12761 // CHECK10-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 2 12762 // CHECK10-NEXT: store i8* null, i8** [[TMP198]], align 8 12763 // CHECK10-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 3 12764 // CHECK10-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to double** 12765 // CHECK10-NEXT: store double* [[TMP183]], double** [[TMP200]], align 8 12766 // CHECK10-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 3 12767 // CHECK10-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to double** 12768 // CHECK10-NEXT: store double* [[TMP183]], double** [[TMP202]], align 8 12769 // CHECK10-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 3 12770 // CHECK10-NEXT: store i8* null, i8** [[TMP203]], align 8 12771 // CHECK10-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 12772 // CHECK10-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 12773 // CHECK10-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 12774 // CHECK10-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_68]], align 4 12775 // CHECK10-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_68]], align 4 12776 // CHECK10-NEXT: [[SUB70:%.*]] = sub nsw i32 [[TMP207]], 0 12777 // CHECK10-NEXT: [[DIV71:%.*]] = sdiv i32 [[SUB70]], 1 12778 // CHECK10-NEXT: [[SUB72:%.*]] = sub nsw i32 [[DIV71]], 1 12779 // CHECK10-NEXT: store i32 [[SUB72]], i32* [[DOTCAPTURE_EXPR_69]], align 4 12780 // CHECK10-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_69]], align 4 12781 // CHECK10-NEXT: [[ADD73:%.*]] = add nsw i32 [[TMP208]], 1 12782 // CHECK10-NEXT: [[TMP209:%.*]] = zext i32 [[ADD73]] to i64 12783 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 12784 // CHECK10-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.20, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.21, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12785 // CHECK10-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 12786 // CHECK10-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED74:%.*]], label [[OMP_OFFLOAD_CONT75:%.*]] 12787 // CHECK10: omp_offload.failed74: 12788 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536(i64 [[TMP180]], double* [[TMP181]], double* [[TMP182]], double* [[TMP183]]) #[[ATTR2]] 12789 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT75]] 12790 // CHECK10: omp_offload.cont75: 12791 // CHECK10-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 12792 // CHECK10-NEXT: [[CONV77:%.*]] = bitcast i64* [[CH_CASTED76]] to i32* 12793 // CHECK10-NEXT: store i32 [[TMP212]], i32* [[CONV77]], align 4 12794 // CHECK10-NEXT: [[TMP213:%.*]] = load i64, i64* [[CH_CASTED76]], align 8 12795 // CHECK10-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 12796 // CHECK10-NEXT: [[CONV79:%.*]] = bitcast i64* [[N_CASTED78]] to i32* 12797 // CHECK10-NEXT: store i32 [[TMP214]], i32* [[CONV79]], align 4 12798 // CHECK10-NEXT: [[TMP215:%.*]] = load i64, i64* [[N_CASTED78]], align 8 12799 // CHECK10-NEXT: [[TMP216:%.*]] = load double*, double** [[A]], align 8 12800 // CHECK10-NEXT: [[TMP217:%.*]] = load double*, double** [[B]], align 8 12801 // CHECK10-NEXT: [[TMP218:%.*]] = load double*, double** [[C]], align 8 12802 // CHECK10-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 12803 // CHECK10-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i64* 12804 // CHECK10-NEXT: store i64 [[TMP213]], i64* [[TMP220]], align 8 12805 // CHECK10-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 12806 // CHECK10-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i64* 12807 // CHECK10-NEXT: store i64 [[TMP213]], i64* [[TMP222]], align 8 12808 // CHECK10-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 0 12809 // CHECK10-NEXT: store i8* null, i8** [[TMP223]], align 8 12810 // CHECK10-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 1 12811 // CHECK10-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i64* 12812 // CHECK10-NEXT: store i64 [[TMP215]], i64* [[TMP225]], align 8 12813 // CHECK10-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 1 12814 // CHECK10-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i64* 12815 // CHECK10-NEXT: store i64 [[TMP215]], i64* [[TMP227]], align 8 12816 // CHECK10-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 1 12817 // CHECK10-NEXT: store i8* null, i8** [[TMP228]], align 8 12818 // CHECK10-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 2 12819 // CHECK10-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to double** 12820 // CHECK10-NEXT: store double* [[TMP216]], double** [[TMP230]], align 8 12821 // CHECK10-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 2 12822 // CHECK10-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to double** 12823 // CHECK10-NEXT: store double* [[TMP216]], double** [[TMP232]], align 8 12824 // CHECK10-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 2 12825 // CHECK10-NEXT: store i8* null, i8** [[TMP233]], align 8 12826 // CHECK10-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 3 12827 // CHECK10-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to double** 12828 // CHECK10-NEXT: store double* [[TMP217]], double** [[TMP235]], align 8 12829 // CHECK10-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 3 12830 // CHECK10-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to double** 12831 // CHECK10-NEXT: store double* [[TMP217]], double** [[TMP237]], align 8 12832 // CHECK10-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 3 12833 // CHECK10-NEXT: store i8* null, i8** [[TMP238]], align 8 12834 // CHECK10-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 4 12835 // CHECK10-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to double** 12836 // CHECK10-NEXT: store double* [[TMP218]], double** [[TMP240]], align 8 12837 // CHECK10-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 4 12838 // CHECK10-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to double** 12839 // CHECK10-NEXT: store double* [[TMP218]], double** [[TMP242]], align 8 12840 // CHECK10-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 4 12841 // CHECK10-NEXT: store i8* null, i8** [[TMP243]], align 8 12842 // CHECK10-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 12843 // CHECK10-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 12844 // CHECK10-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 12845 // CHECK10-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_84]], align 4 12846 // CHECK10-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_84]], align 4 12847 // CHECK10-NEXT: [[SUB86:%.*]] = sub nsw i32 [[TMP247]], 0 12848 // CHECK10-NEXT: [[DIV87:%.*]] = sdiv i32 [[SUB86]], 1 12849 // CHECK10-NEXT: [[SUB88:%.*]] = sub nsw i32 [[DIV87]], 1 12850 // CHECK10-NEXT: store i32 [[SUB88]], i32* [[DOTCAPTURE_EXPR_85]], align 4 12851 // CHECK10-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_85]], align 4 12852 // CHECK10-NEXT: [[ADD89:%.*]] = add nsw i32 [[TMP248]], 1 12853 // CHECK10-NEXT: [[TMP249:%.*]] = zext i32 [[ADD89]] to i64 12854 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 12855 // CHECK10-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.24, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.25, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 12856 // CHECK10-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 12857 // CHECK10-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED90:%.*]], label [[OMP_OFFLOAD_CONT91:%.*]] 12858 // CHECK10: omp_offload.failed90: 12859 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562(i64 [[TMP213]], i64 [[TMP215]], double* [[TMP216]], double* [[TMP217]], double* [[TMP218]]) #[[ATTR2]] 12860 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT91]] 12861 // CHECK10: omp_offload.cont91: 12862 // CHECK10-NEXT: [[CALL:%.*]] = call signext i32 @_Z5tmainIiET_v() 12863 // CHECK10-NEXT: ret i32 [[CALL]] 12864 // 12865 // 12866 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369 12867 // CHECK10-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1:[0-9]+]] { 12868 // CHECK10-NEXT: entry: 12869 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 12870 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 12871 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 12872 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 12873 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 12874 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 12875 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 12876 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 12877 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 12878 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 12879 // CHECK10-NEXT: ret void 12880 // 12881 // 12882 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined. 12883 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 12884 // CHECK10-NEXT: entry: 12885 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 12886 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 12887 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 12888 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 12889 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 12890 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 12891 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 12892 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 12893 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 12894 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 12895 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 12896 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 12897 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 12898 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 12899 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 12900 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 12901 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 12902 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 12903 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 12904 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 12905 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 12906 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 12907 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 12908 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 12909 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 12910 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 12911 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 12912 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 12913 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12914 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 12915 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 12916 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 12917 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 12918 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 12919 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 12920 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 12921 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 12922 // CHECK10: omp.precond.then: 12923 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 12924 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12925 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 12926 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 12927 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 12928 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12929 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 12930 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 12931 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12932 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12933 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 12934 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 12935 // CHECK10: cond.true: 12936 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 12937 // CHECK10-NEXT: br label [[COND_END:%.*]] 12938 // CHECK10: cond.false: 12939 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12940 // CHECK10-NEXT: br label [[COND_END]] 12941 // CHECK10: cond.end: 12942 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 12943 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 12944 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 12945 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 12946 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 12947 // CHECK10: omp.inner.for.cond: 12948 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 12949 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12950 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 12951 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 12952 // CHECK10: omp.inner.for.body: 12953 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 12954 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 12955 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 12956 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 12957 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 12958 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 12959 // CHECK10: omp.inner.for.inc: 12960 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 12961 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 12962 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 12963 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 12964 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 12965 // CHECK10: omp.inner.for.end: 12966 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 12967 // CHECK10: omp.loop.exit: 12968 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 12969 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 12970 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 12971 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 12972 // CHECK10: omp.precond.end: 12973 // CHECK10-NEXT: ret void 12974 // 12975 // 12976 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..1 12977 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 12978 // CHECK10-NEXT: entry: 12979 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 12980 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 12981 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 12982 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 12983 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 12984 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 12985 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 12986 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 12987 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 12988 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 12989 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 12990 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 12991 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 12992 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 12993 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 12994 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 12995 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 12996 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 12997 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 12998 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 12999 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13000 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13001 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13002 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13003 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13004 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13005 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13006 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13007 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13008 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13009 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13010 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13011 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13012 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13013 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13014 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13015 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13016 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13017 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13018 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13019 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13020 // CHECK10: omp.precond.then: 13021 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 13022 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13023 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 13024 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13025 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 13026 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13027 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 13028 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 13029 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 13030 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13031 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13032 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13033 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13034 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13035 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13036 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13037 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13038 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13039 // CHECK10: cond.true: 13040 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13041 // CHECK10-NEXT: br label [[COND_END:%.*]] 13042 // CHECK10: cond.false: 13043 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13044 // CHECK10-NEXT: br label [[COND_END]] 13045 // CHECK10: cond.end: 13046 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13047 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 13048 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 13049 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13050 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13051 // CHECK10: omp.inner.for.cond: 13052 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13053 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13054 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 13055 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13056 // CHECK10: omp.inner.for.body: 13057 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13058 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 13059 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 13060 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 13061 // CHECK10-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 13062 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 13063 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 13064 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 13065 // CHECK10-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 13066 // CHECK10-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 13067 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 13068 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 13069 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 13070 // CHECK10-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 13071 // CHECK10-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 13072 // CHECK10-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 13073 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 13074 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 13075 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 13076 // CHECK10-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 13077 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 13078 // CHECK10: omp.body.continue: 13079 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13080 // CHECK10: omp.inner.for.inc: 13081 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13082 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 13083 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 13084 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13085 // CHECK10: omp.inner.for.end: 13086 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13087 // CHECK10: omp.loop.exit: 13088 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13089 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 13090 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 13091 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13092 // CHECK10: omp.precond.end: 13093 // CHECK10-NEXT: ret void 13094 // 13095 // 13096 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408 13097 // CHECK10-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 13098 // CHECK10-NEXT: entry: 13099 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 13100 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 13101 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 13102 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 13103 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 13104 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 13105 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 13106 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 13107 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 13108 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 13109 // CHECK10-NEXT: ret void 13110 // 13111 // 13112 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..2 13113 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13114 // CHECK10-NEXT: entry: 13115 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13116 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13117 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13118 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13119 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13120 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13121 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13122 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13123 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13124 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13125 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13126 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 13127 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 13128 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13129 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13130 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 13131 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13132 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13133 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13134 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13135 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13136 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13137 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13138 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13139 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13140 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13141 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13142 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13143 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13144 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13145 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13146 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13147 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13148 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13149 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13150 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13151 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13152 // CHECK10: omp.precond.then: 13153 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 13154 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13155 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 13156 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13157 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13158 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13159 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 13160 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13161 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13162 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13163 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 13164 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13165 // CHECK10: cond.true: 13166 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13167 // CHECK10-NEXT: br label [[COND_END:%.*]] 13168 // CHECK10: cond.false: 13169 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13170 // CHECK10-NEXT: br label [[COND_END]] 13171 // CHECK10: cond.end: 13172 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 13173 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 13174 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13175 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 13176 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13177 // CHECK10: omp.inner.for.cond: 13178 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13179 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13180 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 13181 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13182 // CHECK10: omp.inner.for.body: 13183 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13184 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 13185 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13186 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 13187 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 13188 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13189 // CHECK10: omp.inner.for.inc: 13190 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13191 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13192 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 13193 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 13194 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13195 // CHECK10: omp.inner.for.end: 13196 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13197 // CHECK10: omp.loop.exit: 13198 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13199 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 13200 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 13201 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13202 // CHECK10: omp.precond.end: 13203 // CHECK10-NEXT: ret void 13204 // 13205 // 13206 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..3 13207 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13208 // CHECK10-NEXT: entry: 13209 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13210 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13211 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 13212 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 13213 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13214 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13215 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13216 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13217 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13218 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13219 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13220 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13221 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13222 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 13223 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 13224 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13225 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13226 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 13227 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13228 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13229 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13230 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13231 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13232 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13233 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13234 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13235 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13236 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13237 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13238 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13239 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13240 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13241 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13242 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13243 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13244 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13245 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13246 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13247 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13248 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13249 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13250 // CHECK10: omp.precond.then: 13251 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 13252 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13253 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 13254 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13255 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 13256 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13257 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 13258 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 13259 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 13260 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13261 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13262 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13263 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13264 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13265 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13266 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13267 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13268 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13269 // CHECK10: cond.true: 13270 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13271 // CHECK10-NEXT: br label [[COND_END:%.*]] 13272 // CHECK10: cond.false: 13273 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13274 // CHECK10-NEXT: br label [[COND_END]] 13275 // CHECK10: cond.end: 13276 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13277 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 13278 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 13279 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13280 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13281 // CHECK10: omp.inner.for.cond: 13282 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13283 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13284 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 13285 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13286 // CHECK10: omp.inner.for.body: 13287 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13288 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 13289 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 13290 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 13291 // CHECK10-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 13292 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 13293 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 13294 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 13295 // CHECK10-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 13296 // CHECK10-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 13297 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 13298 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 13299 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 13300 // CHECK10-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 13301 // CHECK10-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 13302 // CHECK10-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 13303 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 13304 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 13305 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 13306 // CHECK10-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 13307 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 13308 // CHECK10: omp.body.continue: 13309 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13310 // CHECK10: omp.inner.for.inc: 13311 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13312 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 13313 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 13314 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13315 // CHECK10: omp.inner.for.end: 13316 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13317 // CHECK10: omp.loop.exit: 13318 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13319 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 13320 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 13321 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13322 // CHECK10: omp.precond.end: 13323 // CHECK10-NEXT: ret void 13324 // 13325 // 13326 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447 13327 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 13328 // CHECK10-NEXT: entry: 13329 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 13330 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 13331 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 13332 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 13333 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 13334 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 13335 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 13336 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 13337 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 13338 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 13339 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 13340 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 13341 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 13342 // CHECK10-NEXT: ret void 13343 // 13344 // 13345 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..6 13346 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13347 // CHECK10-NEXT: entry: 13348 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13349 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13350 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 13351 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13352 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13353 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13354 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13355 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13356 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13357 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13358 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13359 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13360 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 13361 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 13362 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13363 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13364 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 13365 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13366 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13367 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 13368 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13369 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13370 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13371 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13372 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 13373 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13374 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 13375 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 13376 // CHECK10-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 13377 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 13378 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 13379 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13380 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 13381 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13382 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13383 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13384 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13385 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13386 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 13387 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13388 // CHECK10: omp.precond.then: 13389 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 13390 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13391 // CHECK10-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 13392 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13393 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13394 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 13395 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13396 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13397 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 13398 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13399 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13400 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13401 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13402 // CHECK10: cond.true: 13403 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13404 // CHECK10-NEXT: br label [[COND_END:%.*]] 13405 // CHECK10: cond.false: 13406 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13407 // CHECK10-NEXT: br label [[COND_END]] 13408 // CHECK10: cond.end: 13409 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13410 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 13411 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13412 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13413 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13414 // CHECK10: omp.inner.for.cond: 13415 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13416 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13417 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 13418 // CHECK10-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 13419 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13420 // CHECK10: omp.inner.for.body: 13421 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13422 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 13423 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13424 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 13425 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 13426 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13427 // CHECK10: omp.inner.for.inc: 13428 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13429 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13430 // CHECK10-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 13431 // CHECK10-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 13432 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13433 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13434 // CHECK10-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 13435 // CHECK10-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 13436 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13437 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13438 // CHECK10-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 13439 // CHECK10-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 13440 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13441 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13442 // CHECK10-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 13443 // CHECK10-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 13444 // CHECK10: cond.true10: 13445 // CHECK10-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13446 // CHECK10-NEXT: br label [[COND_END12:%.*]] 13447 // CHECK10: cond.false11: 13448 // CHECK10-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13449 // CHECK10-NEXT: br label [[COND_END12]] 13450 // CHECK10: cond.end12: 13451 // CHECK10-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 13452 // CHECK10-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 13453 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13454 // CHECK10-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 13455 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13456 // CHECK10: omp.inner.for.end: 13457 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13458 // CHECK10: omp.loop.exit: 13459 // CHECK10-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13460 // CHECK10-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 13461 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 13462 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13463 // CHECK10: omp.precond.end: 13464 // CHECK10-NEXT: ret void 13465 // 13466 // 13467 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..7 13468 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13469 // CHECK10-NEXT: entry: 13470 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13471 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13472 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 13473 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 13474 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13475 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13476 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13477 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13478 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13479 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13480 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13481 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13482 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13483 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 13484 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 13485 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13486 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13487 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 13488 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13489 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13490 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13491 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13492 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13493 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13494 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13495 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13496 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13497 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13498 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13499 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13500 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13501 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13502 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13503 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13504 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13505 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13506 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13507 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13508 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13509 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13510 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13511 // CHECK10: omp.precond.then: 13512 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 13513 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13514 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 13515 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13516 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 13517 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13518 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 13519 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 13520 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 13521 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13522 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13523 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13524 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13525 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13526 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13527 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13528 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13529 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13530 // CHECK10: cond.true: 13531 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13532 // CHECK10-NEXT: br label [[COND_END:%.*]] 13533 // CHECK10: cond.false: 13534 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13535 // CHECK10-NEXT: br label [[COND_END]] 13536 // CHECK10: cond.end: 13537 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13538 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 13539 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 13540 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13541 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13542 // CHECK10: omp.inner.for.cond: 13543 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13544 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13545 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 13546 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13547 // CHECK10: omp.inner.for.body: 13548 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13549 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 13550 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 13551 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 13552 // CHECK10-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 13553 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 13554 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 13555 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 13556 // CHECK10-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 13557 // CHECK10-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 13558 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 13559 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 13560 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 13561 // CHECK10-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 13562 // CHECK10-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 13563 // CHECK10-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 13564 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 13565 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 13566 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 13567 // CHECK10-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 13568 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 13569 // CHECK10: omp.body.continue: 13570 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13571 // CHECK10: omp.inner.for.inc: 13572 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13573 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 13574 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 13575 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13576 // CHECK10: omp.inner.for.end: 13577 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13578 // CHECK10: omp.loop.exit: 13579 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13580 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 13581 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 13582 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13583 // CHECK10: omp.precond.end: 13584 // CHECK10-NEXT: ret void 13585 // 13586 // 13587 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478 13588 // CHECK10-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 13589 // CHECK10-NEXT: entry: 13590 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 13591 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 13592 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 13593 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 13594 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 13595 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 13596 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 13597 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 13598 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 13599 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 13600 // CHECK10-NEXT: ret void 13601 // 13602 // 13603 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..10 13604 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13605 // CHECK10-NEXT: entry: 13606 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13607 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13608 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13609 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13610 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13611 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13612 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13613 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13614 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13615 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13616 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13617 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 13618 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 13619 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13620 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13621 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 13622 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13623 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13624 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13625 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13626 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13627 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13628 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13629 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13630 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13631 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13632 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13633 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13634 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13635 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13636 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13637 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13638 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13639 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13640 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13641 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13642 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13643 // CHECK10: omp.precond.then: 13644 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 13645 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13646 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 13647 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13648 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13649 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13650 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 13651 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13652 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13653 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13654 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 13655 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13656 // CHECK10: cond.true: 13657 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13658 // CHECK10-NEXT: br label [[COND_END:%.*]] 13659 // CHECK10: cond.false: 13660 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13661 // CHECK10-NEXT: br label [[COND_END]] 13662 // CHECK10: cond.end: 13663 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 13664 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 13665 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13666 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 13667 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13668 // CHECK10: omp.inner.for.cond: 13669 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13670 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13671 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 13672 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13673 // CHECK10: omp.inner.for.body: 13674 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13675 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 13676 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13677 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 13678 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 13679 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13680 // CHECK10: omp.inner.for.inc: 13681 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13682 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13683 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 13684 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 13685 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13686 // CHECK10: omp.inner.for.end: 13687 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13688 // CHECK10: omp.loop.exit: 13689 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13690 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 13691 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 13692 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13693 // CHECK10: omp.precond.end: 13694 // CHECK10-NEXT: ret void 13695 // 13696 // 13697 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..11 13698 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13699 // CHECK10-NEXT: entry: 13700 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13701 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13702 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 13703 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 13704 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13705 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13706 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13707 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13708 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13709 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13710 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13711 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13712 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13713 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 13714 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 13715 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13716 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13717 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 13718 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13719 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13720 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13721 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13722 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13723 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13724 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13725 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13726 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13727 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13728 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13729 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13730 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13731 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 13732 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13733 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13734 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13735 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 13736 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13737 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13738 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13739 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13740 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13741 // CHECK10: omp.precond.then: 13742 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 13743 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13744 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 13745 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13746 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 13747 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13748 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 13749 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 13750 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 13751 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13752 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13753 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13754 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13755 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13756 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13757 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13758 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13759 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13760 // CHECK10: cond.true: 13761 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13762 // CHECK10-NEXT: br label [[COND_END:%.*]] 13763 // CHECK10: cond.false: 13764 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13765 // CHECK10-NEXT: br label [[COND_END]] 13766 // CHECK10: cond.end: 13767 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13768 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 13769 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 13770 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13771 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13772 // CHECK10: omp.inner.for.cond: 13773 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13774 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 13775 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 13776 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13777 // CHECK10: omp.inner.for.body: 13778 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13779 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 13780 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 13781 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 13782 // CHECK10-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 8 13783 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 13784 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 13785 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i64 [[IDXPROM]] 13786 // CHECK10-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 8 13787 // CHECK10-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 8 13788 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 13789 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 13790 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM7]] 13791 // CHECK10-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX8]], align 8 13792 // CHECK10-NEXT: [[ADD9:%.*]] = fadd double [[TMP22]], [[TMP25]] 13793 // CHECK10-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 8 13794 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 13795 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 13796 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM10]] 13797 // CHECK10-NEXT: store double [[ADD9]], double* [[ARRAYIDX11]], align 8 13798 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 13799 // CHECK10: omp.body.continue: 13800 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13801 // CHECK10: omp.inner.for.inc: 13802 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13803 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 13804 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 13805 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13806 // CHECK10: omp.inner.for.end: 13807 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13808 // CHECK10: omp.loop.exit: 13809 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13810 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 13811 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 13812 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13813 // CHECK10: omp.precond.end: 13814 // CHECK10-NEXT: ret void 13815 // 13816 // 13817 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506 13818 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 13819 // CHECK10-NEXT: entry: 13820 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 13821 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 13822 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 13823 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 13824 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 13825 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 13826 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 13827 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 13828 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 13829 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 13830 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 13831 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 13832 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 13833 // CHECK10-NEXT: ret void 13834 // 13835 // 13836 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..14 13837 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 13838 // CHECK10-NEXT: entry: 13839 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13840 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13841 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 13842 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13843 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13844 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13845 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13846 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 13847 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13848 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13849 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13850 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 13851 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13852 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 13853 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 13854 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13855 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13856 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 13857 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 13858 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13859 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13860 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 13861 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13862 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13863 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13864 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13865 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 13866 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13867 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 13868 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 13869 // CHECK10-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 13870 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 13871 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 13872 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 13873 // CHECK10-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13874 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13875 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 13876 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13877 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 13878 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 13879 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13880 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13881 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 13882 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13883 // CHECK10: omp.precond.then: 13884 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 13885 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 13886 // CHECK10-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 13887 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13888 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 13889 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13890 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 13891 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 13892 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13893 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 13894 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 13895 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 13896 // CHECK10: cond.true: 13897 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 13898 // CHECK10-NEXT: br label [[COND_END:%.*]] 13899 // CHECK10: cond.false: 13900 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13901 // CHECK10-NEXT: br label [[COND_END]] 13902 // CHECK10: cond.end: 13903 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 13904 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 13905 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13906 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 13907 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 13908 // CHECK10: omp.inner.for.cond: 13909 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13910 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13911 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 13912 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 13913 // CHECK10: omp.inner.for.body: 13914 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 13915 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 13916 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 13917 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 13918 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 13919 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 13920 // CHECK10-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 13921 // CHECK10-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 13922 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 13923 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 13924 // CHECK10: omp.inner.for.inc: 13925 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 13926 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 13927 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 13928 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 13929 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 13930 // CHECK10: omp.inner.for.end: 13931 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 13932 // CHECK10: omp.loop.exit: 13933 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 13934 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 13935 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 13936 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 13937 // CHECK10: omp.precond.end: 13938 // CHECK10-NEXT: ret void 13939 // 13940 // 13941 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..15 13942 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 13943 // CHECK10-NEXT: entry: 13944 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 13945 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 13946 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 13947 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 13948 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 13949 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 13950 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 13951 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 13952 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 13953 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 13954 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 13955 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 13956 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 13957 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 13958 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 13959 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 13960 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 13961 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 13962 // CHECK10-NEXT: [[I6:%.*]] = alloca i32, align 4 13963 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 13964 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 13965 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13966 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13967 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 13968 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 13969 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 13970 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 13971 // CHECK10-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 13972 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 13973 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 13974 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 13975 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 13976 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 13977 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 13978 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 13979 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13980 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 13981 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 13982 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 13983 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 13984 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 13985 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 13986 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 13987 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 13988 // CHECK10: omp.precond.then: 13989 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 13990 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 13991 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 13992 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 13993 // CHECK10-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 13994 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 13995 // CHECK10-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 13996 // CHECK10-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 13997 // CHECK10-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 13998 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 13999 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 14000 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 14001 // CHECK10-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14002 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 14003 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 14004 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 14005 // CHECK10: omp.dispatch.cond: 14006 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14007 // CHECK10-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 14008 // CHECK10-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14009 // CHECK10-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 14010 // CHECK10-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 14011 // CHECK10: cond.true: 14012 // CHECK10-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14013 // CHECK10-NEXT: br label [[COND_END:%.*]] 14014 // CHECK10: cond.false: 14015 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14016 // CHECK10-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 14017 // CHECK10-NEXT: br label [[COND_END]] 14018 // CHECK10: cond.end: 14019 // CHECK10-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 14020 // CHECK10-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 14021 // CHECK10-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 14022 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14023 // CHECK10-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 14024 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14025 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14026 // CHECK10-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 14027 // CHECK10-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 14028 // CHECK10: omp.dispatch.body: 14029 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 14030 // CHECK10: omp.inner.for.cond: 14031 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14032 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14033 // CHECK10-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 14034 // CHECK10-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 14035 // CHECK10: omp.inner.for.body: 14036 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14037 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 14038 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 14039 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 14040 // CHECK10-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 8 14041 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 14042 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 14043 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i64 [[IDXPROM]] 14044 // CHECK10-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 8 14045 // CHECK10-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 8 14046 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 14047 // CHECK10-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 14048 // CHECK10-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds double, double* [[TMP26]], i64 [[IDXPROM13]] 14049 // CHECK10-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX14]], align 8 14050 // CHECK10-NEXT: [[ADD15:%.*]] = fadd double [[TMP25]], [[TMP28]] 14051 // CHECK10-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 8 14052 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 14053 // CHECK10-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 14054 // CHECK10-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds double, double* [[TMP29]], i64 [[IDXPROM16]] 14055 // CHECK10-NEXT: store double [[ADD15]], double* [[ARRAYIDX17]], align 8 14056 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 14057 // CHECK10: omp.body.continue: 14058 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 14059 // CHECK10: omp.inner.for.inc: 14060 // CHECK10-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14061 // CHECK10-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP31]], 1 14062 // CHECK10-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 14063 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 14064 // CHECK10: omp.inner.for.end: 14065 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 14066 // CHECK10: omp.dispatch.inc: 14067 // CHECK10-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14068 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 14069 // CHECK10-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 14070 // CHECK10-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 14071 // CHECK10-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14072 // CHECK10-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 14073 // CHECK10-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 14074 // CHECK10-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 14075 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 14076 // CHECK10: omp.dispatch.end: 14077 // CHECK10-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14078 // CHECK10-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 14079 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 14080 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 14081 // CHECK10: omp.precond.end: 14082 // CHECK10-NEXT: ret void 14083 // 14084 // 14085 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536 14086 // CHECK10-SAME: (i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 14087 // CHECK10-NEXT: entry: 14088 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 14089 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 14090 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 14091 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 14092 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 14093 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 14094 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 14095 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 14096 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 14097 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[CONV]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 14098 // CHECK10-NEXT: ret void 14099 // 14100 // 14101 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..18 14102 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 14103 // CHECK10-NEXT: entry: 14104 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 14105 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 14106 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 14107 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 14108 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 14109 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 14110 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 14111 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 14112 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 14113 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 14114 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 14115 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 14116 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 14117 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 14118 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 14119 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 14120 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 14121 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 14122 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 14123 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 14124 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 14125 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 14126 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 14127 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 14128 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 14129 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 14130 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 14131 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 14132 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14133 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 14134 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 14135 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 14136 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 14137 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 14138 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14139 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 14140 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 14141 // CHECK10: omp.precond.then: 14142 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 14143 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14144 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 14145 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 14146 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 14147 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14148 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 14149 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 14150 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14151 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14152 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 14153 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 14154 // CHECK10: cond.true: 14155 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14156 // CHECK10-NEXT: br label [[COND_END:%.*]] 14157 // CHECK10: cond.false: 14158 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14159 // CHECK10-NEXT: br label [[COND_END]] 14160 // CHECK10: cond.end: 14161 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 14162 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 14163 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 14164 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 14165 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 14166 // CHECK10: omp.inner.for.cond: 14167 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14168 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14169 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 14170 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 14171 // CHECK10: omp.inner.for.body: 14172 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 14173 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 14174 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14175 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 14176 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 14177 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 14178 // CHECK10: omp.inner.for.inc: 14179 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14180 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 14181 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 14182 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 14183 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 14184 // CHECK10: omp.inner.for.end: 14185 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 14186 // CHECK10: omp.loop.exit: 14187 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14188 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 14189 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 14190 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 14191 // CHECK10: omp.precond.end: 14192 // CHECK10-NEXT: ret void 14193 // 14194 // 14195 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..19 14196 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 14197 // CHECK10-NEXT: entry: 14198 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 14199 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 14200 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 14201 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 14202 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 14203 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 14204 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 14205 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 14206 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 14207 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 14208 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 14209 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 14210 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 14211 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 14212 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 14213 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 14214 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 14215 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 14216 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 14217 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 14218 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 14219 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14220 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 14221 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 14222 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 14223 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 14224 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 14225 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 14226 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 14227 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 14228 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 14229 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 14230 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14231 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 14232 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 14233 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 14234 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 14235 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 14236 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14237 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 14238 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 14239 // CHECK10: omp.precond.then: 14240 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 14241 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14242 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 14243 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 14244 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 14245 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14246 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 14247 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 14248 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 14249 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 14250 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 14251 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14252 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14253 // CHECK10-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14254 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 14255 // CHECK10-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 14256 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 14257 // CHECK10: omp.dispatch.cond: 14258 // CHECK10-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14259 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 14260 // CHECK10-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 14261 // CHECK10-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 14262 // CHECK10-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 14263 // CHECK10: omp.dispatch.body: 14264 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14265 // CHECK10-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 14266 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 14267 // CHECK10: omp.inner.for.cond: 14268 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 14269 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !18 14270 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 14271 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 14272 // CHECK10: omp.inner.for.body: 14273 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 14274 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 14275 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 14276 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !18 14277 // CHECK10-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !18 14278 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 14279 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 14280 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i64 [[IDXPROM]] 14281 // CHECK10-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !18 14282 // CHECK10-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !18 14283 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 14284 // CHECK10-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 14285 // CHECK10-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM6]] 14286 // CHECK10-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX7]], align 8, !llvm.access.group !18 14287 // CHECK10-NEXT: [[ADD8:%.*]] = fadd double [[TMP23]], [[TMP26]] 14288 // CHECK10-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !18 14289 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !18 14290 // CHECK10-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 14291 // CHECK10-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM9]] 14292 // CHECK10-NEXT: store double [[ADD8]], double* [[ARRAYIDX10]], align 8, !llvm.access.group !18 14293 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 14294 // CHECK10: omp.body.continue: 14295 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 14296 // CHECK10: omp.inner.for.inc: 14297 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 14298 // CHECK10-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP29]], 1 14299 // CHECK10-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !18 14300 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP19:![0-9]+]] 14301 // CHECK10: omp.inner.for.end: 14302 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 14303 // CHECK10: omp.dispatch.inc: 14304 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 14305 // CHECK10: omp.dispatch.end: 14306 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 14307 // CHECK10: omp.precond.end: 14308 // CHECK10-NEXT: ret void 14309 // 14310 // 14311 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562 14312 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 14313 // CHECK10-NEXT: entry: 14314 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 14315 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 14316 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double*, align 8 14317 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double*, align 8 14318 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double*, align 8 14319 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 14320 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 14321 // CHECK10-NEXT: store double* [[A]], double** [[A_ADDR]], align 8 14322 // CHECK10-NEXT: store double* [[B]], double** [[B_ADDR]], align 8 14323 // CHECK10-NEXT: store double* [[C]], double** [[C_ADDR]], align 8 14324 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 14325 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 14326 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 14327 // CHECK10-NEXT: ret void 14328 // 14329 // 14330 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..22 14331 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 14332 // CHECK10-NEXT: entry: 14333 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 14334 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 14335 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 14336 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 14337 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 14338 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 14339 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 14340 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 14341 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 14342 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 14343 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 14344 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 14345 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 14346 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 14347 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 14348 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 14349 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 14350 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 14351 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 14352 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 14353 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 14354 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 14355 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 14356 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 14357 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 14358 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 14359 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 14360 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 14361 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 8 14362 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 8 14363 // CHECK10-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 8 14364 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 14365 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 14366 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 14367 // CHECK10-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 14368 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14369 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 14370 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 14371 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 14372 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 14373 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 14374 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14375 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 14376 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 14377 // CHECK10: omp.precond.then: 14378 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 14379 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 14380 // CHECK10-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 14381 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 14382 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 14383 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14384 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 14385 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 14386 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14387 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 14388 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 14389 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 14390 // CHECK10: cond.true: 14391 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 14392 // CHECK10-NEXT: br label [[COND_END:%.*]] 14393 // CHECK10: cond.false: 14394 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14395 // CHECK10-NEXT: br label [[COND_END]] 14396 // CHECK10: cond.end: 14397 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 14398 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 14399 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 14400 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 14401 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 14402 // CHECK10: omp.inner.for.cond: 14403 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14404 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14405 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 14406 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 14407 // CHECK10: omp.inner.for.body: 14408 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 14409 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 14410 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 14411 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 14412 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14413 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 14414 // CHECK10-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 14415 // CHECK10-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 14416 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, double**, double**, double**, i64)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i64 [[TMP24]]) 14417 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 14418 // CHECK10: omp.inner.for.inc: 14419 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 14420 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 14421 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 14422 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 14423 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 14424 // CHECK10: omp.inner.for.end: 14425 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 14426 // CHECK10: omp.loop.exit: 14427 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14428 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 14429 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 14430 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 14431 // CHECK10: omp.precond.end: 14432 // CHECK10-NEXT: ret void 14433 // 14434 // 14435 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..23 14436 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 8 dereferenceable(8) [[A:%.*]], double** nonnull align 8 dereferenceable(8) [[B:%.*]], double** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 14437 // CHECK10-NEXT: entry: 14438 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 14439 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 14440 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 14441 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 14442 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 14443 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca double**, align 8 14444 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca double**, align 8 14445 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca double**, align 8 14446 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 14447 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 14448 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 14449 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 14450 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 14451 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 14452 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 14453 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 14454 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 14455 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 14456 // CHECK10-NEXT: [[I6:%.*]] = alloca i32, align 4 14457 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 14458 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 14459 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 14460 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14461 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 14462 // CHECK10-NEXT: store double** [[A]], double*** [[A_ADDR]], align 8 14463 // CHECK10-NEXT: store double** [[B]], double*** [[B_ADDR]], align 8 14464 // CHECK10-NEXT: store double** [[C]], double*** [[C_ADDR]], align 8 14465 // CHECK10-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 14466 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 14467 // CHECK10-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 8 14468 // CHECK10-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 8 14469 // CHECK10-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 8 14470 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 14471 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 14472 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 14473 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14474 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 14475 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 14476 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 14477 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 14478 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 14479 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14480 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 14481 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 14482 // CHECK10: omp.precond.then: 14483 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 14484 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 14485 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 14486 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 14487 // CHECK10-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 14488 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 14489 // CHECK10-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 14490 // CHECK10-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 14491 // CHECK10-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 14492 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 14493 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 14494 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 14495 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14496 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 14497 // CHECK10-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14498 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 14499 // CHECK10-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 14500 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 14501 // CHECK10: omp.dispatch.cond: 14502 // CHECK10-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 14503 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 14504 // CHECK10-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 14505 // CHECK10-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 14506 // CHECK10-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 14507 // CHECK10: omp.dispatch.body: 14508 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 14509 // CHECK10-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 14510 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 14511 // CHECK10: omp.inner.for.cond: 14512 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 14513 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !21 14514 // CHECK10-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 14515 // CHECK10-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 14516 // CHECK10: omp.inner.for.body: 14517 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 14518 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 14519 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 14520 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !21 14521 // CHECK10-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 8, !llvm.access.group !21 14522 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 14523 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 14524 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i64 [[IDXPROM]] 14525 // CHECK10-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 8, !llvm.access.group !21 14526 // CHECK10-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 8, !llvm.access.group !21 14527 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 14528 // CHECK10-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 14529 // CHECK10-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds double, double* [[TMP25]], i64 [[IDXPROM8]] 14530 // CHECK10-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX9]], align 8, !llvm.access.group !21 14531 // CHECK10-NEXT: [[ADD10:%.*]] = fadd double [[TMP24]], [[TMP27]] 14532 // CHECK10-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 8, !llvm.access.group !21 14533 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !21 14534 // CHECK10-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 14535 // CHECK10-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP28]], i64 [[IDXPROM11]] 14536 // CHECK10-NEXT: store double [[ADD10]], double* [[ARRAYIDX12]], align 8, !llvm.access.group !21 14537 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 14538 // CHECK10: omp.body.continue: 14539 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 14540 // CHECK10: omp.inner.for.inc: 14541 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 14542 // CHECK10-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP30]], 1 14543 // CHECK10-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !21 14544 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP22:![0-9]+]] 14545 // CHECK10: omp.inner.for.end: 14546 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 14547 // CHECK10: omp.dispatch.inc: 14548 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 14549 // CHECK10: omp.dispatch.end: 14550 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 14551 // CHECK10: omp.precond.end: 14552 // CHECK10-NEXT: ret void 14553 // 14554 // 14555 // CHECK10-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 14556 // CHECK10-SAME: () #[[ATTR3:[0-9]+]] comdat { 14557 // CHECK10-NEXT: entry: 14558 // CHECK10-NEXT: [[A:%.*]] = alloca i32*, align 8 14559 // CHECK10-NEXT: [[B:%.*]] = alloca i32*, align 8 14560 // CHECK10-NEXT: [[C:%.*]] = alloca i32*, align 8 14561 // CHECK10-NEXT: [[N:%.*]] = alloca i32, align 4 14562 // CHECK10-NEXT: [[CH:%.*]] = alloca i32, align 4 14563 // CHECK10-NEXT: [[N_CASTED:%.*]] = alloca i64, align 8 14564 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 8 14565 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 8 14566 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 8 14567 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 14568 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 14569 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 14570 // CHECK10-NEXT: [[N_CASTED3:%.*]] = alloca i64, align 8 14571 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS5:%.*]] = alloca [4 x i8*], align 8 14572 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS6:%.*]] = alloca [4 x i8*], align 8 14573 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS7:%.*]] = alloca [4 x i8*], align 8 14574 // CHECK10-NEXT: [[_TMP8:%.*]] = alloca i32, align 4 14575 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 14576 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_10:%.*]] = alloca i32, align 4 14577 // CHECK10-NEXT: [[CH_CASTED:%.*]] = alloca i64, align 8 14578 // CHECK10-NEXT: [[N_CASTED18:%.*]] = alloca i64, align 8 14579 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS20:%.*]] = alloca [5 x i8*], align 8 14580 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS21:%.*]] = alloca [5 x i8*], align 8 14581 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS22:%.*]] = alloca [5 x i8*], align 8 14582 // CHECK10-NEXT: [[_TMP23:%.*]] = alloca i32, align 4 14583 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_24:%.*]] = alloca i32, align 4 14584 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_25:%.*]] = alloca i32, align 4 14585 // CHECK10-NEXT: [[N_CASTED32:%.*]] = alloca i64, align 8 14586 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS34:%.*]] = alloca [4 x i8*], align 8 14587 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS35:%.*]] = alloca [4 x i8*], align 8 14588 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS36:%.*]] = alloca [4 x i8*], align 8 14589 // CHECK10-NEXT: [[_TMP37:%.*]] = alloca i32, align 4 14590 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_38:%.*]] = alloca i32, align 4 14591 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_39:%.*]] = alloca i32, align 4 14592 // CHECK10-NEXT: [[CH_CASTED46:%.*]] = alloca i64, align 8 14593 // CHECK10-NEXT: [[N_CASTED48:%.*]] = alloca i64, align 8 14594 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS50:%.*]] = alloca [5 x i8*], align 8 14595 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS51:%.*]] = alloca [5 x i8*], align 8 14596 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS52:%.*]] = alloca [5 x i8*], align 8 14597 // CHECK10-NEXT: [[_TMP53:%.*]] = alloca i32, align 4 14598 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_54:%.*]] = alloca i32, align 4 14599 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_55:%.*]] = alloca i32, align 4 14600 // CHECK10-NEXT: [[N_CASTED62:%.*]] = alloca i64, align 8 14601 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS64:%.*]] = alloca [4 x i8*], align 8 14602 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS65:%.*]] = alloca [4 x i8*], align 8 14603 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS66:%.*]] = alloca [4 x i8*], align 8 14604 // CHECK10-NEXT: [[_TMP67:%.*]] = alloca i32, align 4 14605 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_68:%.*]] = alloca i32, align 4 14606 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_69:%.*]] = alloca i32, align 4 14607 // CHECK10-NEXT: [[CH_CASTED76:%.*]] = alloca i64, align 8 14608 // CHECK10-NEXT: [[N_CASTED78:%.*]] = alloca i64, align 8 14609 // CHECK10-NEXT: [[DOTOFFLOAD_BASEPTRS80:%.*]] = alloca [5 x i8*], align 8 14610 // CHECK10-NEXT: [[DOTOFFLOAD_PTRS81:%.*]] = alloca [5 x i8*], align 8 14611 // CHECK10-NEXT: [[DOTOFFLOAD_MAPPERS82:%.*]] = alloca [5 x i8*], align 8 14612 // CHECK10-NEXT: [[_TMP83:%.*]] = alloca i32, align 4 14613 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_84:%.*]] = alloca i32, align 4 14614 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_85:%.*]] = alloca i32, align 4 14615 // CHECK10-NEXT: store i32 10000, i32* [[N]], align 4 14616 // CHECK10-NEXT: store i32 100, i32* [[CH]], align 4 14617 // CHECK10-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 14618 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_CASTED]] to i32* 14619 // CHECK10-NEXT: store i32 [[TMP0]], i32* [[CONV]], align 4 14620 // CHECK10-NEXT: [[TMP1:%.*]] = load i64, i64* [[N_CASTED]], align 8 14621 // CHECK10-NEXT: [[TMP2:%.*]] = load i32*, i32** [[A]], align 8 14622 // CHECK10-NEXT: [[TMP3:%.*]] = load i32*, i32** [[B]], align 8 14623 // CHECK10-NEXT: [[TMP4:%.*]] = load i32*, i32** [[C]], align 8 14624 // CHECK10-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 14625 // CHECK10-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i64* 14626 // CHECK10-NEXT: store i64 [[TMP1]], i64* [[TMP6]], align 8 14627 // CHECK10-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 14628 // CHECK10-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i64* 14629 // CHECK10-NEXT: store i64 [[TMP1]], i64* [[TMP8]], align 8 14630 // CHECK10-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0 14631 // CHECK10-NEXT: store i8* null, i8** [[TMP9]], align 8 14632 // CHECK10-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 14633 // CHECK10-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to i32** 14634 // CHECK10-NEXT: store i32* [[TMP2]], i32** [[TMP11]], align 8 14635 // CHECK10-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 14636 // CHECK10-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to i32** 14637 // CHECK10-NEXT: store i32* [[TMP2]], i32** [[TMP13]], align 8 14638 // CHECK10-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 1 14639 // CHECK10-NEXT: store i8* null, i8** [[TMP14]], align 8 14640 // CHECK10-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 14641 // CHECK10-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to i32** 14642 // CHECK10-NEXT: store i32* [[TMP3]], i32** [[TMP16]], align 8 14643 // CHECK10-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 14644 // CHECK10-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to i32** 14645 // CHECK10-NEXT: store i32* [[TMP3]], i32** [[TMP18]], align 8 14646 // CHECK10-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 2 14647 // CHECK10-NEXT: store i8* null, i8** [[TMP19]], align 8 14648 // CHECK10-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 14649 // CHECK10-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to i32** 14650 // CHECK10-NEXT: store i32* [[TMP4]], i32** [[TMP21]], align 8 14651 // CHECK10-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 14652 // CHECK10-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to i32** 14653 // CHECK10-NEXT: store i32* [[TMP4]], i32** [[TMP23]], align 8 14654 // CHECK10-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i64 0, i64 3 14655 // CHECK10-NEXT: store i8* null, i8** [[TMP24]], align 8 14656 // CHECK10-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 14657 // CHECK10-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 14658 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 14659 // CHECK10-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 14660 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 14661 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 14662 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 14663 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 14664 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 14665 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 14666 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 14667 // CHECK10-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 14668 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP30]]) 14669 // CHECK10-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.28, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.29, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14670 // CHECK10-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 14671 // CHECK10-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 14672 // CHECK10: omp_offload.failed: 14673 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42(i64 [[TMP1]], i32* [[TMP2]], i32* [[TMP3]], i32* [[TMP4]]) #[[ATTR2]] 14674 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT]] 14675 // CHECK10: omp_offload.cont: 14676 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 14677 // CHECK10-NEXT: [[CONV4:%.*]] = bitcast i64* [[N_CASTED3]] to i32* 14678 // CHECK10-NEXT: store i32 [[TMP33]], i32* [[CONV4]], align 4 14679 // CHECK10-NEXT: [[TMP34:%.*]] = load i64, i64* [[N_CASTED3]], align 8 14680 // CHECK10-NEXT: [[TMP35:%.*]] = load i32*, i32** [[A]], align 8 14681 // CHECK10-NEXT: [[TMP36:%.*]] = load i32*, i32** [[B]], align 8 14682 // CHECK10-NEXT: [[TMP37:%.*]] = load i32*, i32** [[C]], align 8 14683 // CHECK10-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 14684 // CHECK10-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i64* 14685 // CHECK10-NEXT: store i64 [[TMP34]], i64* [[TMP39]], align 8 14686 // CHECK10-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 14687 // CHECK10-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i64* 14688 // CHECK10-NEXT: store i64 [[TMP34]], i64* [[TMP41]], align 8 14689 // CHECK10-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 0 14690 // CHECK10-NEXT: store i8* null, i8** [[TMP42]], align 8 14691 // CHECK10-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 1 14692 // CHECK10-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to i32** 14693 // CHECK10-NEXT: store i32* [[TMP35]], i32** [[TMP44]], align 8 14694 // CHECK10-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 1 14695 // CHECK10-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to i32** 14696 // CHECK10-NEXT: store i32* [[TMP35]], i32** [[TMP46]], align 8 14697 // CHECK10-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 1 14698 // CHECK10-NEXT: store i8* null, i8** [[TMP47]], align 8 14699 // CHECK10-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 2 14700 // CHECK10-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to i32** 14701 // CHECK10-NEXT: store i32* [[TMP36]], i32** [[TMP49]], align 8 14702 // CHECK10-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 2 14703 // CHECK10-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to i32** 14704 // CHECK10-NEXT: store i32* [[TMP36]], i32** [[TMP51]], align 8 14705 // CHECK10-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 2 14706 // CHECK10-NEXT: store i8* null, i8** [[TMP52]], align 8 14707 // CHECK10-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 3 14708 // CHECK10-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to i32** 14709 // CHECK10-NEXT: store i32* [[TMP37]], i32** [[TMP54]], align 8 14710 // CHECK10-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 3 14711 // CHECK10-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to i32** 14712 // CHECK10-NEXT: store i32* [[TMP37]], i32** [[TMP56]], align 8 14713 // CHECK10-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS7]], i64 0, i64 3 14714 // CHECK10-NEXT: store i8* null, i8** [[TMP57]], align 8 14715 // CHECK10-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS5]], i32 0, i32 0 14716 // CHECK10-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS6]], i32 0, i32 0 14717 // CHECK10-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 14718 // CHECK10-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_9]], align 4 14719 // CHECK10-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 14720 // CHECK10-NEXT: [[SUB11:%.*]] = sub nsw i32 [[TMP61]], 0 14721 // CHECK10-NEXT: [[DIV12:%.*]] = sdiv i32 [[SUB11]], 1 14722 // CHECK10-NEXT: [[SUB13:%.*]] = sub nsw i32 [[DIV12]], 1 14723 // CHECK10-NEXT: store i32 [[SUB13]], i32* [[DOTCAPTURE_EXPR_10]], align 4 14724 // CHECK10-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_10]], align 4 14725 // CHECK10-NEXT: [[ADD14:%.*]] = add nsw i32 [[TMP62]], 1 14726 // CHECK10-NEXT: [[TMP63:%.*]] = zext i32 [[ADD14]] to i64 14727 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 14728 // CHECK10-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.32, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.33, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14729 // CHECK10-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 14730 // CHECK10-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED15:%.*]], label [[OMP_OFFLOAD_CONT16:%.*]] 14731 // CHECK10: omp_offload.failed15: 14732 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51(i64 [[TMP34]], i32* [[TMP35]], i32* [[TMP36]], i32* [[TMP37]]) #[[ATTR2]] 14733 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT16]] 14734 // CHECK10: omp_offload.cont16: 14735 // CHECK10-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 14736 // CHECK10-NEXT: [[CONV17:%.*]] = bitcast i64* [[CH_CASTED]] to i32* 14737 // CHECK10-NEXT: store i32 [[TMP66]], i32* [[CONV17]], align 4 14738 // CHECK10-NEXT: [[TMP67:%.*]] = load i64, i64* [[CH_CASTED]], align 8 14739 // CHECK10-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 14740 // CHECK10-NEXT: [[CONV19:%.*]] = bitcast i64* [[N_CASTED18]] to i32* 14741 // CHECK10-NEXT: store i32 [[TMP68]], i32* [[CONV19]], align 4 14742 // CHECK10-NEXT: [[TMP69:%.*]] = load i64, i64* [[N_CASTED18]], align 8 14743 // CHECK10-NEXT: [[TMP70:%.*]] = load i32*, i32** [[A]], align 8 14744 // CHECK10-NEXT: [[TMP71:%.*]] = load i32*, i32** [[B]], align 8 14745 // CHECK10-NEXT: [[TMP72:%.*]] = load i32*, i32** [[C]], align 8 14746 // CHECK10-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 14747 // CHECK10-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i64* 14748 // CHECK10-NEXT: store i64 [[TMP67]], i64* [[TMP74]], align 8 14749 // CHECK10-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 14750 // CHECK10-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i64* 14751 // CHECK10-NEXT: store i64 [[TMP67]], i64* [[TMP76]], align 8 14752 // CHECK10-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 0 14753 // CHECK10-NEXT: store i8* null, i8** [[TMP77]], align 8 14754 // CHECK10-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 1 14755 // CHECK10-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i64* 14756 // CHECK10-NEXT: store i64 [[TMP69]], i64* [[TMP79]], align 8 14757 // CHECK10-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 1 14758 // CHECK10-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i64* 14759 // CHECK10-NEXT: store i64 [[TMP69]], i64* [[TMP81]], align 8 14760 // CHECK10-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 1 14761 // CHECK10-NEXT: store i8* null, i8** [[TMP82]], align 8 14762 // CHECK10-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 2 14763 // CHECK10-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to i32** 14764 // CHECK10-NEXT: store i32* [[TMP70]], i32** [[TMP84]], align 8 14765 // CHECK10-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 2 14766 // CHECK10-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to i32** 14767 // CHECK10-NEXT: store i32* [[TMP70]], i32** [[TMP86]], align 8 14768 // CHECK10-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 2 14769 // CHECK10-NEXT: store i8* null, i8** [[TMP87]], align 8 14770 // CHECK10-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 3 14771 // CHECK10-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to i32** 14772 // CHECK10-NEXT: store i32* [[TMP71]], i32** [[TMP89]], align 8 14773 // CHECK10-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 3 14774 // CHECK10-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to i32** 14775 // CHECK10-NEXT: store i32* [[TMP71]], i32** [[TMP91]], align 8 14776 // CHECK10-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 3 14777 // CHECK10-NEXT: store i8* null, i8** [[TMP92]], align 8 14778 // CHECK10-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 4 14779 // CHECK10-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to i32** 14780 // CHECK10-NEXT: store i32* [[TMP72]], i32** [[TMP94]], align 8 14781 // CHECK10-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 4 14782 // CHECK10-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to i32** 14783 // CHECK10-NEXT: store i32* [[TMP72]], i32** [[TMP96]], align 8 14784 // CHECK10-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS22]], i64 0, i64 4 14785 // CHECK10-NEXT: store i8* null, i8** [[TMP97]], align 8 14786 // CHECK10-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS20]], i32 0, i32 0 14787 // CHECK10-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS21]], i32 0, i32 0 14788 // CHECK10-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 14789 // CHECK10-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_24]], align 4 14790 // CHECK10-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_24]], align 4 14791 // CHECK10-NEXT: [[SUB26:%.*]] = sub nsw i32 [[TMP101]], 0 14792 // CHECK10-NEXT: [[DIV27:%.*]] = sdiv i32 [[SUB26]], 1 14793 // CHECK10-NEXT: [[SUB28:%.*]] = sub nsw i32 [[DIV27]], 1 14794 // CHECK10-NEXT: store i32 [[SUB28]], i32* [[DOTCAPTURE_EXPR_25]], align 4 14795 // CHECK10-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_25]], align 4 14796 // CHECK10-NEXT: [[ADD29:%.*]] = add nsw i32 [[TMP102]], 1 14797 // CHECK10-NEXT: [[TMP103:%.*]] = zext i32 [[ADD29]] to i64 14798 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 14799 // CHECK10-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.36, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.37, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14800 // CHECK10-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 14801 // CHECK10-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED30:%.*]], label [[OMP_OFFLOAD_CONT31:%.*]] 14802 // CHECK10: omp_offload.failed30: 14803 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59(i64 [[TMP67]], i64 [[TMP69]], i32* [[TMP70]], i32* [[TMP71]], i32* [[TMP72]]) #[[ATTR2]] 14804 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT31]] 14805 // CHECK10: omp_offload.cont31: 14806 // CHECK10-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 14807 // CHECK10-NEXT: [[CONV33:%.*]] = bitcast i64* [[N_CASTED32]] to i32* 14808 // CHECK10-NEXT: store i32 [[TMP106]], i32* [[CONV33]], align 4 14809 // CHECK10-NEXT: [[TMP107:%.*]] = load i64, i64* [[N_CASTED32]], align 8 14810 // CHECK10-NEXT: [[TMP108:%.*]] = load i32*, i32** [[A]], align 8 14811 // CHECK10-NEXT: [[TMP109:%.*]] = load i32*, i32** [[B]], align 8 14812 // CHECK10-NEXT: [[TMP110:%.*]] = load i32*, i32** [[C]], align 8 14813 // CHECK10-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 14814 // CHECK10-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i64* 14815 // CHECK10-NEXT: store i64 [[TMP107]], i64* [[TMP112]], align 8 14816 // CHECK10-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 14817 // CHECK10-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i64* 14818 // CHECK10-NEXT: store i64 [[TMP107]], i64* [[TMP114]], align 8 14819 // CHECK10-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 0 14820 // CHECK10-NEXT: store i8* null, i8** [[TMP115]], align 8 14821 // CHECK10-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 1 14822 // CHECK10-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to i32** 14823 // CHECK10-NEXT: store i32* [[TMP108]], i32** [[TMP117]], align 8 14824 // CHECK10-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 1 14825 // CHECK10-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to i32** 14826 // CHECK10-NEXT: store i32* [[TMP108]], i32** [[TMP119]], align 8 14827 // CHECK10-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 1 14828 // CHECK10-NEXT: store i8* null, i8** [[TMP120]], align 8 14829 // CHECK10-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 2 14830 // CHECK10-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to i32** 14831 // CHECK10-NEXT: store i32* [[TMP109]], i32** [[TMP122]], align 8 14832 // CHECK10-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 2 14833 // CHECK10-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to i32** 14834 // CHECK10-NEXT: store i32* [[TMP109]], i32** [[TMP124]], align 8 14835 // CHECK10-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 2 14836 // CHECK10-NEXT: store i8* null, i8** [[TMP125]], align 8 14837 // CHECK10-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 3 14838 // CHECK10-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to i32** 14839 // CHECK10-NEXT: store i32* [[TMP110]], i32** [[TMP127]], align 8 14840 // CHECK10-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 3 14841 // CHECK10-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to i32** 14842 // CHECK10-NEXT: store i32* [[TMP110]], i32** [[TMP129]], align 8 14843 // CHECK10-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS36]], i64 0, i64 3 14844 // CHECK10-NEXT: store i8* null, i8** [[TMP130]], align 8 14845 // CHECK10-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS34]], i32 0, i32 0 14846 // CHECK10-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS35]], i32 0, i32 0 14847 // CHECK10-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 14848 // CHECK10-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_38]], align 4 14849 // CHECK10-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_38]], align 4 14850 // CHECK10-NEXT: [[SUB40:%.*]] = sub nsw i32 [[TMP134]], 0 14851 // CHECK10-NEXT: [[DIV41:%.*]] = sdiv i32 [[SUB40]], 1 14852 // CHECK10-NEXT: [[SUB42:%.*]] = sub nsw i32 [[DIV41]], 1 14853 // CHECK10-NEXT: store i32 [[SUB42]], i32* [[DOTCAPTURE_EXPR_39]], align 4 14854 // CHECK10-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_39]], align 4 14855 // CHECK10-NEXT: [[ADD43:%.*]] = add nsw i32 [[TMP135]], 1 14856 // CHECK10-NEXT: [[TMP136:%.*]] = zext i32 [[ADD43]] to i64 14857 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 14858 // CHECK10-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.40, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.41, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14859 // CHECK10-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 14860 // CHECK10-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED44:%.*]], label [[OMP_OFFLOAD_CONT45:%.*]] 14861 // CHECK10: omp_offload.failed44: 14862 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67(i64 [[TMP107]], i32* [[TMP108]], i32* [[TMP109]], i32* [[TMP110]]) #[[ATTR2]] 14863 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT45]] 14864 // CHECK10: omp_offload.cont45: 14865 // CHECK10-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 14866 // CHECK10-NEXT: [[CONV47:%.*]] = bitcast i64* [[CH_CASTED46]] to i32* 14867 // CHECK10-NEXT: store i32 [[TMP139]], i32* [[CONV47]], align 4 14868 // CHECK10-NEXT: [[TMP140:%.*]] = load i64, i64* [[CH_CASTED46]], align 8 14869 // CHECK10-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 14870 // CHECK10-NEXT: [[CONV49:%.*]] = bitcast i64* [[N_CASTED48]] to i32* 14871 // CHECK10-NEXT: store i32 [[TMP141]], i32* [[CONV49]], align 4 14872 // CHECK10-NEXT: [[TMP142:%.*]] = load i64, i64* [[N_CASTED48]], align 8 14873 // CHECK10-NEXT: [[TMP143:%.*]] = load i32*, i32** [[A]], align 8 14874 // CHECK10-NEXT: [[TMP144:%.*]] = load i32*, i32** [[B]], align 8 14875 // CHECK10-NEXT: [[TMP145:%.*]] = load i32*, i32** [[C]], align 8 14876 // CHECK10-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 14877 // CHECK10-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i64* 14878 // CHECK10-NEXT: store i64 [[TMP140]], i64* [[TMP147]], align 8 14879 // CHECK10-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 14880 // CHECK10-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i64* 14881 // CHECK10-NEXT: store i64 [[TMP140]], i64* [[TMP149]], align 8 14882 // CHECK10-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 0 14883 // CHECK10-NEXT: store i8* null, i8** [[TMP150]], align 8 14884 // CHECK10-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 1 14885 // CHECK10-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i64* 14886 // CHECK10-NEXT: store i64 [[TMP142]], i64* [[TMP152]], align 8 14887 // CHECK10-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 1 14888 // CHECK10-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i64* 14889 // CHECK10-NEXT: store i64 [[TMP142]], i64* [[TMP154]], align 8 14890 // CHECK10-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 1 14891 // CHECK10-NEXT: store i8* null, i8** [[TMP155]], align 8 14892 // CHECK10-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 2 14893 // CHECK10-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to i32** 14894 // CHECK10-NEXT: store i32* [[TMP143]], i32** [[TMP157]], align 8 14895 // CHECK10-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 2 14896 // CHECK10-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to i32** 14897 // CHECK10-NEXT: store i32* [[TMP143]], i32** [[TMP159]], align 8 14898 // CHECK10-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 2 14899 // CHECK10-NEXT: store i8* null, i8** [[TMP160]], align 8 14900 // CHECK10-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 3 14901 // CHECK10-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to i32** 14902 // CHECK10-NEXT: store i32* [[TMP144]], i32** [[TMP162]], align 8 14903 // CHECK10-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 3 14904 // CHECK10-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to i32** 14905 // CHECK10-NEXT: store i32* [[TMP144]], i32** [[TMP164]], align 8 14906 // CHECK10-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 3 14907 // CHECK10-NEXT: store i8* null, i8** [[TMP165]], align 8 14908 // CHECK10-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 4 14909 // CHECK10-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to i32** 14910 // CHECK10-NEXT: store i32* [[TMP145]], i32** [[TMP167]], align 8 14911 // CHECK10-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 4 14912 // CHECK10-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to i32** 14913 // CHECK10-NEXT: store i32* [[TMP145]], i32** [[TMP169]], align 8 14914 // CHECK10-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS52]], i64 0, i64 4 14915 // CHECK10-NEXT: store i8* null, i8** [[TMP170]], align 8 14916 // CHECK10-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS50]], i32 0, i32 0 14917 // CHECK10-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS51]], i32 0, i32 0 14918 // CHECK10-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 14919 // CHECK10-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_54]], align 4 14920 // CHECK10-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_54]], align 4 14921 // CHECK10-NEXT: [[SUB56:%.*]] = sub nsw i32 [[TMP174]], 0 14922 // CHECK10-NEXT: [[DIV57:%.*]] = sdiv i32 [[SUB56]], 1 14923 // CHECK10-NEXT: [[SUB58:%.*]] = sub nsw i32 [[DIV57]], 1 14924 // CHECK10-NEXT: store i32 [[SUB58]], i32* [[DOTCAPTURE_EXPR_55]], align 4 14925 // CHECK10-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_55]], align 4 14926 // CHECK10-NEXT: [[ADD59:%.*]] = add nsw i32 [[TMP175]], 1 14927 // CHECK10-NEXT: [[TMP176:%.*]] = zext i32 [[ADD59]] to i64 14928 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 14929 // CHECK10-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.44, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.45, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14930 // CHECK10-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 14931 // CHECK10-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED60:%.*]], label [[OMP_OFFLOAD_CONT61:%.*]] 14932 // CHECK10: omp_offload.failed60: 14933 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75(i64 [[TMP140]], i64 [[TMP142]], i32* [[TMP143]], i32* [[TMP144]], i32* [[TMP145]]) #[[ATTR2]] 14934 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT61]] 14935 // CHECK10: omp_offload.cont61: 14936 // CHECK10-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 14937 // CHECK10-NEXT: [[CONV63:%.*]] = bitcast i64* [[N_CASTED62]] to i32* 14938 // CHECK10-NEXT: store i32 [[TMP179]], i32* [[CONV63]], align 4 14939 // CHECK10-NEXT: [[TMP180:%.*]] = load i64, i64* [[N_CASTED62]], align 8 14940 // CHECK10-NEXT: [[TMP181:%.*]] = load i32*, i32** [[A]], align 8 14941 // CHECK10-NEXT: [[TMP182:%.*]] = load i32*, i32** [[B]], align 8 14942 // CHECK10-NEXT: [[TMP183:%.*]] = load i32*, i32** [[C]], align 8 14943 // CHECK10-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 14944 // CHECK10-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i64* 14945 // CHECK10-NEXT: store i64 [[TMP180]], i64* [[TMP185]], align 8 14946 // CHECK10-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 14947 // CHECK10-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i64* 14948 // CHECK10-NEXT: store i64 [[TMP180]], i64* [[TMP187]], align 8 14949 // CHECK10-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 0 14950 // CHECK10-NEXT: store i8* null, i8** [[TMP188]], align 8 14951 // CHECK10-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 1 14952 // CHECK10-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to i32** 14953 // CHECK10-NEXT: store i32* [[TMP181]], i32** [[TMP190]], align 8 14954 // CHECK10-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 1 14955 // CHECK10-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to i32** 14956 // CHECK10-NEXT: store i32* [[TMP181]], i32** [[TMP192]], align 8 14957 // CHECK10-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 1 14958 // CHECK10-NEXT: store i8* null, i8** [[TMP193]], align 8 14959 // CHECK10-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 2 14960 // CHECK10-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to i32** 14961 // CHECK10-NEXT: store i32* [[TMP182]], i32** [[TMP195]], align 8 14962 // CHECK10-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 2 14963 // CHECK10-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to i32** 14964 // CHECK10-NEXT: store i32* [[TMP182]], i32** [[TMP197]], align 8 14965 // CHECK10-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 2 14966 // CHECK10-NEXT: store i8* null, i8** [[TMP198]], align 8 14967 // CHECK10-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 3 14968 // CHECK10-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to i32** 14969 // CHECK10-NEXT: store i32* [[TMP183]], i32** [[TMP200]], align 8 14970 // CHECK10-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 3 14971 // CHECK10-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to i32** 14972 // CHECK10-NEXT: store i32* [[TMP183]], i32** [[TMP202]], align 8 14973 // CHECK10-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS66]], i64 0, i64 3 14974 // CHECK10-NEXT: store i8* null, i8** [[TMP203]], align 8 14975 // CHECK10-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS64]], i32 0, i32 0 14976 // CHECK10-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS65]], i32 0, i32 0 14977 // CHECK10-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 14978 // CHECK10-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_68]], align 4 14979 // CHECK10-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_68]], align 4 14980 // CHECK10-NEXT: [[SUB70:%.*]] = sub nsw i32 [[TMP207]], 0 14981 // CHECK10-NEXT: [[DIV71:%.*]] = sdiv i32 [[SUB70]], 1 14982 // CHECK10-NEXT: [[SUB72:%.*]] = sub nsw i32 [[DIV71]], 1 14983 // CHECK10-NEXT: store i32 [[SUB72]], i32* [[DOTCAPTURE_EXPR_69]], align 4 14984 // CHECK10-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_69]], align 4 14985 // CHECK10-NEXT: [[ADD73:%.*]] = add nsw i32 [[TMP208]], 1 14986 // CHECK10-NEXT: [[TMP209:%.*]] = zext i32 [[ADD73]] to i64 14987 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 14988 // CHECK10-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.48, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.49, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 14989 // CHECK10-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 14990 // CHECK10-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED74:%.*]], label [[OMP_OFFLOAD_CONT75:%.*]] 14991 // CHECK10: omp_offload.failed74: 14992 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83(i64 [[TMP180]], i32* [[TMP181]], i32* [[TMP182]], i32* [[TMP183]]) #[[ATTR2]] 14993 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT75]] 14994 // CHECK10: omp_offload.cont75: 14995 // CHECK10-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 14996 // CHECK10-NEXT: [[CONV77:%.*]] = bitcast i64* [[CH_CASTED76]] to i32* 14997 // CHECK10-NEXT: store i32 [[TMP212]], i32* [[CONV77]], align 4 14998 // CHECK10-NEXT: [[TMP213:%.*]] = load i64, i64* [[CH_CASTED76]], align 8 14999 // CHECK10-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 15000 // CHECK10-NEXT: [[CONV79:%.*]] = bitcast i64* [[N_CASTED78]] to i32* 15001 // CHECK10-NEXT: store i32 [[TMP214]], i32* [[CONV79]], align 4 15002 // CHECK10-NEXT: [[TMP215:%.*]] = load i64, i64* [[N_CASTED78]], align 8 15003 // CHECK10-NEXT: [[TMP216:%.*]] = load i32*, i32** [[A]], align 8 15004 // CHECK10-NEXT: [[TMP217:%.*]] = load i32*, i32** [[B]], align 8 15005 // CHECK10-NEXT: [[TMP218:%.*]] = load i32*, i32** [[C]], align 8 15006 // CHECK10-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 15007 // CHECK10-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i64* 15008 // CHECK10-NEXT: store i64 [[TMP213]], i64* [[TMP220]], align 8 15009 // CHECK10-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 15010 // CHECK10-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i64* 15011 // CHECK10-NEXT: store i64 [[TMP213]], i64* [[TMP222]], align 8 15012 // CHECK10-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 0 15013 // CHECK10-NEXT: store i8* null, i8** [[TMP223]], align 8 15014 // CHECK10-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 1 15015 // CHECK10-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i64* 15016 // CHECK10-NEXT: store i64 [[TMP215]], i64* [[TMP225]], align 8 15017 // CHECK10-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 1 15018 // CHECK10-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i64* 15019 // CHECK10-NEXT: store i64 [[TMP215]], i64* [[TMP227]], align 8 15020 // CHECK10-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 1 15021 // CHECK10-NEXT: store i8* null, i8** [[TMP228]], align 8 15022 // CHECK10-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 2 15023 // CHECK10-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to i32** 15024 // CHECK10-NEXT: store i32* [[TMP216]], i32** [[TMP230]], align 8 15025 // CHECK10-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 2 15026 // CHECK10-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to i32** 15027 // CHECK10-NEXT: store i32* [[TMP216]], i32** [[TMP232]], align 8 15028 // CHECK10-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 2 15029 // CHECK10-NEXT: store i8* null, i8** [[TMP233]], align 8 15030 // CHECK10-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 3 15031 // CHECK10-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to i32** 15032 // CHECK10-NEXT: store i32* [[TMP217]], i32** [[TMP235]], align 8 15033 // CHECK10-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 3 15034 // CHECK10-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to i32** 15035 // CHECK10-NEXT: store i32* [[TMP217]], i32** [[TMP237]], align 8 15036 // CHECK10-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 3 15037 // CHECK10-NEXT: store i8* null, i8** [[TMP238]], align 8 15038 // CHECK10-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 4 15039 // CHECK10-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to i32** 15040 // CHECK10-NEXT: store i32* [[TMP218]], i32** [[TMP240]], align 8 15041 // CHECK10-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 4 15042 // CHECK10-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to i32** 15043 // CHECK10-NEXT: store i32* [[TMP218]], i32** [[TMP242]], align 8 15044 // CHECK10-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS82]], i64 0, i64 4 15045 // CHECK10-NEXT: store i8* null, i8** [[TMP243]], align 8 15046 // CHECK10-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS80]], i32 0, i32 0 15047 // CHECK10-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS81]], i32 0, i32 0 15048 // CHECK10-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 15049 // CHECK10-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_84]], align 4 15050 // CHECK10-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_84]], align 4 15051 // CHECK10-NEXT: [[SUB86:%.*]] = sub nsw i32 [[TMP247]], 0 15052 // CHECK10-NEXT: [[DIV87:%.*]] = sdiv i32 [[SUB86]], 1 15053 // CHECK10-NEXT: [[SUB88:%.*]] = sub nsw i32 [[DIV87]], 1 15054 // CHECK10-NEXT: store i32 [[SUB88]], i32* [[DOTCAPTURE_EXPR_85]], align 4 15055 // CHECK10-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_85]], align 4 15056 // CHECK10-NEXT: [[ADD89:%.*]] = add nsw i32 [[TMP248]], 1 15057 // CHECK10-NEXT: [[TMP249:%.*]] = zext i32 [[ADD89]] to i64 15058 // CHECK10-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 15059 // CHECK10-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.52, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.53, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 15060 // CHECK10-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 15061 // CHECK10-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED90:%.*]], label [[OMP_OFFLOAD_CONT91:%.*]] 15062 // CHECK10: omp_offload.failed90: 15063 // CHECK10-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91(i64 [[TMP213]], i64 [[TMP215]], i32* [[TMP216]], i32* [[TMP217]], i32* [[TMP218]]) #[[ATTR2]] 15064 // CHECK10-NEXT: br label [[OMP_OFFLOAD_CONT91]] 15065 // CHECK10: omp_offload.cont91: 15066 // CHECK10-NEXT: ret i32 0 15067 // 15068 // 15069 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42 15070 // CHECK10-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 15071 // CHECK10-NEXT: entry: 15072 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 15073 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 15074 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 15075 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 15076 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 15077 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 15078 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 15079 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 15080 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 15081 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..26 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 15082 // CHECK10-NEXT: ret void 15083 // 15084 // 15085 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..26 15086 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15087 // CHECK10-NEXT: entry: 15088 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15089 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15090 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15091 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15092 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15093 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15094 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15095 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15096 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15097 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15098 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15099 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 15100 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 15101 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15102 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15103 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 15104 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15105 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15106 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15107 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15108 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15109 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15110 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15111 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15112 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15113 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15114 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15115 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15116 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15117 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15118 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15119 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15120 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15121 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15122 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15123 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15124 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15125 // CHECK10: omp.precond.then: 15126 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 15127 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15128 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 15129 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15130 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15131 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15132 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 15133 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15134 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15135 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15136 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 15137 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15138 // CHECK10: cond.true: 15139 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15140 // CHECK10-NEXT: br label [[COND_END:%.*]] 15141 // CHECK10: cond.false: 15142 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15143 // CHECK10-NEXT: br label [[COND_END]] 15144 // CHECK10: cond.end: 15145 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 15146 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 15147 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15148 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 15149 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15150 // CHECK10: omp.inner.for.cond: 15151 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15152 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15153 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 15154 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15155 // CHECK10: omp.inner.for.body: 15156 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15157 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 15158 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15159 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 15160 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..27 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 15161 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15162 // CHECK10: omp.inner.for.inc: 15163 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15164 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15165 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 15166 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 15167 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15168 // CHECK10: omp.inner.for.end: 15169 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15170 // CHECK10: omp.loop.exit: 15171 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15172 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 15173 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 15174 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15175 // CHECK10: omp.precond.end: 15176 // CHECK10-NEXT: ret void 15177 // 15178 // 15179 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..27 15180 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15181 // CHECK10-NEXT: entry: 15182 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15183 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15184 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 15185 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 15186 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15187 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15188 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15189 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15190 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15191 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15192 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15193 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15194 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15195 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 15196 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 15197 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15198 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15199 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 15200 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15201 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15202 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15203 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15204 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15205 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15206 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15207 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15208 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15209 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15210 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15211 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15212 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15213 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15214 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15215 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15216 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15217 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15218 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15219 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15220 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15221 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15222 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15223 // CHECK10: omp.precond.then: 15224 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 15225 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15226 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 15227 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15228 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 15229 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15230 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 15231 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 15232 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 15233 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15234 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15235 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15236 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 15237 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15238 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15239 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15240 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 15241 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15242 // CHECK10: cond.true: 15243 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15244 // CHECK10-NEXT: br label [[COND_END:%.*]] 15245 // CHECK10: cond.false: 15246 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15247 // CHECK10-NEXT: br label [[COND_END]] 15248 // CHECK10: cond.end: 15249 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 15250 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 15251 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 15252 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 15253 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15254 // CHECK10: omp.inner.for.cond: 15255 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15256 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15257 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 15258 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15259 // CHECK10: omp.inner.for.body: 15260 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15261 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 15262 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 15263 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 15264 // CHECK10-NEXT: [[TMP20:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15265 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[TMP20]], align 4 15266 // CHECK10-NEXT: [[TMP22:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* @[[GLOB3]], i32 [[TMP21]], i32 2) 15267 // CHECK10-NEXT: [[TMP23:%.*]] = icmp ne i32 [[TMP22]], 0 15268 // CHECK10-NEXT: br i1 [[TMP23]], label [[DOTCANCEL_EXIT:%.*]], label [[DOTCANCEL_CONTINUE:%.*]] 15269 // CHECK10: .cancel.exit: 15270 // CHECK10-NEXT: br label [[CANCEL_EXIT:%.*]] 15271 // CHECK10: .cancel.continue: 15272 // CHECK10-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP2]], align 8 15273 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4 15274 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP25]] to i64 15275 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM]] 15276 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 15277 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP3]], align 8 15278 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4 15279 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP28]] to i64 15280 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM7]] 15281 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 15282 // CHECK10-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 15283 // CHECK10-NEXT: [[TMP30:%.*]] = load i32*, i32** [[TMP1]], align 8 15284 // CHECK10-NEXT: [[TMP31:%.*]] = load i32, i32* [[I4]], align 4 15285 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP31]] to i64 15286 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i64 [[IDXPROM10]] 15287 // CHECK10-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 15288 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 15289 // CHECK10: omp.body.continue: 15290 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15291 // CHECK10: omp.inner.for.inc: 15292 // CHECK10-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15293 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], 1 15294 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 15295 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15296 // CHECK10: omp.inner.for.end: 15297 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15298 // CHECK10: omp.loop.exit: 15299 // CHECK10-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15300 // CHECK10-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 15301 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 15302 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15303 // CHECK10: cancel.exit: 15304 // CHECK10-NEXT: [[TMP35:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15305 // CHECK10-NEXT: [[TMP36:%.*]] = load i32, i32* [[TMP35]], align 4 15306 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP36]]) 15307 // CHECK10-NEXT: br label [[CANCEL_CONT:%.*]] 15308 // CHECK10: omp.precond.end: 15309 // CHECK10-NEXT: br label [[CANCEL_CONT]] 15310 // CHECK10: cancel.cont: 15311 // CHECK10-NEXT: ret void 15312 // 15313 // 15314 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51 15315 // CHECK10-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 15316 // CHECK10-NEXT: entry: 15317 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 15318 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 15319 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 15320 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 15321 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 15322 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 15323 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 15324 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 15325 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 15326 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 15327 // CHECK10-NEXT: ret void 15328 // 15329 // 15330 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..30 15331 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15332 // CHECK10-NEXT: entry: 15333 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15334 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15335 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15336 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15337 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15338 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15339 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15340 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15341 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15342 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15343 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15344 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 15345 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 15346 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15347 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15348 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 15349 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15350 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15351 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15352 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15353 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15354 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15355 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15356 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15357 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15358 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15359 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15360 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15361 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15362 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15363 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15364 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15365 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15366 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15367 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15368 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15369 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15370 // CHECK10: omp.precond.then: 15371 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 15372 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15373 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 15374 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15375 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15376 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15377 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 15378 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15379 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15380 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15381 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 15382 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15383 // CHECK10: cond.true: 15384 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15385 // CHECK10-NEXT: br label [[COND_END:%.*]] 15386 // CHECK10: cond.false: 15387 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15388 // CHECK10-NEXT: br label [[COND_END]] 15389 // CHECK10: cond.end: 15390 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 15391 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 15392 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15393 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 15394 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15395 // CHECK10: omp.inner.for.cond: 15396 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15397 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15398 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 15399 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15400 // CHECK10: omp.inner.for.body: 15401 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15402 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 15403 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15404 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 15405 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 15406 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15407 // CHECK10: omp.inner.for.inc: 15408 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15409 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15410 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 15411 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 15412 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15413 // CHECK10: omp.inner.for.end: 15414 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15415 // CHECK10: omp.loop.exit: 15416 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15417 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 15418 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 15419 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15420 // CHECK10: omp.precond.end: 15421 // CHECK10-NEXT: ret void 15422 // 15423 // 15424 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..31 15425 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15426 // CHECK10-NEXT: entry: 15427 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15428 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15429 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 15430 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 15431 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15432 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15433 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15434 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15435 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15436 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15437 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15438 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15439 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15440 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 15441 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 15442 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15443 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15444 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 15445 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15446 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15447 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15448 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15449 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15450 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15451 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15452 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15453 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15454 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15455 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15456 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15457 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15458 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15459 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15460 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15461 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15462 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15463 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15464 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15465 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15466 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15467 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15468 // CHECK10: omp.precond.then: 15469 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 15470 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15471 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 15472 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15473 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 15474 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15475 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 15476 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 15477 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 15478 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15479 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15480 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15481 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 15482 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15483 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15484 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15485 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 15486 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15487 // CHECK10: cond.true: 15488 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15489 // CHECK10-NEXT: br label [[COND_END:%.*]] 15490 // CHECK10: cond.false: 15491 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15492 // CHECK10-NEXT: br label [[COND_END]] 15493 // CHECK10: cond.end: 15494 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 15495 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 15496 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 15497 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 15498 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15499 // CHECK10: omp.inner.for.cond: 15500 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15501 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15502 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 15503 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15504 // CHECK10: omp.inner.for.body: 15505 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15506 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 15507 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 15508 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 15509 // CHECK10-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 15510 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 15511 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 15512 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 15513 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 15514 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 15515 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 15516 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 15517 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 15518 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 15519 // CHECK10-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 15520 // CHECK10-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 15521 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 15522 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 15523 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 15524 // CHECK10-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 15525 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 15526 // CHECK10: omp.body.continue: 15527 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15528 // CHECK10: omp.inner.for.inc: 15529 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15530 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 15531 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 15532 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15533 // CHECK10: omp.inner.for.end: 15534 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15535 // CHECK10: omp.loop.exit: 15536 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15537 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 15538 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 15539 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15540 // CHECK10: omp.precond.end: 15541 // CHECK10-NEXT: ret void 15542 // 15543 // 15544 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59 15545 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 15546 // CHECK10-NEXT: entry: 15547 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 15548 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 15549 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 15550 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 15551 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 15552 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 15553 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 15554 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 15555 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 15556 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 15557 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 15558 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 15559 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 15560 // CHECK10-NEXT: ret void 15561 // 15562 // 15563 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..34 15564 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15565 // CHECK10-NEXT: entry: 15566 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15567 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15568 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 15569 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15570 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15571 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15572 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15573 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15574 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15575 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15576 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15577 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15578 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 15579 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 15580 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15581 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15582 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 15583 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15584 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15585 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 15586 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15587 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15588 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15589 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15590 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 15591 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15592 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15593 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15594 // CHECK10-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15595 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 15596 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 15597 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15598 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 15599 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15600 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15601 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15602 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15603 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15604 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 15605 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15606 // CHECK10: omp.precond.then: 15607 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 15608 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15609 // CHECK10-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 15610 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15611 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15612 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 15613 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15614 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 15615 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 15616 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15617 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15618 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 15619 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15620 // CHECK10: cond.true: 15621 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15622 // CHECK10-NEXT: br label [[COND_END:%.*]] 15623 // CHECK10: cond.false: 15624 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15625 // CHECK10-NEXT: br label [[COND_END]] 15626 // CHECK10: cond.end: 15627 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 15628 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 15629 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15630 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 15631 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15632 // CHECK10: omp.inner.for.cond: 15633 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15634 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15635 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 15636 // CHECK10-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 15637 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15638 // CHECK10: omp.inner.for.body: 15639 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15640 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 15641 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15642 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 15643 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]]) 15644 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15645 // CHECK10: omp.inner.for.inc: 15646 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15647 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15648 // CHECK10-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 15649 // CHECK10-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 15650 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15651 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15652 // CHECK10-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 15653 // CHECK10-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 15654 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15655 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15656 // CHECK10-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP27]], [[TMP28]] 15657 // CHECK10-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 15658 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15659 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15660 // CHECK10-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP29]], [[TMP30]] 15661 // CHECK10-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 15662 // CHECK10: cond.true10: 15663 // CHECK10-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15664 // CHECK10-NEXT: br label [[COND_END12:%.*]] 15665 // CHECK10: cond.false11: 15666 // CHECK10-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15667 // CHECK10-NEXT: br label [[COND_END12]] 15668 // CHECK10: cond.end12: 15669 // CHECK10-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP31]], [[COND_TRUE10]] ], [ [[TMP32]], [[COND_FALSE11]] ] 15670 // CHECK10-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 15671 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15672 // CHECK10-NEXT: store i32 [[TMP33]], i32* [[DOTOMP_IV]], align 4 15673 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15674 // CHECK10: omp.inner.for.end: 15675 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15676 // CHECK10: omp.loop.exit: 15677 // CHECK10-NEXT: [[TMP34:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15678 // CHECK10-NEXT: [[TMP35:%.*]] = load i32, i32* [[TMP34]], align 4 15679 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP35]]) 15680 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15681 // CHECK10: omp.precond.end: 15682 // CHECK10-NEXT: ret void 15683 // 15684 // 15685 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..35 15686 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15687 // CHECK10-NEXT: entry: 15688 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15689 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15690 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 15691 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 15692 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15693 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15694 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15695 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15696 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15697 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15698 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15699 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15700 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15701 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 15702 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 15703 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15704 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15705 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 15706 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15707 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15708 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15709 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15710 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15711 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15712 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15713 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15714 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15715 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15716 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15717 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15718 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15719 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15720 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15721 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15722 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15723 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15724 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15725 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15726 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15727 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15728 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15729 // CHECK10: omp.precond.then: 15730 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 15731 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15732 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 15733 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15734 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 15735 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15736 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 15737 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 15738 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 15739 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15740 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15741 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15742 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 15743 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15744 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15745 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15746 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 15747 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15748 // CHECK10: cond.true: 15749 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15750 // CHECK10-NEXT: br label [[COND_END:%.*]] 15751 // CHECK10: cond.false: 15752 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15753 // CHECK10-NEXT: br label [[COND_END]] 15754 // CHECK10: cond.end: 15755 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 15756 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 15757 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 15758 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 15759 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15760 // CHECK10: omp.inner.for.cond: 15761 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15762 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15763 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 15764 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15765 // CHECK10: omp.inner.for.body: 15766 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15767 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 15768 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 15769 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 15770 // CHECK10-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 15771 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 15772 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 15773 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 15774 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 15775 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 15776 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 15777 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 15778 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 15779 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 15780 // CHECK10-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 15781 // CHECK10-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 15782 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 15783 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 15784 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 15785 // CHECK10-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 15786 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 15787 // CHECK10: omp.body.continue: 15788 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15789 // CHECK10: omp.inner.for.inc: 15790 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15791 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 15792 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 15793 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15794 // CHECK10: omp.inner.for.end: 15795 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15796 // CHECK10: omp.loop.exit: 15797 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15798 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 15799 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 15800 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15801 // CHECK10: omp.precond.end: 15802 // CHECK10-NEXT: ret void 15803 // 15804 // 15805 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67 15806 // CHECK10-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 15807 // CHECK10-NEXT: entry: 15808 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 15809 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 15810 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 15811 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 15812 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 15813 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 15814 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 15815 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 15816 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 15817 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..38 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 15818 // CHECK10-NEXT: ret void 15819 // 15820 // 15821 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..38 15822 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15823 // CHECK10-NEXT: entry: 15824 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15825 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15826 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15827 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15828 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15829 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15830 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15831 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15832 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15833 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15834 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15835 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 15836 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 15837 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15838 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15839 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 15840 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15841 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15842 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15843 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15844 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15845 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15846 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15847 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15848 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15849 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15850 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15851 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15852 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15853 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15854 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15855 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15856 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15857 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15858 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15859 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15860 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15861 // CHECK10: omp.precond.then: 15862 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 15863 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15864 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 15865 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15866 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15867 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15868 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 15869 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15870 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15871 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15872 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 15873 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15874 // CHECK10: cond.true: 15875 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15876 // CHECK10-NEXT: br label [[COND_END:%.*]] 15877 // CHECK10: cond.false: 15878 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15879 // CHECK10-NEXT: br label [[COND_END]] 15880 // CHECK10: cond.end: 15881 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 15882 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 15883 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15884 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 15885 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15886 // CHECK10: omp.inner.for.cond: 15887 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15888 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15889 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 15890 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15891 // CHECK10: omp.inner.for.body: 15892 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 15893 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 15894 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 15895 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 15896 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 15897 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 15898 // CHECK10: omp.inner.for.inc: 15899 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15900 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 15901 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 15902 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 15903 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 15904 // CHECK10: omp.inner.for.end: 15905 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 15906 // CHECK10: omp.loop.exit: 15907 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15908 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 15909 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 15910 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 15911 // CHECK10: omp.precond.end: 15912 // CHECK10-NEXT: ret void 15913 // 15914 // 15915 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..39 15916 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 15917 // CHECK10-NEXT: entry: 15918 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 15919 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 15920 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 15921 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 15922 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 15923 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 15924 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 15925 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 15926 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 15927 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 15928 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 15929 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 15930 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 15931 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 15932 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 15933 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 15934 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 15935 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 15936 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 15937 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 15938 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15939 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15940 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 15941 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 15942 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 15943 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 15944 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 15945 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 15946 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 15947 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 15948 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 15949 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 15950 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15951 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 15952 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 15953 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 15954 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 15955 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 15956 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 15957 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 15958 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 15959 // CHECK10: omp.precond.then: 15960 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 15961 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15962 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 15963 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 15964 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 15965 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 15966 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 15967 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 15968 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 15969 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 15970 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 15971 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 15972 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 15973 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 15974 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15975 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15976 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 15977 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 15978 // CHECK10: cond.true: 15979 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 15980 // CHECK10-NEXT: br label [[COND_END:%.*]] 15981 // CHECK10: cond.false: 15982 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15983 // CHECK10-NEXT: br label [[COND_END]] 15984 // CHECK10: cond.end: 15985 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 15986 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 15987 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 15988 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 15989 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 15990 // CHECK10: omp.inner.for.cond: 15991 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15992 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 15993 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 15994 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 15995 // CHECK10: omp.inner.for.body: 15996 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 15997 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 15998 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 15999 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 16000 // CHECK10-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 8 16001 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[I4]], align 4 16002 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP21]] to i64 16003 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i64 [[IDXPROM]] 16004 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 16005 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 8 16006 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 16007 // CHECK10-NEXT: [[IDXPROM7:%.*]] = sext i32 [[TMP24]] to i64 16008 // CHECK10-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM7]] 16009 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 16010 // CHECK10-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 16011 // CHECK10-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 8 16012 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 16013 // CHECK10-NEXT: [[IDXPROM10:%.*]] = sext i32 [[TMP27]] to i64 16014 // CHECK10-NEXT: [[ARRAYIDX11:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM10]] 16015 // CHECK10-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX11]], align 4 16016 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 16017 // CHECK10: omp.body.continue: 16018 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16019 // CHECK10: omp.inner.for.inc: 16020 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16021 // CHECK10-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP28]], 1 16022 // CHECK10-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_IV]], align 4 16023 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 16024 // CHECK10: omp.inner.for.end: 16025 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 16026 // CHECK10: omp.loop.exit: 16027 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16028 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 16029 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 16030 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16031 // CHECK10: omp.precond.end: 16032 // CHECK10-NEXT: ret void 16033 // 16034 // 16035 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75 16036 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 16037 // CHECK10-NEXT: entry: 16038 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 16039 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 16040 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 16041 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 16042 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 16043 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 16044 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 16045 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 16046 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 16047 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 16048 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 16049 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 16050 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..42 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 16051 // CHECK10-NEXT: ret void 16052 // 16053 // 16054 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..42 16055 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 16056 // CHECK10-NEXT: entry: 16057 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16058 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16059 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 16060 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16061 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16062 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16063 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16064 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 16065 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16066 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16067 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16068 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 16069 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16070 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 16071 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 16072 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16073 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16074 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 16075 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 16076 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16077 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16078 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 16079 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16080 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16081 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16082 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16083 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 16084 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16085 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16086 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16087 // CHECK10-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16088 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 16089 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 16090 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 16091 // CHECK10-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16092 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16093 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 16094 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16095 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 16096 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 16097 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16098 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16099 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 16100 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16101 // CHECK10: omp.precond.then: 16102 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 16103 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16104 // CHECK10-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 16105 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16106 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16107 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16108 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 16109 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 16110 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16111 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16112 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 16113 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 16114 // CHECK10: cond.true: 16115 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16116 // CHECK10-NEXT: br label [[COND_END:%.*]] 16117 // CHECK10: cond.false: 16118 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16119 // CHECK10-NEXT: br label [[COND_END]] 16120 // CHECK10: cond.end: 16121 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 16122 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 16123 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16124 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 16125 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16126 // CHECK10: omp.inner.for.cond: 16127 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16128 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16129 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 16130 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16131 // CHECK10: omp.inner.for.body: 16132 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16133 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 16134 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16135 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 16136 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16137 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 16138 // CHECK10-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 16139 // CHECK10-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 16140 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**, i64)* @.omp_outlined..43 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i64 [[TMP24]]) 16141 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16142 // CHECK10: omp.inner.for.inc: 16143 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16144 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 16145 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 16146 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 16147 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 16148 // CHECK10: omp.inner.for.end: 16149 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 16150 // CHECK10: omp.loop.exit: 16151 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16152 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 16153 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 16154 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16155 // CHECK10: omp.precond.end: 16156 // CHECK10-NEXT: ret void 16157 // 16158 // 16159 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..43 16160 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 16161 // CHECK10-NEXT: entry: 16162 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16163 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16164 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 16165 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 16166 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16167 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16168 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16169 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16170 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 16171 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16172 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16173 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16174 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 16175 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16176 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 16177 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 16178 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16179 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16180 // CHECK10-NEXT: [[I6:%.*]] = alloca i32, align 4 16181 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16182 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16183 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16184 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16185 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16186 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16187 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16188 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16189 // CHECK10-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 16190 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16191 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16192 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16193 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16194 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 16195 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 16196 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16197 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16198 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 16199 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16200 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 16201 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 16202 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16203 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16204 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 16205 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16206 // CHECK10: omp.precond.then: 16207 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 16208 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16209 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 16210 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16211 // CHECK10-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 16212 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16213 // CHECK10-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 16214 // CHECK10-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 16215 // CHECK10-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 16216 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16217 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16218 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 16219 // CHECK10-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16220 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 16221 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 16222 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 16223 // CHECK10: omp.dispatch.cond: 16224 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16225 // CHECK10-NEXT: [[CONV7:%.*]] = sext i32 [[TMP13]] to i64 16226 // CHECK10-NEXT: [[TMP14:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16227 // CHECK10-NEXT: [[CMP8:%.*]] = icmp ugt i64 [[CONV7]], [[TMP14]] 16228 // CHECK10-NEXT: br i1 [[CMP8]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 16229 // CHECK10: cond.true: 16230 // CHECK10-NEXT: [[TMP15:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16231 // CHECK10-NEXT: br label [[COND_END:%.*]] 16232 // CHECK10: cond.false: 16233 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16234 // CHECK10-NEXT: [[CONV9:%.*]] = sext i32 [[TMP16]] to i64 16235 // CHECK10-NEXT: br label [[COND_END]] 16236 // CHECK10: cond.end: 16237 // CHECK10-NEXT: [[COND:%.*]] = phi i64 [ [[TMP15]], [[COND_TRUE]] ], [ [[CONV9]], [[COND_FALSE]] ] 16238 // CHECK10-NEXT: [[CONV10:%.*]] = trunc i64 [[COND]] to i32 16239 // CHECK10-NEXT: store i32 [[CONV10]], i32* [[DOTOMP_UB]], align 4 16240 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16241 // CHECK10-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 16242 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16243 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16244 // CHECK10-NEXT: [[CMP11:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 16245 // CHECK10-NEXT: br i1 [[CMP11]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 16246 // CHECK10: omp.dispatch.body: 16247 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16248 // CHECK10: omp.inner.for.cond: 16249 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16250 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16251 // CHECK10-NEXT: [[CMP12:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 16252 // CHECK10-NEXT: br i1 [[CMP12]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16253 // CHECK10: omp.inner.for.body: 16254 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16255 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 16256 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 16257 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I6]], align 4 16258 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP2]], align 8 16259 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[I6]], align 4 16260 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP24]] to i64 16261 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i64 [[IDXPROM]] 16262 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 16263 // CHECK10-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP3]], align 8 16264 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[I6]], align 4 16265 // CHECK10-NEXT: [[IDXPROM13:%.*]] = sext i32 [[TMP27]] to i64 16266 // CHECK10-NEXT: [[ARRAYIDX14:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i64 [[IDXPROM13]] 16267 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[ARRAYIDX14]], align 4 16268 // CHECK10-NEXT: [[ADD15:%.*]] = add nsw i32 [[TMP25]], [[TMP28]] 16269 // CHECK10-NEXT: [[TMP29:%.*]] = load i32*, i32** [[TMP1]], align 8 16270 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[I6]], align 4 16271 // CHECK10-NEXT: [[IDXPROM16:%.*]] = sext i32 [[TMP30]] to i64 16272 // CHECK10-NEXT: [[ARRAYIDX17:%.*]] = getelementptr inbounds i32, i32* [[TMP29]], i64 [[IDXPROM16]] 16273 // CHECK10-NEXT: store i32 [[ADD15]], i32* [[ARRAYIDX17]], align 4 16274 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 16275 // CHECK10: omp.body.continue: 16276 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16277 // CHECK10: omp.inner.for.inc: 16278 // CHECK10-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16279 // CHECK10-NEXT: [[ADD18:%.*]] = add nsw i32 [[TMP31]], 1 16280 // CHECK10-NEXT: store i32 [[ADD18]], i32* [[DOTOMP_IV]], align 4 16281 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 16282 // CHECK10: omp.inner.for.end: 16283 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 16284 // CHECK10: omp.dispatch.inc: 16285 // CHECK10-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16286 // CHECK10-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 16287 // CHECK10-NEXT: [[ADD19:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 16288 // CHECK10-NEXT: store i32 [[ADD19]], i32* [[DOTOMP_LB]], align 4 16289 // CHECK10-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16290 // CHECK10-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 16291 // CHECK10-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 16292 // CHECK10-NEXT: store i32 [[ADD20]], i32* [[DOTOMP_UB]], align 4 16293 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 16294 // CHECK10: omp.dispatch.end: 16295 // CHECK10-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16296 // CHECK10-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 16297 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 16298 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16299 // CHECK10: omp.precond.end: 16300 // CHECK10-NEXT: ret void 16301 // 16302 // 16303 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83 16304 // CHECK10-SAME: (i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 16305 // CHECK10-NEXT: entry: 16306 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 16307 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 16308 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 16309 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 16310 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 16311 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 16312 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 16313 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 16314 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[N_ADDR]] to i32* 16315 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..46 to void (i32*, i32*, ...)*), i32* [[CONV]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 16316 // CHECK10-NEXT: ret void 16317 // 16318 // 16319 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..46 16320 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 16321 // CHECK10-NEXT: entry: 16322 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16323 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16324 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16325 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16326 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16327 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16328 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16329 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16330 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 16331 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16332 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16333 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 16334 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 16335 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16336 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16337 // CHECK10-NEXT: [[I3:%.*]] = alloca i32, align 4 16338 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16339 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16340 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16341 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16342 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16343 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16344 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16345 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16346 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16347 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16348 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 16349 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 16350 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16351 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 16352 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16353 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 16354 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16355 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16356 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16357 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 16358 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16359 // CHECK10: omp.precond.then: 16360 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 16361 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16362 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 16363 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16364 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16365 // CHECK10-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16366 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 16367 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 16368 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16369 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16370 // CHECK10-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 16371 // CHECK10-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 16372 // CHECK10: cond.true: 16373 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16374 // CHECK10-NEXT: br label [[COND_END:%.*]] 16375 // CHECK10: cond.false: 16376 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16377 // CHECK10-NEXT: br label [[COND_END]] 16378 // CHECK10: cond.end: 16379 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 16380 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 16381 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16382 // CHECK10-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 16383 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16384 // CHECK10: omp.inner.for.cond: 16385 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16386 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16387 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 16388 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16389 // CHECK10: omp.inner.for.body: 16390 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16391 // CHECK10-NEXT: [[TMP18:%.*]] = zext i32 [[TMP17]] to i64 16392 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16393 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 16394 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**)* @.omp_outlined..47 to void (i32*, i32*, ...)*), i64 [[TMP18]], i64 [[TMP20]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 16395 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16396 // CHECK10: omp.inner.for.inc: 16397 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16398 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 16399 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 16400 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 16401 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 16402 // CHECK10: omp.inner.for.end: 16403 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 16404 // CHECK10: omp.loop.exit: 16405 // CHECK10-NEXT: [[TMP23:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16406 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[TMP23]], align 4 16407 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP24]]) 16408 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16409 // CHECK10: omp.precond.end: 16410 // CHECK10-NEXT: ret void 16411 // 16412 // 16413 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..47 16414 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 16415 // CHECK10-NEXT: entry: 16416 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16417 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16418 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 16419 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 16420 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16421 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16422 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16423 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16424 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16425 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16426 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 16427 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16428 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16429 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 16430 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 16431 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16432 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16433 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 16434 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16435 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16436 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16437 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16438 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16439 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16440 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16441 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16442 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16443 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16444 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16445 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16446 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 16447 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 16448 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16449 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 16450 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16451 // CHECK10-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 16452 // CHECK10-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16453 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16454 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16455 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 16456 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16457 // CHECK10: omp.precond.then: 16458 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 16459 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16460 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 16461 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16462 // CHECK10-NEXT: [[CONV:%.*]] = trunc i64 [[TMP8]] to i32 16463 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16464 // CHECK10-NEXT: [[CONV3:%.*]] = trunc i64 [[TMP9]] to i32 16465 // CHECK10-NEXT: store i32 [[CONV]], i32* [[DOTOMP_LB]], align 4 16466 // CHECK10-NEXT: store i32 [[CONV3]], i32* [[DOTOMP_UB]], align 4 16467 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16468 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16469 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16470 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16471 // CHECK10-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16472 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 16473 // CHECK10-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 16474 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 16475 // CHECK10: omp.dispatch.cond: 16476 // CHECK10-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16477 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 16478 // CHECK10-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 16479 // CHECK10-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 16480 // CHECK10-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 16481 // CHECK10: omp.dispatch.body: 16482 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16483 // CHECK10-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 16484 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16485 // CHECK10: omp.inner.for.cond: 16486 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 16487 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !24 16488 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 16489 // CHECK10-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16490 // CHECK10: omp.inner.for.body: 16491 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 16492 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 16493 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 16494 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !24 16495 // CHECK10-NEXT: [[TMP21:%.*]] = load i32*, i32** [[TMP2]], align 8, !llvm.access.group !24 16496 // CHECK10-NEXT: [[TMP22:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 16497 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP22]] to i64 16498 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP21]], i64 [[IDXPROM]] 16499 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !24 16500 // CHECK10-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP3]], align 8, !llvm.access.group !24 16501 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 16502 // CHECK10-NEXT: [[IDXPROM6:%.*]] = sext i32 [[TMP25]] to i64 16503 // CHECK10-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM6]] 16504 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX7]], align 4, !llvm.access.group !24 16505 // CHECK10-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP23]], [[TMP26]] 16506 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP1]], align 8, !llvm.access.group !24 16507 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !24 16508 // CHECK10-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP28]] to i64 16509 // CHECK10-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM9]] 16510 // CHECK10-NEXT: store i32 [[ADD8]], i32* [[ARRAYIDX10]], align 4, !llvm.access.group !24 16511 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 16512 // CHECK10: omp.body.continue: 16513 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16514 // CHECK10: omp.inner.for.inc: 16515 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 16516 // CHECK10-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP29]], 1 16517 // CHECK10-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !24 16518 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP25:![0-9]+]] 16519 // CHECK10: omp.inner.for.end: 16520 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 16521 // CHECK10: omp.dispatch.inc: 16522 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 16523 // CHECK10: omp.dispatch.end: 16524 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16525 // CHECK10: omp.precond.end: 16526 // CHECK10-NEXT: ret void 16527 // 16528 // 16529 // CHECK10-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91 16530 // CHECK10-SAME: (i64 [[CH:%.*]], i64 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 16531 // CHECK10-NEXT: entry: 16532 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i64, align 8 16533 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i64, align 8 16534 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 8 16535 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 8 16536 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 8 16537 // CHECK10-NEXT: store i64 [[CH]], i64* [[CH_ADDR]], align 8 16538 // CHECK10-NEXT: store i64 [[N]], i64* [[N_ADDR]], align 8 16539 // CHECK10-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 8 16540 // CHECK10-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 8 16541 // CHECK10-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 8 16542 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[CH_ADDR]] to i32* 16543 // CHECK10-NEXT: [[CONV1:%.*]] = bitcast i64* [[N_ADDR]] to i32* 16544 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..50 to void (i32*, i32*, ...)*), i32* [[CONV]], i32* [[CONV1]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 16545 // CHECK10-NEXT: ret void 16546 // 16547 // 16548 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..50 16549 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]]) #[[ATTR1]] { 16550 // CHECK10-NEXT: entry: 16551 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16552 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16553 // CHECK10-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 8 16554 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16555 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16556 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16557 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16558 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 16559 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16560 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16561 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16562 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 16563 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16564 // CHECK10-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 16565 // CHECK10-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 16566 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16567 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16568 // CHECK10-NEXT: [[I4:%.*]] = alloca i32, align 4 16569 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i64, align 8 16570 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16571 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16572 // CHECK10-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 8 16573 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16574 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16575 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16576 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16577 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 8 16578 // CHECK10-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16579 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16580 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16581 // CHECK10-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16582 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 16583 // CHECK10-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 16584 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 16585 // CHECK10-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16586 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16587 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 16588 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16589 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 16590 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 16591 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16592 // CHECK10-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16593 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 16594 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16595 // CHECK10: omp.precond.then: 16596 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 16597 // CHECK10-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16598 // CHECK10-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 16599 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16600 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16601 // CHECK10-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16602 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 16603 // CHECK10-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 16604 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16605 // CHECK10-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16606 // CHECK10-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 16607 // CHECK10-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 16608 // CHECK10: cond.true: 16609 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16610 // CHECK10-NEXT: br label [[COND_END:%.*]] 16611 // CHECK10: cond.false: 16612 // CHECK10-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16613 // CHECK10-NEXT: br label [[COND_END]] 16614 // CHECK10: cond.end: 16615 // CHECK10-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 16616 // CHECK10-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 16617 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16618 // CHECK10-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 16619 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16620 // CHECK10: omp.inner.for.cond: 16621 // CHECK10-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16622 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16623 // CHECK10-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 16624 // CHECK10-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16625 // CHECK10: omp.inner.for.body: 16626 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 16627 // CHECK10-NEXT: [[TMP20:%.*]] = zext i32 [[TMP19]] to i64 16628 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 16629 // CHECK10-NEXT: [[TMP22:%.*]] = zext i32 [[TMP21]] to i64 16630 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16631 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__CASTED]] to i32* 16632 // CHECK10-NEXT: store i32 [[TMP23]], i32* [[CONV]], align 4 16633 // CHECK10-NEXT: [[TMP24:%.*]] = load i64, i64* [[DOTCAPTURE_EXPR__CASTED]], align 8 16634 // CHECK10-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64, i64, i32*, i32**, i32**, i32**, i64)* @.omp_outlined..51 to void (i32*, i32*, ...)*), i64 [[TMP20]], i64 [[TMP22]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i64 [[TMP24]]) 16635 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16636 // CHECK10: omp.inner.for.inc: 16637 // CHECK10-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 16638 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 16639 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 16640 // CHECK10-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 16641 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]] 16642 // CHECK10: omp.inner.for.end: 16643 // CHECK10-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 16644 // CHECK10: omp.loop.exit: 16645 // CHECK10-NEXT: [[TMP27:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16646 // CHECK10-NEXT: [[TMP28:%.*]] = load i32, i32* [[TMP27]], align 4 16647 // CHECK10-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP28]]) 16648 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16649 // CHECK10: omp.precond.end: 16650 // CHECK10-NEXT: ret void 16651 // 16652 // 16653 // CHECK10-LABEL: define {{[^@]+}}@.omp_outlined..51 16654 // CHECK10-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i64 [[DOTPREVIOUS_LB_:%.*]], i64 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 8 dereferenceable(8) [[A:%.*]], i32** nonnull align 8 dereferenceable(8) [[B:%.*]], i32** nonnull align 8 dereferenceable(8) [[C:%.*]], i64 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 16655 // CHECK10-NEXT: entry: 16656 // CHECK10-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 8 16657 // CHECK10-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 8 16658 // CHECK10-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i64, align 8 16659 // CHECK10-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i64, align 8 16660 // CHECK10-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 8 16661 // CHECK10-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 8 16662 // CHECK10-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 8 16663 // CHECK10-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 8 16664 // CHECK10-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i64, align 8 16665 // CHECK10-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 16666 // CHECK10-NEXT: [[TMP:%.*]] = alloca i32, align 4 16667 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16668 // CHECK10-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 16669 // CHECK10-NEXT: [[I:%.*]] = alloca i32, align 4 16670 // CHECK10-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 16671 // CHECK10-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 16672 // CHECK10-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 16673 // CHECK10-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 16674 // CHECK10-NEXT: [[I6:%.*]] = alloca i32, align 4 16675 // CHECK10-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 8 16676 // CHECK10-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 8 16677 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_LB_]], i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16678 // CHECK10-NEXT: store i64 [[DOTPREVIOUS_UB_]], i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16679 // CHECK10-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 8 16680 // CHECK10-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 8 16681 // CHECK10-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 8 16682 // CHECK10-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 8 16683 // CHECK10-NEXT: store i64 [[DOTCAPTURE_EXPR_]], i64* [[DOTCAPTURE_EXPR__ADDR]], align 8 16684 // CHECK10-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 8 16685 // CHECK10-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 8 16686 // CHECK10-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 8 16687 // CHECK10-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 8 16688 // CHECK10-NEXT: [[CONV:%.*]] = bitcast i64* [[DOTCAPTURE_EXPR__ADDR]] to i32* 16689 // CHECK10-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 16690 // CHECK10-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16691 // CHECK10-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16692 // CHECK10-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 16693 // CHECK10-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16694 // CHECK10-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 16695 // CHECK10-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 16696 // CHECK10-NEXT: store i32 0, i32* [[I]], align 4 16697 // CHECK10-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16698 // CHECK10-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 16699 // CHECK10-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 16700 // CHECK10: omp.precond.then: 16701 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 16702 // CHECK10-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 16703 // CHECK10-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 16704 // CHECK10-NEXT: [[TMP8:%.*]] = load i64, i64* [[DOTPREVIOUS_LB__ADDR]], align 8 16705 // CHECK10-NEXT: [[CONV4:%.*]] = trunc i64 [[TMP8]] to i32 16706 // CHECK10-NEXT: [[TMP9:%.*]] = load i64, i64* [[DOTPREVIOUS_UB__ADDR]], align 8 16707 // CHECK10-NEXT: [[CONV5:%.*]] = trunc i64 [[TMP9]] to i32 16708 // CHECK10-NEXT: store i32 [[CONV4]], i32* [[DOTOMP_LB]], align 4 16709 // CHECK10-NEXT: store i32 [[CONV5]], i32* [[DOTOMP_UB]], align 4 16710 // CHECK10-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 16711 // CHECK10-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 16712 // CHECK10-NEXT: [[TMP10:%.*]] = load i32, i32* [[CONV]], align 8 16713 // CHECK10-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16714 // CHECK10-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 16715 // CHECK10-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16716 // CHECK10-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 16717 // CHECK10-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 16718 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 16719 // CHECK10: omp.dispatch.cond: 16720 // CHECK10-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 8 16721 // CHECK10-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 16722 // CHECK10-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 16723 // CHECK10-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 16724 // CHECK10-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 16725 // CHECK10: omp.dispatch.body: 16726 // CHECK10-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 16727 // CHECK10-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 16728 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 16729 // CHECK10: omp.inner.for.cond: 16730 // CHECK10-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 16731 // CHECK10-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !27 16732 // CHECK10-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 16733 // CHECK10-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 16734 // CHECK10: omp.inner.for.body: 16735 // CHECK10-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 16736 // CHECK10-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 16737 // CHECK10-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 16738 // CHECK10-NEXT: store i32 [[ADD]], i32* [[I6]], align 4, !llvm.access.group !27 16739 // CHECK10-NEXT: [[TMP22:%.*]] = load i32*, i32** [[TMP2]], align 8, !llvm.access.group !27 16740 // CHECK10-NEXT: [[TMP23:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 16741 // CHECK10-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP23]] to i64 16742 // CHECK10-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP22]], i64 [[IDXPROM]] 16743 // CHECK10-NEXT: [[TMP24:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !27 16744 // CHECK10-NEXT: [[TMP25:%.*]] = load i32*, i32** [[TMP3]], align 8, !llvm.access.group !27 16745 // CHECK10-NEXT: [[TMP26:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 16746 // CHECK10-NEXT: [[IDXPROM8:%.*]] = sext i32 [[TMP26]] to i64 16747 // CHECK10-NEXT: [[ARRAYIDX9:%.*]] = getelementptr inbounds i32, i32* [[TMP25]], i64 [[IDXPROM8]] 16748 // CHECK10-NEXT: [[TMP27:%.*]] = load i32, i32* [[ARRAYIDX9]], align 4, !llvm.access.group !27 16749 // CHECK10-NEXT: [[ADD10:%.*]] = add nsw i32 [[TMP24]], [[TMP27]] 16750 // CHECK10-NEXT: [[TMP28:%.*]] = load i32*, i32** [[TMP1]], align 8, !llvm.access.group !27 16751 // CHECK10-NEXT: [[TMP29:%.*]] = load i32, i32* [[I6]], align 4, !llvm.access.group !27 16752 // CHECK10-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP29]] to i64 16753 // CHECK10-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds i32, i32* [[TMP28]], i64 [[IDXPROM11]] 16754 // CHECK10-NEXT: store i32 [[ADD10]], i32* [[ARRAYIDX12]], align 4, !llvm.access.group !27 16755 // CHECK10-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 16756 // CHECK10: omp.body.continue: 16757 // CHECK10-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 16758 // CHECK10: omp.inner.for.inc: 16759 // CHECK10-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 16760 // CHECK10-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP30]], 1 16761 // CHECK10-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !27 16762 // CHECK10-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP28:![0-9]+]] 16763 // CHECK10: omp.inner.for.end: 16764 // CHECK10-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 16765 // CHECK10: omp.dispatch.inc: 16766 // CHECK10-NEXT: br label [[OMP_DISPATCH_COND]] 16767 // CHECK10: omp.dispatch.end: 16768 // CHECK10-NEXT: br label [[OMP_PRECOND_END]] 16769 // CHECK10: omp.precond.end: 16770 // CHECK10-NEXT: ret void 16771 // 16772 // 16773 // CHECK10-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 16774 // CHECK10-SAME: () #[[ATTR4:[0-9]+]] { 16775 // CHECK10-NEXT: entry: 16776 // CHECK10-NEXT: call void @__tgt_register_requires(i64 1) 16777 // CHECK10-NEXT: ret void 16778 // 16779 // 16780 // CHECK11-LABEL: define {{[^@]+}}@main 16781 // CHECK11-SAME: () #[[ATTR0:[0-9]+]] { 16782 // CHECK11-NEXT: entry: 16783 // CHECK11-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 16784 // CHECK11-NEXT: [[A:%.*]] = alloca double*, align 4 16785 // CHECK11-NEXT: [[B:%.*]] = alloca double*, align 4 16786 // CHECK11-NEXT: [[C:%.*]] = alloca double*, align 4 16787 // CHECK11-NEXT: [[N:%.*]] = alloca i32, align 4 16788 // CHECK11-NEXT: [[CH:%.*]] = alloca i32, align 4 16789 // CHECK11-NEXT: [[N_CASTED:%.*]] = alloca i32, align 4 16790 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 4 16791 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 4 16792 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 4 16793 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 16794 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 16795 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 16796 // CHECK11-NEXT: [[N_CASTED3:%.*]] = alloca i32, align 4 16797 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS4:%.*]] = alloca [4 x i8*], align 4 16798 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS5:%.*]] = alloca [4 x i8*], align 4 16799 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS6:%.*]] = alloca [4 x i8*], align 4 16800 // CHECK11-NEXT: [[_TMP7:%.*]] = alloca i32, align 4 16801 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_8:%.*]] = alloca i32, align 4 16802 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 16803 // CHECK11-NEXT: [[CH_CASTED:%.*]] = alloca i32, align 4 16804 // CHECK11-NEXT: [[N_CASTED16:%.*]] = alloca i32, align 4 16805 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS17:%.*]] = alloca [5 x i8*], align 4 16806 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS18:%.*]] = alloca [5 x i8*], align 4 16807 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS19:%.*]] = alloca [5 x i8*], align 4 16808 // CHECK11-NEXT: [[_TMP20:%.*]] = alloca i32, align 4 16809 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_21:%.*]] = alloca i32, align 4 16810 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_22:%.*]] = alloca i32, align 4 16811 // CHECK11-NEXT: [[N_CASTED29:%.*]] = alloca i32, align 4 16812 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS30:%.*]] = alloca [4 x i8*], align 4 16813 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS31:%.*]] = alloca [4 x i8*], align 4 16814 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS32:%.*]] = alloca [4 x i8*], align 4 16815 // CHECK11-NEXT: [[_TMP33:%.*]] = alloca i32, align 4 16816 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_34:%.*]] = alloca i32, align 4 16817 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_35:%.*]] = alloca i32, align 4 16818 // CHECK11-NEXT: [[CH_CASTED42:%.*]] = alloca i32, align 4 16819 // CHECK11-NEXT: [[N_CASTED43:%.*]] = alloca i32, align 4 16820 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS44:%.*]] = alloca [5 x i8*], align 4 16821 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS45:%.*]] = alloca [5 x i8*], align 4 16822 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS46:%.*]] = alloca [5 x i8*], align 4 16823 // CHECK11-NEXT: [[_TMP47:%.*]] = alloca i32, align 4 16824 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_48:%.*]] = alloca i32, align 4 16825 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_49:%.*]] = alloca i32, align 4 16826 // CHECK11-NEXT: [[N_CASTED56:%.*]] = alloca i32, align 4 16827 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS57:%.*]] = alloca [4 x i8*], align 4 16828 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS58:%.*]] = alloca [4 x i8*], align 4 16829 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS59:%.*]] = alloca [4 x i8*], align 4 16830 // CHECK11-NEXT: [[_TMP60:%.*]] = alloca i32, align 4 16831 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_61:%.*]] = alloca i32, align 4 16832 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_62:%.*]] = alloca i32, align 4 16833 // CHECK11-NEXT: [[CH_CASTED69:%.*]] = alloca i32, align 4 16834 // CHECK11-NEXT: [[N_CASTED70:%.*]] = alloca i32, align 4 16835 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS71:%.*]] = alloca [5 x i8*], align 4 16836 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS72:%.*]] = alloca [5 x i8*], align 4 16837 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS73:%.*]] = alloca [5 x i8*], align 4 16838 // CHECK11-NEXT: [[_TMP74:%.*]] = alloca i32, align 4 16839 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 16840 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_76:%.*]] = alloca i32, align 4 16841 // CHECK11-NEXT: store i32 0, i32* [[RETVAL]], align 4 16842 // CHECK11-NEXT: store i32 10000, i32* [[N]], align 4 16843 // CHECK11-NEXT: store i32 100, i32* [[CH]], align 4 16844 // CHECK11-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 16845 // CHECK11-NEXT: store i32 [[TMP0]], i32* [[N_CASTED]], align 4 16846 // CHECK11-NEXT: [[TMP1:%.*]] = load i32, i32* [[N_CASTED]], align 4 16847 // CHECK11-NEXT: [[TMP2:%.*]] = load double*, double** [[A]], align 4 16848 // CHECK11-NEXT: [[TMP3:%.*]] = load double*, double** [[B]], align 4 16849 // CHECK11-NEXT: [[TMP4:%.*]] = load double*, double** [[C]], align 4 16850 // CHECK11-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 16851 // CHECK11-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i32* 16852 // CHECK11-NEXT: store i32 [[TMP1]], i32* [[TMP6]], align 4 16853 // CHECK11-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 16854 // CHECK11-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i32* 16855 // CHECK11-NEXT: store i32 [[TMP1]], i32* [[TMP8]], align 4 16856 // CHECK11-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 0 16857 // CHECK11-NEXT: store i8* null, i8** [[TMP9]], align 4 16858 // CHECK11-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 16859 // CHECK11-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to double** 16860 // CHECK11-NEXT: store double* [[TMP2]], double** [[TMP11]], align 4 16861 // CHECK11-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 16862 // CHECK11-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to double** 16863 // CHECK11-NEXT: store double* [[TMP2]], double** [[TMP13]], align 4 16864 // CHECK11-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 1 16865 // CHECK11-NEXT: store i8* null, i8** [[TMP14]], align 4 16866 // CHECK11-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 16867 // CHECK11-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to double** 16868 // CHECK11-NEXT: store double* [[TMP3]], double** [[TMP16]], align 4 16869 // CHECK11-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 16870 // CHECK11-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to double** 16871 // CHECK11-NEXT: store double* [[TMP3]], double** [[TMP18]], align 4 16872 // CHECK11-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 2 16873 // CHECK11-NEXT: store i8* null, i8** [[TMP19]], align 4 16874 // CHECK11-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 16875 // CHECK11-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to double** 16876 // CHECK11-NEXT: store double* [[TMP4]], double** [[TMP21]], align 4 16877 // CHECK11-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 16878 // CHECK11-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to double** 16879 // CHECK11-NEXT: store double* [[TMP4]], double** [[TMP23]], align 4 16880 // CHECK11-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 3 16881 // CHECK11-NEXT: store i8* null, i8** [[TMP24]], align 4 16882 // CHECK11-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 16883 // CHECK11-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 16884 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 16885 // CHECK11-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 16886 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 16887 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 16888 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 16889 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 16890 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 16891 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 16892 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 16893 // CHECK11-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 16894 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3:[0-9]+]], i64 -1, i64 [[TMP30]]) 16895 // CHECK11-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 16896 // CHECK11-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 16897 // CHECK11-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 16898 // CHECK11: omp_offload.failed: 16899 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369(i32 [[TMP1]], double* [[TMP2]], double* [[TMP3]], double* [[TMP4]]) #[[ATTR2:[0-9]+]] 16900 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT]] 16901 // CHECK11: omp_offload.cont: 16902 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 16903 // CHECK11-NEXT: store i32 [[TMP33]], i32* [[N_CASTED3]], align 4 16904 // CHECK11-NEXT: [[TMP34:%.*]] = load i32, i32* [[N_CASTED3]], align 4 16905 // CHECK11-NEXT: [[TMP35:%.*]] = load double*, double** [[A]], align 4 16906 // CHECK11-NEXT: [[TMP36:%.*]] = load double*, double** [[B]], align 4 16907 // CHECK11-NEXT: [[TMP37:%.*]] = load double*, double** [[C]], align 4 16908 // CHECK11-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 16909 // CHECK11-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i32* 16910 // CHECK11-NEXT: store i32 [[TMP34]], i32* [[TMP39]], align 4 16911 // CHECK11-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 16912 // CHECK11-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i32* 16913 // CHECK11-NEXT: store i32 [[TMP34]], i32* [[TMP41]], align 4 16914 // CHECK11-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 0 16915 // CHECK11-NEXT: store i8* null, i8** [[TMP42]], align 4 16916 // CHECK11-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 1 16917 // CHECK11-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to double** 16918 // CHECK11-NEXT: store double* [[TMP35]], double** [[TMP44]], align 4 16919 // CHECK11-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 1 16920 // CHECK11-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to double** 16921 // CHECK11-NEXT: store double* [[TMP35]], double** [[TMP46]], align 4 16922 // CHECK11-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 1 16923 // CHECK11-NEXT: store i8* null, i8** [[TMP47]], align 4 16924 // CHECK11-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 2 16925 // CHECK11-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to double** 16926 // CHECK11-NEXT: store double* [[TMP36]], double** [[TMP49]], align 4 16927 // CHECK11-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 2 16928 // CHECK11-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to double** 16929 // CHECK11-NEXT: store double* [[TMP36]], double** [[TMP51]], align 4 16930 // CHECK11-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 2 16931 // CHECK11-NEXT: store i8* null, i8** [[TMP52]], align 4 16932 // CHECK11-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 3 16933 // CHECK11-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to double** 16934 // CHECK11-NEXT: store double* [[TMP37]], double** [[TMP54]], align 4 16935 // CHECK11-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 3 16936 // CHECK11-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to double** 16937 // CHECK11-NEXT: store double* [[TMP37]], double** [[TMP56]], align 4 16938 // CHECK11-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 3 16939 // CHECK11-NEXT: store i8* null, i8** [[TMP57]], align 4 16940 // CHECK11-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 16941 // CHECK11-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 16942 // CHECK11-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 16943 // CHECK11-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_8]], align 4 16944 // CHECK11-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_8]], align 4 16945 // CHECK11-NEXT: [[SUB10:%.*]] = sub nsw i32 [[TMP61]], 0 16946 // CHECK11-NEXT: [[DIV11:%.*]] = sdiv i32 [[SUB10]], 1 16947 // CHECK11-NEXT: [[SUB12:%.*]] = sub nsw i32 [[DIV11]], 1 16948 // CHECK11-NEXT: store i32 [[SUB12]], i32* [[DOTCAPTURE_EXPR_9]], align 4 16949 // CHECK11-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 16950 // CHECK11-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP62]], 1 16951 // CHECK11-NEXT: [[TMP63:%.*]] = zext i32 [[ADD13]] to i64 16952 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 16953 // CHECK11-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.4, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.5, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 16954 // CHECK11-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 16955 // CHECK11-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED14:%.*]], label [[OMP_OFFLOAD_CONT15:%.*]] 16956 // CHECK11: omp_offload.failed14: 16957 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408(i32 [[TMP34]], double* [[TMP35]], double* [[TMP36]], double* [[TMP37]]) #[[ATTR2]] 16958 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT15]] 16959 // CHECK11: omp_offload.cont15: 16960 // CHECK11-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 16961 // CHECK11-NEXT: store i32 [[TMP66]], i32* [[CH_CASTED]], align 4 16962 // CHECK11-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH_CASTED]], align 4 16963 // CHECK11-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 16964 // CHECK11-NEXT: store i32 [[TMP68]], i32* [[N_CASTED16]], align 4 16965 // CHECK11-NEXT: [[TMP69:%.*]] = load i32, i32* [[N_CASTED16]], align 4 16966 // CHECK11-NEXT: [[TMP70:%.*]] = load double*, double** [[A]], align 4 16967 // CHECK11-NEXT: [[TMP71:%.*]] = load double*, double** [[B]], align 4 16968 // CHECK11-NEXT: [[TMP72:%.*]] = load double*, double** [[C]], align 4 16969 // CHECK11-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 16970 // CHECK11-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i32* 16971 // CHECK11-NEXT: store i32 [[TMP67]], i32* [[TMP74]], align 4 16972 // CHECK11-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 16973 // CHECK11-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i32* 16974 // CHECK11-NEXT: store i32 [[TMP67]], i32* [[TMP76]], align 4 16975 // CHECK11-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 0 16976 // CHECK11-NEXT: store i8* null, i8** [[TMP77]], align 4 16977 // CHECK11-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 1 16978 // CHECK11-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i32* 16979 // CHECK11-NEXT: store i32 [[TMP69]], i32* [[TMP79]], align 4 16980 // CHECK11-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 1 16981 // CHECK11-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i32* 16982 // CHECK11-NEXT: store i32 [[TMP69]], i32* [[TMP81]], align 4 16983 // CHECK11-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 1 16984 // CHECK11-NEXT: store i8* null, i8** [[TMP82]], align 4 16985 // CHECK11-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 2 16986 // CHECK11-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to double** 16987 // CHECK11-NEXT: store double* [[TMP70]], double** [[TMP84]], align 4 16988 // CHECK11-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 2 16989 // CHECK11-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to double** 16990 // CHECK11-NEXT: store double* [[TMP70]], double** [[TMP86]], align 4 16991 // CHECK11-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 2 16992 // CHECK11-NEXT: store i8* null, i8** [[TMP87]], align 4 16993 // CHECK11-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 3 16994 // CHECK11-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to double** 16995 // CHECK11-NEXT: store double* [[TMP71]], double** [[TMP89]], align 4 16996 // CHECK11-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 3 16997 // CHECK11-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to double** 16998 // CHECK11-NEXT: store double* [[TMP71]], double** [[TMP91]], align 4 16999 // CHECK11-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 3 17000 // CHECK11-NEXT: store i8* null, i8** [[TMP92]], align 4 17001 // CHECK11-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 4 17002 // CHECK11-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to double** 17003 // CHECK11-NEXT: store double* [[TMP72]], double** [[TMP94]], align 4 17004 // CHECK11-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 4 17005 // CHECK11-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to double** 17006 // CHECK11-NEXT: store double* [[TMP72]], double** [[TMP96]], align 4 17007 // CHECK11-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 4 17008 // CHECK11-NEXT: store i8* null, i8** [[TMP97]], align 4 17009 // CHECK11-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 17010 // CHECK11-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 17011 // CHECK11-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 17012 // CHECK11-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_21]], align 4 17013 // CHECK11-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_21]], align 4 17014 // CHECK11-NEXT: [[SUB23:%.*]] = sub nsw i32 [[TMP101]], 0 17015 // CHECK11-NEXT: [[DIV24:%.*]] = sdiv i32 [[SUB23]], 1 17016 // CHECK11-NEXT: [[SUB25:%.*]] = sub nsw i32 [[DIV24]], 1 17017 // CHECK11-NEXT: store i32 [[SUB25]], i32* [[DOTCAPTURE_EXPR_22]], align 4 17018 // CHECK11-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_22]], align 4 17019 // CHECK11-NEXT: [[ADD26:%.*]] = add nsw i32 [[TMP102]], 1 17020 // CHECK11-NEXT: [[TMP103:%.*]] = zext i32 [[ADD26]] to i64 17021 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 17022 // CHECK11-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.8, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.9, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 17023 // CHECK11-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 17024 // CHECK11-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED27:%.*]], label [[OMP_OFFLOAD_CONT28:%.*]] 17025 // CHECK11: omp_offload.failed27: 17026 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447(i32 [[TMP67]], i32 [[TMP69]], double* [[TMP70]], double* [[TMP71]], double* [[TMP72]]) #[[ATTR2]] 17027 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT28]] 17028 // CHECK11: omp_offload.cont28: 17029 // CHECK11-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 17030 // CHECK11-NEXT: store i32 [[TMP106]], i32* [[N_CASTED29]], align 4 17031 // CHECK11-NEXT: [[TMP107:%.*]] = load i32, i32* [[N_CASTED29]], align 4 17032 // CHECK11-NEXT: [[TMP108:%.*]] = load double*, double** [[A]], align 4 17033 // CHECK11-NEXT: [[TMP109:%.*]] = load double*, double** [[B]], align 4 17034 // CHECK11-NEXT: [[TMP110:%.*]] = load double*, double** [[C]], align 4 17035 // CHECK11-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 17036 // CHECK11-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i32* 17037 // CHECK11-NEXT: store i32 [[TMP107]], i32* [[TMP112]], align 4 17038 // CHECK11-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 17039 // CHECK11-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i32* 17040 // CHECK11-NEXT: store i32 [[TMP107]], i32* [[TMP114]], align 4 17041 // CHECK11-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 0 17042 // CHECK11-NEXT: store i8* null, i8** [[TMP115]], align 4 17043 // CHECK11-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 1 17044 // CHECK11-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to double** 17045 // CHECK11-NEXT: store double* [[TMP108]], double** [[TMP117]], align 4 17046 // CHECK11-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 1 17047 // CHECK11-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to double** 17048 // CHECK11-NEXT: store double* [[TMP108]], double** [[TMP119]], align 4 17049 // CHECK11-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 1 17050 // CHECK11-NEXT: store i8* null, i8** [[TMP120]], align 4 17051 // CHECK11-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 2 17052 // CHECK11-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to double** 17053 // CHECK11-NEXT: store double* [[TMP109]], double** [[TMP122]], align 4 17054 // CHECK11-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 2 17055 // CHECK11-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to double** 17056 // CHECK11-NEXT: store double* [[TMP109]], double** [[TMP124]], align 4 17057 // CHECK11-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 2 17058 // CHECK11-NEXT: store i8* null, i8** [[TMP125]], align 4 17059 // CHECK11-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 3 17060 // CHECK11-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to double** 17061 // CHECK11-NEXT: store double* [[TMP110]], double** [[TMP127]], align 4 17062 // CHECK11-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 3 17063 // CHECK11-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to double** 17064 // CHECK11-NEXT: store double* [[TMP110]], double** [[TMP129]], align 4 17065 // CHECK11-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 3 17066 // CHECK11-NEXT: store i8* null, i8** [[TMP130]], align 4 17067 // CHECK11-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 17068 // CHECK11-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 17069 // CHECK11-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 17070 // CHECK11-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_34]], align 4 17071 // CHECK11-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_34]], align 4 17072 // CHECK11-NEXT: [[SUB36:%.*]] = sub nsw i32 [[TMP134]], 0 17073 // CHECK11-NEXT: [[DIV37:%.*]] = sdiv i32 [[SUB36]], 1 17074 // CHECK11-NEXT: [[SUB38:%.*]] = sub nsw i32 [[DIV37]], 1 17075 // CHECK11-NEXT: store i32 [[SUB38]], i32* [[DOTCAPTURE_EXPR_35]], align 4 17076 // CHECK11-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_35]], align 4 17077 // CHECK11-NEXT: [[ADD39:%.*]] = add nsw i32 [[TMP135]], 1 17078 // CHECK11-NEXT: [[TMP136:%.*]] = zext i32 [[ADD39]] to i64 17079 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 17080 // CHECK11-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.12, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.13, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 17081 // CHECK11-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 17082 // CHECK11-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED40:%.*]], label [[OMP_OFFLOAD_CONT41:%.*]] 17083 // CHECK11: omp_offload.failed40: 17084 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478(i32 [[TMP107]], double* [[TMP108]], double* [[TMP109]], double* [[TMP110]]) #[[ATTR2]] 17085 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT41]] 17086 // CHECK11: omp_offload.cont41: 17087 // CHECK11-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 17088 // CHECK11-NEXT: store i32 [[TMP139]], i32* [[CH_CASTED42]], align 4 17089 // CHECK11-NEXT: [[TMP140:%.*]] = load i32, i32* [[CH_CASTED42]], align 4 17090 // CHECK11-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 17091 // CHECK11-NEXT: store i32 [[TMP141]], i32* [[N_CASTED43]], align 4 17092 // CHECK11-NEXT: [[TMP142:%.*]] = load i32, i32* [[N_CASTED43]], align 4 17093 // CHECK11-NEXT: [[TMP143:%.*]] = load double*, double** [[A]], align 4 17094 // CHECK11-NEXT: [[TMP144:%.*]] = load double*, double** [[B]], align 4 17095 // CHECK11-NEXT: [[TMP145:%.*]] = load double*, double** [[C]], align 4 17096 // CHECK11-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 17097 // CHECK11-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i32* 17098 // CHECK11-NEXT: store i32 [[TMP140]], i32* [[TMP147]], align 4 17099 // CHECK11-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 17100 // CHECK11-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i32* 17101 // CHECK11-NEXT: store i32 [[TMP140]], i32* [[TMP149]], align 4 17102 // CHECK11-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 0 17103 // CHECK11-NEXT: store i8* null, i8** [[TMP150]], align 4 17104 // CHECK11-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 1 17105 // CHECK11-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i32* 17106 // CHECK11-NEXT: store i32 [[TMP142]], i32* [[TMP152]], align 4 17107 // CHECK11-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 1 17108 // CHECK11-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i32* 17109 // CHECK11-NEXT: store i32 [[TMP142]], i32* [[TMP154]], align 4 17110 // CHECK11-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 1 17111 // CHECK11-NEXT: store i8* null, i8** [[TMP155]], align 4 17112 // CHECK11-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 2 17113 // CHECK11-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to double** 17114 // CHECK11-NEXT: store double* [[TMP143]], double** [[TMP157]], align 4 17115 // CHECK11-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 2 17116 // CHECK11-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to double** 17117 // CHECK11-NEXT: store double* [[TMP143]], double** [[TMP159]], align 4 17118 // CHECK11-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 2 17119 // CHECK11-NEXT: store i8* null, i8** [[TMP160]], align 4 17120 // CHECK11-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 3 17121 // CHECK11-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to double** 17122 // CHECK11-NEXT: store double* [[TMP144]], double** [[TMP162]], align 4 17123 // CHECK11-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 3 17124 // CHECK11-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to double** 17125 // CHECK11-NEXT: store double* [[TMP144]], double** [[TMP164]], align 4 17126 // CHECK11-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 3 17127 // CHECK11-NEXT: store i8* null, i8** [[TMP165]], align 4 17128 // CHECK11-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 4 17129 // CHECK11-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to double** 17130 // CHECK11-NEXT: store double* [[TMP145]], double** [[TMP167]], align 4 17131 // CHECK11-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 4 17132 // CHECK11-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to double** 17133 // CHECK11-NEXT: store double* [[TMP145]], double** [[TMP169]], align 4 17134 // CHECK11-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 4 17135 // CHECK11-NEXT: store i8* null, i8** [[TMP170]], align 4 17136 // CHECK11-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 17137 // CHECK11-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 17138 // CHECK11-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 17139 // CHECK11-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_48]], align 4 17140 // CHECK11-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_48]], align 4 17141 // CHECK11-NEXT: [[SUB50:%.*]] = sub nsw i32 [[TMP174]], 0 17142 // CHECK11-NEXT: [[DIV51:%.*]] = sdiv i32 [[SUB50]], 1 17143 // CHECK11-NEXT: [[SUB52:%.*]] = sub nsw i32 [[DIV51]], 1 17144 // CHECK11-NEXT: store i32 [[SUB52]], i32* [[DOTCAPTURE_EXPR_49]], align 4 17145 // CHECK11-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_49]], align 4 17146 // CHECK11-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP175]], 1 17147 // CHECK11-NEXT: [[TMP176:%.*]] = zext i32 [[ADD53]] to i64 17148 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 17149 // CHECK11-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.16, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.17, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 17150 // CHECK11-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 17151 // CHECK11-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED54:%.*]], label [[OMP_OFFLOAD_CONT55:%.*]] 17152 // CHECK11: omp_offload.failed54: 17153 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506(i32 [[TMP140]], i32 [[TMP142]], double* [[TMP143]], double* [[TMP144]], double* [[TMP145]]) #[[ATTR2]] 17154 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT55]] 17155 // CHECK11: omp_offload.cont55: 17156 // CHECK11-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 17157 // CHECK11-NEXT: store i32 [[TMP179]], i32* [[N_CASTED56]], align 4 17158 // CHECK11-NEXT: [[TMP180:%.*]] = load i32, i32* [[N_CASTED56]], align 4 17159 // CHECK11-NEXT: [[TMP181:%.*]] = load double*, double** [[A]], align 4 17160 // CHECK11-NEXT: [[TMP182:%.*]] = load double*, double** [[B]], align 4 17161 // CHECK11-NEXT: [[TMP183:%.*]] = load double*, double** [[C]], align 4 17162 // CHECK11-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 17163 // CHECK11-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i32* 17164 // CHECK11-NEXT: store i32 [[TMP180]], i32* [[TMP185]], align 4 17165 // CHECK11-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 17166 // CHECK11-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i32* 17167 // CHECK11-NEXT: store i32 [[TMP180]], i32* [[TMP187]], align 4 17168 // CHECK11-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 0 17169 // CHECK11-NEXT: store i8* null, i8** [[TMP188]], align 4 17170 // CHECK11-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 1 17171 // CHECK11-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to double** 17172 // CHECK11-NEXT: store double* [[TMP181]], double** [[TMP190]], align 4 17173 // CHECK11-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 1 17174 // CHECK11-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to double** 17175 // CHECK11-NEXT: store double* [[TMP181]], double** [[TMP192]], align 4 17176 // CHECK11-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 1 17177 // CHECK11-NEXT: store i8* null, i8** [[TMP193]], align 4 17178 // CHECK11-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 2 17179 // CHECK11-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to double** 17180 // CHECK11-NEXT: store double* [[TMP182]], double** [[TMP195]], align 4 17181 // CHECK11-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 2 17182 // CHECK11-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to double** 17183 // CHECK11-NEXT: store double* [[TMP182]], double** [[TMP197]], align 4 17184 // CHECK11-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 2 17185 // CHECK11-NEXT: store i8* null, i8** [[TMP198]], align 4 17186 // CHECK11-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 3 17187 // CHECK11-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to double** 17188 // CHECK11-NEXT: store double* [[TMP183]], double** [[TMP200]], align 4 17189 // CHECK11-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 3 17190 // CHECK11-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to double** 17191 // CHECK11-NEXT: store double* [[TMP183]], double** [[TMP202]], align 4 17192 // CHECK11-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 3 17193 // CHECK11-NEXT: store i8* null, i8** [[TMP203]], align 4 17194 // CHECK11-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 17195 // CHECK11-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 17196 // CHECK11-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 17197 // CHECK11-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_61]], align 4 17198 // CHECK11-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_61]], align 4 17199 // CHECK11-NEXT: [[SUB63:%.*]] = sub nsw i32 [[TMP207]], 0 17200 // CHECK11-NEXT: [[DIV64:%.*]] = sdiv i32 [[SUB63]], 1 17201 // CHECK11-NEXT: [[SUB65:%.*]] = sub nsw i32 [[DIV64]], 1 17202 // CHECK11-NEXT: store i32 [[SUB65]], i32* [[DOTCAPTURE_EXPR_62]], align 4 17203 // CHECK11-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_62]], align 4 17204 // CHECK11-NEXT: [[ADD66:%.*]] = add nsw i32 [[TMP208]], 1 17205 // CHECK11-NEXT: [[TMP209:%.*]] = zext i32 [[ADD66]] to i64 17206 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 17207 // CHECK11-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.20, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.21, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 17208 // CHECK11-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 17209 // CHECK11-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED67:%.*]], label [[OMP_OFFLOAD_CONT68:%.*]] 17210 // CHECK11: omp_offload.failed67: 17211 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536(i32 [[TMP180]], double* [[TMP181]], double* [[TMP182]], double* [[TMP183]]) #[[ATTR2]] 17212 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT68]] 17213 // CHECK11: omp_offload.cont68: 17214 // CHECK11-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 17215 // CHECK11-NEXT: store i32 [[TMP212]], i32* [[CH_CASTED69]], align 4 17216 // CHECK11-NEXT: [[TMP213:%.*]] = load i32, i32* [[CH_CASTED69]], align 4 17217 // CHECK11-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 17218 // CHECK11-NEXT: store i32 [[TMP214]], i32* [[N_CASTED70]], align 4 17219 // CHECK11-NEXT: [[TMP215:%.*]] = load i32, i32* [[N_CASTED70]], align 4 17220 // CHECK11-NEXT: [[TMP216:%.*]] = load double*, double** [[A]], align 4 17221 // CHECK11-NEXT: [[TMP217:%.*]] = load double*, double** [[B]], align 4 17222 // CHECK11-NEXT: [[TMP218:%.*]] = load double*, double** [[C]], align 4 17223 // CHECK11-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 17224 // CHECK11-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i32* 17225 // CHECK11-NEXT: store i32 [[TMP213]], i32* [[TMP220]], align 4 17226 // CHECK11-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 17227 // CHECK11-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i32* 17228 // CHECK11-NEXT: store i32 [[TMP213]], i32* [[TMP222]], align 4 17229 // CHECK11-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 0 17230 // CHECK11-NEXT: store i8* null, i8** [[TMP223]], align 4 17231 // CHECK11-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 1 17232 // CHECK11-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i32* 17233 // CHECK11-NEXT: store i32 [[TMP215]], i32* [[TMP225]], align 4 17234 // CHECK11-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 1 17235 // CHECK11-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i32* 17236 // CHECK11-NEXT: store i32 [[TMP215]], i32* [[TMP227]], align 4 17237 // CHECK11-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 1 17238 // CHECK11-NEXT: store i8* null, i8** [[TMP228]], align 4 17239 // CHECK11-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 2 17240 // CHECK11-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to double** 17241 // CHECK11-NEXT: store double* [[TMP216]], double** [[TMP230]], align 4 17242 // CHECK11-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 2 17243 // CHECK11-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to double** 17244 // CHECK11-NEXT: store double* [[TMP216]], double** [[TMP232]], align 4 17245 // CHECK11-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 2 17246 // CHECK11-NEXT: store i8* null, i8** [[TMP233]], align 4 17247 // CHECK11-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 3 17248 // CHECK11-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to double** 17249 // CHECK11-NEXT: store double* [[TMP217]], double** [[TMP235]], align 4 17250 // CHECK11-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 3 17251 // CHECK11-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to double** 17252 // CHECK11-NEXT: store double* [[TMP217]], double** [[TMP237]], align 4 17253 // CHECK11-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 3 17254 // CHECK11-NEXT: store i8* null, i8** [[TMP238]], align 4 17255 // CHECK11-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 4 17256 // CHECK11-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to double** 17257 // CHECK11-NEXT: store double* [[TMP218]], double** [[TMP240]], align 4 17258 // CHECK11-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 4 17259 // CHECK11-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to double** 17260 // CHECK11-NEXT: store double* [[TMP218]], double** [[TMP242]], align 4 17261 // CHECK11-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 4 17262 // CHECK11-NEXT: store i8* null, i8** [[TMP243]], align 4 17263 // CHECK11-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 17264 // CHECK11-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 17265 // CHECK11-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 17266 // CHECK11-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_75]], align 4 17267 // CHECK11-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_75]], align 4 17268 // CHECK11-NEXT: [[SUB77:%.*]] = sub nsw i32 [[TMP247]], 0 17269 // CHECK11-NEXT: [[DIV78:%.*]] = sdiv i32 [[SUB77]], 1 17270 // CHECK11-NEXT: [[SUB79:%.*]] = sub nsw i32 [[DIV78]], 1 17271 // CHECK11-NEXT: store i32 [[SUB79]], i32* [[DOTCAPTURE_EXPR_76]], align 4 17272 // CHECK11-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_76]], align 4 17273 // CHECK11-NEXT: [[ADD80:%.*]] = add nsw i32 [[TMP248]], 1 17274 // CHECK11-NEXT: [[TMP249:%.*]] = zext i32 [[ADD80]] to i64 17275 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 17276 // CHECK11-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.24, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.25, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 17277 // CHECK11-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 17278 // CHECK11-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED81:%.*]], label [[OMP_OFFLOAD_CONT82:%.*]] 17279 // CHECK11: omp_offload.failed81: 17280 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562(i32 [[TMP213]], i32 [[TMP215]], double* [[TMP216]], double* [[TMP217]], double* [[TMP218]]) #[[ATTR2]] 17281 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT82]] 17282 // CHECK11: omp_offload.cont82: 17283 // CHECK11-NEXT: [[CALL:%.*]] = call i32 @_Z5tmainIiET_v() 17284 // CHECK11-NEXT: ret i32 [[CALL]] 17285 // 17286 // 17287 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369 17288 // CHECK11-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1:[0-9]+]] { 17289 // CHECK11-NEXT: entry: 17290 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 17291 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 17292 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 17293 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 17294 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 17295 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 17296 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 17297 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 17298 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 17299 // CHECK11-NEXT: ret void 17300 // 17301 // 17302 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined. 17303 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17304 // CHECK11-NEXT: entry: 17305 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17306 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17307 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17308 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17309 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17310 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17311 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17312 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17313 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17314 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17315 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17316 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 17317 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 17318 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17319 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17320 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17321 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17322 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17323 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17324 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17325 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17326 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17327 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17328 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 17329 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 17330 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 17331 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 17332 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 17333 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17334 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 17335 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17336 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17337 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17338 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17339 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17340 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 17341 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17342 // CHECK11: omp.precond.then: 17343 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 17344 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17345 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 17346 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17347 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17348 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17349 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 17350 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 17351 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17352 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17353 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 17354 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17355 // CHECK11: cond.true: 17356 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17357 // CHECK11-NEXT: br label [[COND_END:%.*]] 17358 // CHECK11: cond.false: 17359 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17360 // CHECK11-NEXT: br label [[COND_END]] 17361 // CHECK11: cond.end: 17362 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 17363 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 17364 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17365 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 17366 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17367 // CHECK11: omp.inner.for.cond: 17368 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17369 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17370 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 17371 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17372 // CHECK11: omp.inner.for.body: 17373 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17374 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17375 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 17376 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17377 // CHECK11: omp.inner.for.inc: 17378 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17379 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 17380 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 17381 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 17382 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17383 // CHECK11: omp.inner.for.end: 17384 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17385 // CHECK11: omp.loop.exit: 17386 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17387 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 17388 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 17389 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17390 // CHECK11: omp.precond.end: 17391 // CHECK11-NEXT: ret void 17392 // 17393 // 17394 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..1 17395 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17396 // CHECK11-NEXT: entry: 17397 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17398 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17399 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 17400 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 17401 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17402 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17403 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17404 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17405 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17406 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17407 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17408 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17409 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17410 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 17411 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 17412 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17413 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17414 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17415 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17416 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17417 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17418 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17419 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17420 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17421 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17422 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17423 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17424 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 17425 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 17426 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 17427 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 17428 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 17429 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17430 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 17431 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17432 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17433 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17434 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17435 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17436 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 17437 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17438 // CHECK11: omp.precond.then: 17439 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 17440 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17441 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 17442 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17443 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17444 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 17445 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 17446 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17447 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17448 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17449 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 17450 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 17451 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17452 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17453 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 17454 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17455 // CHECK11: cond.true: 17456 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17457 // CHECK11-NEXT: br label [[COND_END:%.*]] 17458 // CHECK11: cond.false: 17459 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17460 // CHECK11-NEXT: br label [[COND_END]] 17461 // CHECK11: cond.end: 17462 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 17463 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 17464 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 17465 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 17466 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17467 // CHECK11: omp.inner.for.cond: 17468 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17469 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17470 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 17471 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17472 // CHECK11: omp.inner.for.body: 17473 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17474 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 17475 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 17476 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 17477 // CHECK11-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 17478 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 17479 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 17480 // CHECK11-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 17481 // CHECK11-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 17482 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 17483 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 17484 // CHECK11-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 17485 // CHECK11-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 17486 // CHECK11-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 17487 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 17488 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 17489 // CHECK11-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 17490 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 17491 // CHECK11: omp.body.continue: 17492 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17493 // CHECK11: omp.inner.for.inc: 17494 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17495 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 17496 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 17497 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17498 // CHECK11: omp.inner.for.end: 17499 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17500 // CHECK11: omp.loop.exit: 17501 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17502 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 17503 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 17504 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17505 // CHECK11: omp.precond.end: 17506 // CHECK11-NEXT: ret void 17507 // 17508 // 17509 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408 17510 // CHECK11-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 17511 // CHECK11-NEXT: entry: 17512 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 17513 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 17514 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 17515 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 17516 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 17517 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 17518 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 17519 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 17520 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 17521 // CHECK11-NEXT: ret void 17522 // 17523 // 17524 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..2 17525 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17526 // CHECK11-NEXT: entry: 17527 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17528 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17529 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17530 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17531 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17532 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17533 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17534 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17535 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17536 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17537 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17538 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 17539 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 17540 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17541 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17542 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17543 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17544 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17545 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17546 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17547 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17548 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17549 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17550 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 17551 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 17552 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 17553 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 17554 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 17555 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17556 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 17557 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17558 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17559 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17560 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17561 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17562 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 17563 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17564 // CHECK11: omp.precond.then: 17565 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 17566 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17567 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 17568 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17569 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17570 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17571 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 17572 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 17573 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17574 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17575 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 17576 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17577 // CHECK11: cond.true: 17578 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17579 // CHECK11-NEXT: br label [[COND_END:%.*]] 17580 // CHECK11: cond.false: 17581 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17582 // CHECK11-NEXT: br label [[COND_END]] 17583 // CHECK11: cond.end: 17584 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 17585 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 17586 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17587 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 17588 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17589 // CHECK11: omp.inner.for.cond: 17590 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17591 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17592 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 17593 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17594 // CHECK11: omp.inner.for.body: 17595 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17596 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17597 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 17598 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17599 // CHECK11: omp.inner.for.inc: 17600 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17601 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 17602 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 17603 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 17604 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17605 // CHECK11: omp.inner.for.end: 17606 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17607 // CHECK11: omp.loop.exit: 17608 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17609 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 17610 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 17611 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17612 // CHECK11: omp.precond.end: 17613 // CHECK11-NEXT: ret void 17614 // 17615 // 17616 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..3 17617 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17618 // CHECK11-NEXT: entry: 17619 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17620 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17621 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 17622 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 17623 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17624 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17625 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17626 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17627 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17628 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17629 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17630 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17631 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17632 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 17633 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 17634 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17635 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17636 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17637 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17638 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17639 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17640 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17641 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17642 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17643 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17644 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17645 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17646 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 17647 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 17648 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 17649 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 17650 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 17651 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17652 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 17653 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17654 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17655 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17656 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17657 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17658 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 17659 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17660 // CHECK11: omp.precond.then: 17661 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 17662 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17663 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 17664 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17665 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17666 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 17667 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 17668 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17669 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17670 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17671 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 17672 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 17673 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17674 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17675 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 17676 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17677 // CHECK11: cond.true: 17678 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17679 // CHECK11-NEXT: br label [[COND_END:%.*]] 17680 // CHECK11: cond.false: 17681 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17682 // CHECK11-NEXT: br label [[COND_END]] 17683 // CHECK11: cond.end: 17684 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 17685 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 17686 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 17687 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 17688 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17689 // CHECK11: omp.inner.for.cond: 17690 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17691 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17692 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 17693 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17694 // CHECK11: omp.inner.for.body: 17695 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17696 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 17697 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 17698 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 17699 // CHECK11-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 17700 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 17701 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 17702 // CHECK11-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 17703 // CHECK11-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 17704 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 17705 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 17706 // CHECK11-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 17707 // CHECK11-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 17708 // CHECK11-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 17709 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 17710 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 17711 // CHECK11-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 17712 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 17713 // CHECK11: omp.body.continue: 17714 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17715 // CHECK11: omp.inner.for.inc: 17716 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17717 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 17718 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 17719 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17720 // CHECK11: omp.inner.for.end: 17721 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17722 // CHECK11: omp.loop.exit: 17723 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17724 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 17725 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 17726 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17727 // CHECK11: omp.precond.end: 17728 // CHECK11-NEXT: ret void 17729 // 17730 // 17731 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447 17732 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 17733 // CHECK11-NEXT: entry: 17734 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 17735 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 17736 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 17737 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 17738 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 17739 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 17740 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 17741 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 17742 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 17743 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 17744 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 17745 // CHECK11-NEXT: ret void 17746 // 17747 // 17748 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..6 17749 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17750 // CHECK11-NEXT: entry: 17751 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17752 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17753 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 17754 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17755 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17756 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17757 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17758 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17759 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17760 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17761 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17762 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17763 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 17764 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 17765 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17766 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17767 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17768 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17769 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17770 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 17771 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17772 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17773 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17774 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17775 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 17776 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17777 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 17778 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 17779 // CHECK11-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 17780 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 17781 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 17782 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17783 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 17784 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17785 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17786 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17787 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17788 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17789 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 17790 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17791 // CHECK11: omp.precond.then: 17792 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 17793 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17794 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 17795 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17796 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17797 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 17798 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17799 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 17800 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 17801 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17802 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17803 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 17804 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17805 // CHECK11: cond.true: 17806 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17807 // CHECK11-NEXT: br label [[COND_END:%.*]] 17808 // CHECK11: cond.false: 17809 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17810 // CHECK11-NEXT: br label [[COND_END]] 17811 // CHECK11: cond.end: 17812 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 17813 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 17814 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17815 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 17816 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17817 // CHECK11: omp.inner.for.cond: 17818 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17819 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17820 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 17821 // CHECK11-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 17822 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17823 // CHECK11: omp.inner.for.body: 17824 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17825 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17826 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 17827 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17828 // CHECK11: omp.inner.for.inc: 17829 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17830 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 17831 // CHECK11-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 17832 // CHECK11-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 17833 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17834 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 17835 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 17836 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 17837 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17838 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 17839 // CHECK11-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 17840 // CHECK11-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 17841 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17842 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17843 // CHECK11-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 17844 // CHECK11-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 17845 // CHECK11: cond.true10: 17846 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17847 // CHECK11-NEXT: br label [[COND_END12:%.*]] 17848 // CHECK11: cond.false11: 17849 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 17850 // CHECK11-NEXT: br label [[COND_END12]] 17851 // CHECK11: cond.end12: 17852 // CHECK11-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 17853 // CHECK11-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 17854 // CHECK11-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 17855 // CHECK11-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 17856 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17857 // CHECK11: omp.inner.for.end: 17858 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17859 // CHECK11: omp.loop.exit: 17860 // CHECK11-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17861 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 17862 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 17863 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17864 // CHECK11: omp.precond.end: 17865 // CHECK11-NEXT: ret void 17866 // 17867 // 17868 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..7 17869 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 17870 // CHECK11-NEXT: entry: 17871 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 17872 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 17873 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 17874 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 17875 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 17876 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 17877 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 17878 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 17879 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 17880 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 17881 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 17882 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 17883 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 17884 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 17885 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 17886 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 17887 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 17888 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 17889 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 17890 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 17891 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17892 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17893 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 17894 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 17895 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 17896 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 17897 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 17898 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 17899 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 17900 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 17901 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 17902 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 17903 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17904 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 17905 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 17906 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 17907 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 17908 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 17909 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 17910 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 17911 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 17912 // CHECK11: omp.precond.then: 17913 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 17914 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17915 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 17916 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 17917 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 17918 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 17919 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 17920 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 17921 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 17922 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17923 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 17924 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 17925 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17926 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17927 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 17928 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 17929 // CHECK11: cond.true: 17930 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 17931 // CHECK11-NEXT: br label [[COND_END:%.*]] 17932 // CHECK11: cond.false: 17933 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17934 // CHECK11-NEXT: br label [[COND_END]] 17935 // CHECK11: cond.end: 17936 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 17937 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 17938 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 17939 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 17940 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 17941 // CHECK11: omp.inner.for.cond: 17942 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17943 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 17944 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 17945 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 17946 // CHECK11: omp.inner.for.body: 17947 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17948 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 17949 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 17950 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 17951 // CHECK11-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 17952 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 17953 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 17954 // CHECK11-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 17955 // CHECK11-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 17956 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 17957 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 17958 // CHECK11-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 17959 // CHECK11-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 17960 // CHECK11-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 17961 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 17962 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 17963 // CHECK11-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 17964 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 17965 // CHECK11: omp.body.continue: 17966 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 17967 // CHECK11: omp.inner.for.inc: 17968 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 17969 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 17970 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 17971 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 17972 // CHECK11: omp.inner.for.end: 17973 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 17974 // CHECK11: omp.loop.exit: 17975 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 17976 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 17977 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 17978 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 17979 // CHECK11: omp.precond.end: 17980 // CHECK11-NEXT: ret void 17981 // 17982 // 17983 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478 17984 // CHECK11-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 17985 // CHECK11-NEXT: entry: 17986 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 17987 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 17988 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 17989 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 17990 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 17991 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 17992 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 17993 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 17994 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 17995 // CHECK11-NEXT: ret void 17996 // 17997 // 17998 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..10 17999 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18000 // CHECK11-NEXT: entry: 18001 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18002 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18003 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18004 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18005 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18006 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18007 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18008 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18009 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18010 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18011 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18012 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 18013 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 18014 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18015 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18016 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 18017 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18018 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18019 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18020 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18021 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18022 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18023 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18024 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18025 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18026 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18027 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18028 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 18029 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18030 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18031 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18032 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 18033 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18034 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18035 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18036 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18037 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18038 // CHECK11: omp.precond.then: 18039 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 18040 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18041 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 18042 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18043 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18044 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18045 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 18046 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 18047 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18048 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18049 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 18050 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18051 // CHECK11: cond.true: 18052 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18053 // CHECK11-NEXT: br label [[COND_END:%.*]] 18054 // CHECK11: cond.false: 18055 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18056 // CHECK11-NEXT: br label [[COND_END]] 18057 // CHECK11: cond.end: 18058 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 18059 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 18060 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18061 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 18062 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18063 // CHECK11: omp.inner.for.cond: 18064 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18065 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18066 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 18067 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18068 // CHECK11: omp.inner.for.body: 18069 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18070 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18071 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 18072 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18073 // CHECK11: omp.inner.for.inc: 18074 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18075 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18076 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 18077 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 18078 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18079 // CHECK11: omp.inner.for.end: 18080 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 18081 // CHECK11: omp.loop.exit: 18082 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18083 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 18084 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 18085 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18086 // CHECK11: omp.precond.end: 18087 // CHECK11-NEXT: ret void 18088 // 18089 // 18090 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..11 18091 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18092 // CHECK11-NEXT: entry: 18093 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18094 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18095 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 18096 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 18097 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18098 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18099 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18100 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18101 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18102 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18103 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18104 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18105 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18106 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 18107 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 18108 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18109 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18110 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 18111 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18112 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18113 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18114 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18115 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18116 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18117 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18118 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18119 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18120 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18121 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18122 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18123 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18124 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 18125 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18126 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18127 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18128 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 18129 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18130 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18131 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18132 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18133 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18134 // CHECK11: omp.precond.then: 18135 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 18136 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18137 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 18138 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18139 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18140 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 18141 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 18142 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18143 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18144 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18145 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 18146 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 18147 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18148 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18149 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 18150 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18151 // CHECK11: cond.true: 18152 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18153 // CHECK11-NEXT: br label [[COND_END:%.*]] 18154 // CHECK11: cond.false: 18155 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18156 // CHECK11-NEXT: br label [[COND_END]] 18157 // CHECK11: cond.end: 18158 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 18159 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 18160 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18161 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 18162 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18163 // CHECK11: omp.inner.for.cond: 18164 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18165 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18166 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 18167 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18168 // CHECK11: omp.inner.for.body: 18169 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18170 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 18171 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 18172 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 18173 // CHECK11-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 18174 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 18175 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 18176 // CHECK11-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 18177 // CHECK11-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 18178 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 18179 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 18180 // CHECK11-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 18181 // CHECK11-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 18182 // CHECK11-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 18183 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 18184 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 18185 // CHECK11-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 18186 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 18187 // CHECK11: omp.body.continue: 18188 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18189 // CHECK11: omp.inner.for.inc: 18190 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18191 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 18192 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 18193 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18194 // CHECK11: omp.inner.for.end: 18195 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 18196 // CHECK11: omp.loop.exit: 18197 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18198 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 18199 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 18200 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18201 // CHECK11: omp.precond.end: 18202 // CHECK11-NEXT: ret void 18203 // 18204 // 18205 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506 18206 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 18207 // CHECK11-NEXT: entry: 18208 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 18209 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 18210 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 18211 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 18212 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 18213 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 18214 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 18215 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 18216 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 18217 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 18218 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 18219 // CHECK11-NEXT: ret void 18220 // 18221 // 18222 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..14 18223 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18224 // CHECK11-NEXT: entry: 18225 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18226 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18227 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 18228 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18229 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18230 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18231 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18232 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18233 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18234 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18235 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18236 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 18237 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18238 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 18239 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 18240 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18241 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18242 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 18243 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 18244 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18245 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18246 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 18247 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18248 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18249 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18250 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18251 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 18252 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18253 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 18254 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 18255 // CHECK11-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 18256 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 18257 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 18258 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 18259 // CHECK11-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18260 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18261 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 18262 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18263 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 18264 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 18265 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18266 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18267 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 18268 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18269 // CHECK11: omp.precond.then: 18270 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 18271 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18272 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 18273 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18274 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18275 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18276 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 18277 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 18278 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18279 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18280 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 18281 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18282 // CHECK11: cond.true: 18283 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18284 // CHECK11-NEXT: br label [[COND_END:%.*]] 18285 // CHECK11: cond.false: 18286 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18287 // CHECK11-NEXT: br label [[COND_END]] 18288 // CHECK11: cond.end: 18289 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 18290 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 18291 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18292 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 18293 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18294 // CHECK11: omp.inner.for.cond: 18295 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18296 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18297 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 18298 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18299 // CHECK11: omp.inner.for.body: 18300 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18301 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18302 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18303 // CHECK11-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 18304 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 18305 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 18306 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18307 // CHECK11: omp.inner.for.inc: 18308 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18309 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18310 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 18311 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 18312 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18313 // CHECK11: omp.inner.for.end: 18314 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 18315 // CHECK11: omp.loop.exit: 18316 // CHECK11-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18317 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 18318 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 18319 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18320 // CHECK11: omp.precond.end: 18321 // CHECK11-NEXT: ret void 18322 // 18323 // 18324 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..15 18325 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 18326 // CHECK11-NEXT: entry: 18327 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18328 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18329 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 18330 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 18331 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18332 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18333 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18334 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18335 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 18336 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18337 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18338 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18339 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 18340 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18341 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 18342 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 18343 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18344 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18345 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 18346 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18347 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18348 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18349 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18350 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18351 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18352 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18353 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18354 // CHECK11-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 18355 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18356 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18357 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18358 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18359 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18360 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18361 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18362 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18363 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18364 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 18365 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 18366 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18367 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18368 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18369 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18370 // CHECK11: omp.precond.then: 18371 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 18372 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18373 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 18374 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18375 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18376 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 18377 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 18378 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18379 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18380 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 18381 // CHECK11-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18382 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 18383 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 18384 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 18385 // CHECK11: omp.dispatch.cond: 18386 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18387 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18388 // CHECK11-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 18389 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18390 // CHECK11: cond.true: 18391 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18392 // CHECK11-NEXT: br label [[COND_END:%.*]] 18393 // CHECK11: cond.false: 18394 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18395 // CHECK11-NEXT: br label [[COND_END]] 18396 // CHECK11: cond.end: 18397 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 18398 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 18399 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18400 // CHECK11-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 18401 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18402 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18403 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 18404 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 18405 // CHECK11: omp.dispatch.body: 18406 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18407 // CHECK11: omp.inner.for.cond: 18408 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18409 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18410 // CHECK11-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 18411 // CHECK11-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18412 // CHECK11: omp.inner.for.body: 18413 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18414 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 18415 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 18416 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 18417 // CHECK11-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 4 18418 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 18419 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 18420 // CHECK11-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 4 18421 // CHECK11-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 4 18422 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 18423 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 18424 // CHECK11-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX8]], align 4 18425 // CHECK11-NEXT: [[ADD9:%.*]] = fadd double [[TMP25]], [[TMP28]] 18426 // CHECK11-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 4 18427 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 18428 // CHECK11-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP29]], i32 [[TMP30]] 18429 // CHECK11-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 18430 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 18431 // CHECK11: omp.body.continue: 18432 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18433 // CHECK11: omp.inner.for.inc: 18434 // CHECK11-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18435 // CHECK11-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP31]], 1 18436 // CHECK11-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 18437 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18438 // CHECK11: omp.inner.for.end: 18439 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 18440 // CHECK11: omp.dispatch.inc: 18441 // CHECK11-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18442 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18443 // CHECK11-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 18444 // CHECK11-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 18445 // CHECK11-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18446 // CHECK11-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18447 // CHECK11-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 18448 // CHECK11-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 18449 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 18450 // CHECK11: omp.dispatch.end: 18451 // CHECK11-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18452 // CHECK11-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 18453 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 18454 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18455 // CHECK11: omp.precond.end: 18456 // CHECK11-NEXT: ret void 18457 // 18458 // 18459 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536 18460 // CHECK11-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 18461 // CHECK11-NEXT: entry: 18462 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 18463 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 18464 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 18465 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 18466 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 18467 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 18468 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 18469 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 18470 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 18471 // CHECK11-NEXT: ret void 18472 // 18473 // 18474 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..18 18475 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18476 // CHECK11-NEXT: entry: 18477 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18478 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18479 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18480 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18481 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18482 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18483 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18484 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18485 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18486 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18487 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18488 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 18489 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 18490 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18491 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18492 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 18493 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18494 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18495 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18496 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18497 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18498 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18499 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18500 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18501 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18502 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18503 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18504 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 18505 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18506 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18507 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18508 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 18509 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18510 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18511 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18512 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18513 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18514 // CHECK11: omp.precond.then: 18515 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 18516 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18517 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 18518 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18519 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18520 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18521 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 18522 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 18523 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18524 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18525 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 18526 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18527 // CHECK11: cond.true: 18528 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18529 // CHECK11-NEXT: br label [[COND_END:%.*]] 18530 // CHECK11: cond.false: 18531 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18532 // CHECK11-NEXT: br label [[COND_END]] 18533 // CHECK11: cond.end: 18534 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 18535 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 18536 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18537 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 18538 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18539 // CHECK11: omp.inner.for.cond: 18540 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18541 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18542 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 18543 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18544 // CHECK11: omp.inner.for.body: 18545 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18546 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18547 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 18548 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18549 // CHECK11: omp.inner.for.inc: 18550 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18551 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18552 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 18553 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 18554 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18555 // CHECK11: omp.inner.for.end: 18556 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 18557 // CHECK11: omp.loop.exit: 18558 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18559 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 18560 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 18561 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18562 // CHECK11: omp.precond.end: 18563 // CHECK11-NEXT: ret void 18564 // 18565 // 18566 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..19 18567 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18568 // CHECK11-NEXT: entry: 18569 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18570 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18571 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 18572 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 18573 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18574 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18575 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18576 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18577 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18578 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18579 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18580 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18581 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18582 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 18583 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 18584 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18585 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18586 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 18587 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18588 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18589 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18590 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18591 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18592 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18593 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18594 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18595 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18596 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18597 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18598 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18599 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18600 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 18601 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18602 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18603 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18604 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 18605 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18606 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18607 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18608 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18609 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18610 // CHECK11: omp.precond.then: 18611 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 18612 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18613 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 18614 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18615 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18616 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 18617 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 18618 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18619 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18620 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18621 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18622 // CHECK11-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18623 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 18624 // CHECK11-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 18625 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 18626 // CHECK11: omp.dispatch.cond: 18627 // CHECK11-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18628 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 18629 // CHECK11-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 18630 // CHECK11-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 18631 // CHECK11-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 18632 // CHECK11: omp.dispatch.body: 18633 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18634 // CHECK11-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 18635 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18636 // CHECK11: omp.inner.for.cond: 18637 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 18638 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !19 18639 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 18640 // CHECK11-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18641 // CHECK11: omp.inner.for.body: 18642 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 18643 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 18644 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 18645 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !19 18646 // CHECK11-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !19 18647 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 18648 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i32 [[TMP22]] 18649 // CHECK11-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !19 18650 // CHECK11-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !19 18651 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 18652 // CHECK11-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 18653 // CHECK11-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX5]], align 4, !llvm.access.group !19 18654 // CHECK11-NEXT: [[ADD6:%.*]] = fadd double [[TMP23]], [[TMP26]] 18655 // CHECK11-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !19 18656 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 18657 // CHECK11-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 18658 // CHECK11-NEXT: store double [[ADD6]], double* [[ARRAYIDX7]], align 4, !llvm.access.group !19 18659 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 18660 // CHECK11: omp.body.continue: 18661 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18662 // CHECK11: omp.inner.for.inc: 18663 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 18664 // CHECK11-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP29]], 1 18665 // CHECK11-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 18666 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP20:![0-9]+]] 18667 // CHECK11: omp.inner.for.end: 18668 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 18669 // CHECK11: omp.dispatch.inc: 18670 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 18671 // CHECK11: omp.dispatch.end: 18672 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18673 // CHECK11: omp.precond.end: 18674 // CHECK11-NEXT: ret void 18675 // 18676 // 18677 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562 18678 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 18679 // CHECK11-NEXT: entry: 18680 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 18681 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 18682 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 18683 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 18684 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 18685 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 18686 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 18687 // CHECK11-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 18688 // CHECK11-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 18689 // CHECK11-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 18690 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 18691 // CHECK11-NEXT: ret void 18692 // 18693 // 18694 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..22 18695 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 18696 // CHECK11-NEXT: entry: 18697 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18698 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18699 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 18700 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18701 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18702 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18703 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18704 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18705 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18706 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18707 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18708 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 18709 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18710 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 18711 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 18712 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18713 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18714 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 18715 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 18716 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18717 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18718 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 18719 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18720 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18721 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18722 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18723 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 18724 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18725 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 18726 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 18727 // CHECK11-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 18728 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 18729 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 18730 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 18731 // CHECK11-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18732 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18733 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 18734 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18735 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 18736 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 18737 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18738 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18739 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 18740 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18741 // CHECK11: omp.precond.then: 18742 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 18743 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18744 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 18745 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18746 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18747 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18748 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 18749 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 18750 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18751 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18752 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 18753 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 18754 // CHECK11: cond.true: 18755 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18756 // CHECK11-NEXT: br label [[COND_END:%.*]] 18757 // CHECK11: cond.false: 18758 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18759 // CHECK11-NEXT: br label [[COND_END]] 18760 // CHECK11: cond.end: 18761 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 18762 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 18763 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18764 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 18765 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18766 // CHECK11: omp.inner.for.cond: 18767 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18768 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18769 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 18770 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18771 // CHECK11: omp.inner.for.body: 18772 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 18773 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 18774 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 18775 // CHECK11-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 18776 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 18777 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 18778 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18779 // CHECK11: omp.inner.for.inc: 18780 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 18781 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 18782 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 18783 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 18784 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 18785 // CHECK11: omp.inner.for.end: 18786 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 18787 // CHECK11: omp.loop.exit: 18788 // CHECK11-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18789 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 18790 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 18791 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18792 // CHECK11: omp.precond.end: 18793 // CHECK11-NEXT: ret void 18794 // 18795 // 18796 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..23 18797 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 18798 // CHECK11-NEXT: entry: 18799 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 18800 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 18801 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 18802 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 18803 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 18804 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 18805 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 18806 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 18807 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 18808 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 18809 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18810 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18811 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 18812 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 18813 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 18814 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 18815 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 18816 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 18817 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 18818 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 18819 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 18820 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18821 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18822 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 18823 // CHECK11-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 18824 // CHECK11-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 18825 // CHECK11-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 18826 // CHECK11-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 18827 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 18828 // CHECK11-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 18829 // CHECK11-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 18830 // CHECK11-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 18831 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 18832 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 18833 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18834 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 18835 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 18836 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 18837 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 18838 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 18839 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 18840 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 18841 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 18842 // CHECK11: omp.precond.then: 18843 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 18844 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 18845 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 18846 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 18847 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 18848 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 18849 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 18850 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 18851 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 18852 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 18853 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18854 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 18855 // CHECK11-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18856 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 18857 // CHECK11-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 18858 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 18859 // CHECK11: omp.dispatch.cond: 18860 // CHECK11-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 18861 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 18862 // CHECK11-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 18863 // CHECK11-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 18864 // CHECK11-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 18865 // CHECK11: omp.dispatch.body: 18866 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 18867 // CHECK11-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 18868 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 18869 // CHECK11: omp.inner.for.cond: 18870 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 18871 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !22 18872 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 18873 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 18874 // CHECK11: omp.inner.for.body: 18875 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 18876 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 18877 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 18878 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !22 18879 // CHECK11-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !22 18880 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 18881 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i32 [[TMP23]] 18882 // CHECK11-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !22 18883 // CHECK11-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !22 18884 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 18885 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP25]], i32 [[TMP26]] 18886 // CHECK11-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX6]], align 4, !llvm.access.group !22 18887 // CHECK11-NEXT: [[ADD7:%.*]] = fadd double [[TMP24]], [[TMP27]] 18888 // CHECK11-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !22 18889 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 18890 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP28]], i32 [[TMP29]] 18891 // CHECK11-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4, !llvm.access.group !22 18892 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 18893 // CHECK11: omp.body.continue: 18894 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 18895 // CHECK11: omp.inner.for.inc: 18896 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 18897 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP30]], 1 18898 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 18899 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP23:![0-9]+]] 18900 // CHECK11: omp.inner.for.end: 18901 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 18902 // CHECK11: omp.dispatch.inc: 18903 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 18904 // CHECK11: omp.dispatch.end: 18905 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 18906 // CHECK11: omp.precond.end: 18907 // CHECK11-NEXT: ret void 18908 // 18909 // 18910 // CHECK11-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 18911 // CHECK11-SAME: () #[[ATTR3:[0-9]+]] comdat { 18912 // CHECK11-NEXT: entry: 18913 // CHECK11-NEXT: [[A:%.*]] = alloca i32*, align 4 18914 // CHECK11-NEXT: [[B:%.*]] = alloca i32*, align 4 18915 // CHECK11-NEXT: [[C:%.*]] = alloca i32*, align 4 18916 // CHECK11-NEXT: [[N:%.*]] = alloca i32, align 4 18917 // CHECK11-NEXT: [[CH:%.*]] = alloca i32, align 4 18918 // CHECK11-NEXT: [[N_CASTED:%.*]] = alloca i32, align 4 18919 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 4 18920 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 4 18921 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 4 18922 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 18923 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 18924 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 18925 // CHECK11-NEXT: [[N_CASTED3:%.*]] = alloca i32, align 4 18926 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS4:%.*]] = alloca [4 x i8*], align 4 18927 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS5:%.*]] = alloca [4 x i8*], align 4 18928 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS6:%.*]] = alloca [4 x i8*], align 4 18929 // CHECK11-NEXT: [[_TMP7:%.*]] = alloca i32, align 4 18930 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_8:%.*]] = alloca i32, align 4 18931 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 18932 // CHECK11-NEXT: [[CH_CASTED:%.*]] = alloca i32, align 4 18933 // CHECK11-NEXT: [[N_CASTED16:%.*]] = alloca i32, align 4 18934 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS17:%.*]] = alloca [5 x i8*], align 4 18935 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS18:%.*]] = alloca [5 x i8*], align 4 18936 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS19:%.*]] = alloca [5 x i8*], align 4 18937 // CHECK11-NEXT: [[_TMP20:%.*]] = alloca i32, align 4 18938 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_21:%.*]] = alloca i32, align 4 18939 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_22:%.*]] = alloca i32, align 4 18940 // CHECK11-NEXT: [[N_CASTED29:%.*]] = alloca i32, align 4 18941 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS30:%.*]] = alloca [4 x i8*], align 4 18942 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS31:%.*]] = alloca [4 x i8*], align 4 18943 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS32:%.*]] = alloca [4 x i8*], align 4 18944 // CHECK11-NEXT: [[_TMP33:%.*]] = alloca i32, align 4 18945 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_34:%.*]] = alloca i32, align 4 18946 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_35:%.*]] = alloca i32, align 4 18947 // CHECK11-NEXT: [[CH_CASTED42:%.*]] = alloca i32, align 4 18948 // CHECK11-NEXT: [[N_CASTED43:%.*]] = alloca i32, align 4 18949 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS44:%.*]] = alloca [5 x i8*], align 4 18950 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS45:%.*]] = alloca [5 x i8*], align 4 18951 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS46:%.*]] = alloca [5 x i8*], align 4 18952 // CHECK11-NEXT: [[_TMP47:%.*]] = alloca i32, align 4 18953 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_48:%.*]] = alloca i32, align 4 18954 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_49:%.*]] = alloca i32, align 4 18955 // CHECK11-NEXT: [[N_CASTED56:%.*]] = alloca i32, align 4 18956 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS57:%.*]] = alloca [4 x i8*], align 4 18957 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS58:%.*]] = alloca [4 x i8*], align 4 18958 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS59:%.*]] = alloca [4 x i8*], align 4 18959 // CHECK11-NEXT: [[_TMP60:%.*]] = alloca i32, align 4 18960 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_61:%.*]] = alloca i32, align 4 18961 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_62:%.*]] = alloca i32, align 4 18962 // CHECK11-NEXT: [[CH_CASTED69:%.*]] = alloca i32, align 4 18963 // CHECK11-NEXT: [[N_CASTED70:%.*]] = alloca i32, align 4 18964 // CHECK11-NEXT: [[DOTOFFLOAD_BASEPTRS71:%.*]] = alloca [5 x i8*], align 4 18965 // CHECK11-NEXT: [[DOTOFFLOAD_PTRS72:%.*]] = alloca [5 x i8*], align 4 18966 // CHECK11-NEXT: [[DOTOFFLOAD_MAPPERS73:%.*]] = alloca [5 x i8*], align 4 18967 // CHECK11-NEXT: [[_TMP74:%.*]] = alloca i32, align 4 18968 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 18969 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_76:%.*]] = alloca i32, align 4 18970 // CHECK11-NEXT: store i32 10000, i32* [[N]], align 4 18971 // CHECK11-NEXT: store i32 100, i32* [[CH]], align 4 18972 // CHECK11-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 18973 // CHECK11-NEXT: store i32 [[TMP0]], i32* [[N_CASTED]], align 4 18974 // CHECK11-NEXT: [[TMP1:%.*]] = load i32, i32* [[N_CASTED]], align 4 18975 // CHECK11-NEXT: [[TMP2:%.*]] = load i32*, i32** [[A]], align 4 18976 // CHECK11-NEXT: [[TMP3:%.*]] = load i32*, i32** [[B]], align 4 18977 // CHECK11-NEXT: [[TMP4:%.*]] = load i32*, i32** [[C]], align 4 18978 // CHECK11-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 18979 // CHECK11-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i32* 18980 // CHECK11-NEXT: store i32 [[TMP1]], i32* [[TMP6]], align 4 18981 // CHECK11-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 18982 // CHECK11-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i32* 18983 // CHECK11-NEXT: store i32 [[TMP1]], i32* [[TMP8]], align 4 18984 // CHECK11-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 0 18985 // CHECK11-NEXT: store i8* null, i8** [[TMP9]], align 4 18986 // CHECK11-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 18987 // CHECK11-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to i32** 18988 // CHECK11-NEXT: store i32* [[TMP2]], i32** [[TMP11]], align 4 18989 // CHECK11-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 18990 // CHECK11-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to i32** 18991 // CHECK11-NEXT: store i32* [[TMP2]], i32** [[TMP13]], align 4 18992 // CHECK11-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 1 18993 // CHECK11-NEXT: store i8* null, i8** [[TMP14]], align 4 18994 // CHECK11-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 18995 // CHECK11-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to i32** 18996 // CHECK11-NEXT: store i32* [[TMP3]], i32** [[TMP16]], align 4 18997 // CHECK11-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 18998 // CHECK11-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to i32** 18999 // CHECK11-NEXT: store i32* [[TMP3]], i32** [[TMP18]], align 4 19000 // CHECK11-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 2 19001 // CHECK11-NEXT: store i8* null, i8** [[TMP19]], align 4 19002 // CHECK11-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 19003 // CHECK11-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to i32** 19004 // CHECK11-NEXT: store i32* [[TMP4]], i32** [[TMP21]], align 4 19005 // CHECK11-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 19006 // CHECK11-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to i32** 19007 // CHECK11-NEXT: store i32* [[TMP4]], i32** [[TMP23]], align 4 19008 // CHECK11-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 3 19009 // CHECK11-NEXT: store i8* null, i8** [[TMP24]], align 4 19010 // CHECK11-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 19011 // CHECK11-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 19012 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 19013 // CHECK11-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 19014 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19015 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 19016 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19017 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19018 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19019 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19020 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 19021 // CHECK11-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 19022 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP30]]) 19023 // CHECK11-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.28, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.29, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19024 // CHECK11-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 19025 // CHECK11-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 19026 // CHECK11: omp_offload.failed: 19027 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42(i32 [[TMP1]], i32* [[TMP2]], i32* [[TMP3]], i32* [[TMP4]]) #[[ATTR2]] 19028 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT]] 19029 // CHECK11: omp_offload.cont: 19030 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 19031 // CHECK11-NEXT: store i32 [[TMP33]], i32* [[N_CASTED3]], align 4 19032 // CHECK11-NEXT: [[TMP34:%.*]] = load i32, i32* [[N_CASTED3]], align 4 19033 // CHECK11-NEXT: [[TMP35:%.*]] = load i32*, i32** [[A]], align 4 19034 // CHECK11-NEXT: [[TMP36:%.*]] = load i32*, i32** [[B]], align 4 19035 // CHECK11-NEXT: [[TMP37:%.*]] = load i32*, i32** [[C]], align 4 19036 // CHECK11-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 19037 // CHECK11-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i32* 19038 // CHECK11-NEXT: store i32 [[TMP34]], i32* [[TMP39]], align 4 19039 // CHECK11-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 19040 // CHECK11-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i32* 19041 // CHECK11-NEXT: store i32 [[TMP34]], i32* [[TMP41]], align 4 19042 // CHECK11-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 0 19043 // CHECK11-NEXT: store i8* null, i8** [[TMP42]], align 4 19044 // CHECK11-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 1 19045 // CHECK11-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to i32** 19046 // CHECK11-NEXT: store i32* [[TMP35]], i32** [[TMP44]], align 4 19047 // CHECK11-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 1 19048 // CHECK11-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to i32** 19049 // CHECK11-NEXT: store i32* [[TMP35]], i32** [[TMP46]], align 4 19050 // CHECK11-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 1 19051 // CHECK11-NEXT: store i8* null, i8** [[TMP47]], align 4 19052 // CHECK11-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 2 19053 // CHECK11-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to i32** 19054 // CHECK11-NEXT: store i32* [[TMP36]], i32** [[TMP49]], align 4 19055 // CHECK11-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 2 19056 // CHECK11-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to i32** 19057 // CHECK11-NEXT: store i32* [[TMP36]], i32** [[TMP51]], align 4 19058 // CHECK11-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 2 19059 // CHECK11-NEXT: store i8* null, i8** [[TMP52]], align 4 19060 // CHECK11-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 3 19061 // CHECK11-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to i32** 19062 // CHECK11-NEXT: store i32* [[TMP37]], i32** [[TMP54]], align 4 19063 // CHECK11-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 3 19064 // CHECK11-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to i32** 19065 // CHECK11-NEXT: store i32* [[TMP37]], i32** [[TMP56]], align 4 19066 // CHECK11-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 3 19067 // CHECK11-NEXT: store i8* null, i8** [[TMP57]], align 4 19068 // CHECK11-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 19069 // CHECK11-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 19070 // CHECK11-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 19071 // CHECK11-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_8]], align 4 19072 // CHECK11-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_8]], align 4 19073 // CHECK11-NEXT: [[SUB10:%.*]] = sub nsw i32 [[TMP61]], 0 19074 // CHECK11-NEXT: [[DIV11:%.*]] = sdiv i32 [[SUB10]], 1 19075 // CHECK11-NEXT: [[SUB12:%.*]] = sub nsw i32 [[DIV11]], 1 19076 // CHECK11-NEXT: store i32 [[SUB12]], i32* [[DOTCAPTURE_EXPR_9]], align 4 19077 // CHECK11-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 19078 // CHECK11-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP62]], 1 19079 // CHECK11-NEXT: [[TMP63:%.*]] = zext i32 [[ADD13]] to i64 19080 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 19081 // CHECK11-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.32, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.33, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19082 // CHECK11-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 19083 // CHECK11-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED14:%.*]], label [[OMP_OFFLOAD_CONT15:%.*]] 19084 // CHECK11: omp_offload.failed14: 19085 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51(i32 [[TMP34]], i32* [[TMP35]], i32* [[TMP36]], i32* [[TMP37]]) #[[ATTR2]] 19086 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT15]] 19087 // CHECK11: omp_offload.cont15: 19088 // CHECK11-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 19089 // CHECK11-NEXT: store i32 [[TMP66]], i32* [[CH_CASTED]], align 4 19090 // CHECK11-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH_CASTED]], align 4 19091 // CHECK11-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 19092 // CHECK11-NEXT: store i32 [[TMP68]], i32* [[N_CASTED16]], align 4 19093 // CHECK11-NEXT: [[TMP69:%.*]] = load i32, i32* [[N_CASTED16]], align 4 19094 // CHECK11-NEXT: [[TMP70:%.*]] = load i32*, i32** [[A]], align 4 19095 // CHECK11-NEXT: [[TMP71:%.*]] = load i32*, i32** [[B]], align 4 19096 // CHECK11-NEXT: [[TMP72:%.*]] = load i32*, i32** [[C]], align 4 19097 // CHECK11-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 19098 // CHECK11-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i32* 19099 // CHECK11-NEXT: store i32 [[TMP67]], i32* [[TMP74]], align 4 19100 // CHECK11-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 19101 // CHECK11-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i32* 19102 // CHECK11-NEXT: store i32 [[TMP67]], i32* [[TMP76]], align 4 19103 // CHECK11-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 0 19104 // CHECK11-NEXT: store i8* null, i8** [[TMP77]], align 4 19105 // CHECK11-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 1 19106 // CHECK11-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i32* 19107 // CHECK11-NEXT: store i32 [[TMP69]], i32* [[TMP79]], align 4 19108 // CHECK11-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 1 19109 // CHECK11-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i32* 19110 // CHECK11-NEXT: store i32 [[TMP69]], i32* [[TMP81]], align 4 19111 // CHECK11-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 1 19112 // CHECK11-NEXT: store i8* null, i8** [[TMP82]], align 4 19113 // CHECK11-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 2 19114 // CHECK11-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to i32** 19115 // CHECK11-NEXT: store i32* [[TMP70]], i32** [[TMP84]], align 4 19116 // CHECK11-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 2 19117 // CHECK11-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to i32** 19118 // CHECK11-NEXT: store i32* [[TMP70]], i32** [[TMP86]], align 4 19119 // CHECK11-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 2 19120 // CHECK11-NEXT: store i8* null, i8** [[TMP87]], align 4 19121 // CHECK11-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 3 19122 // CHECK11-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to i32** 19123 // CHECK11-NEXT: store i32* [[TMP71]], i32** [[TMP89]], align 4 19124 // CHECK11-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 3 19125 // CHECK11-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to i32** 19126 // CHECK11-NEXT: store i32* [[TMP71]], i32** [[TMP91]], align 4 19127 // CHECK11-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 3 19128 // CHECK11-NEXT: store i8* null, i8** [[TMP92]], align 4 19129 // CHECK11-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 4 19130 // CHECK11-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to i32** 19131 // CHECK11-NEXT: store i32* [[TMP72]], i32** [[TMP94]], align 4 19132 // CHECK11-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 4 19133 // CHECK11-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to i32** 19134 // CHECK11-NEXT: store i32* [[TMP72]], i32** [[TMP96]], align 4 19135 // CHECK11-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 4 19136 // CHECK11-NEXT: store i8* null, i8** [[TMP97]], align 4 19137 // CHECK11-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 19138 // CHECK11-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 19139 // CHECK11-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 19140 // CHECK11-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_21]], align 4 19141 // CHECK11-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_21]], align 4 19142 // CHECK11-NEXT: [[SUB23:%.*]] = sub nsw i32 [[TMP101]], 0 19143 // CHECK11-NEXT: [[DIV24:%.*]] = sdiv i32 [[SUB23]], 1 19144 // CHECK11-NEXT: [[SUB25:%.*]] = sub nsw i32 [[DIV24]], 1 19145 // CHECK11-NEXT: store i32 [[SUB25]], i32* [[DOTCAPTURE_EXPR_22]], align 4 19146 // CHECK11-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_22]], align 4 19147 // CHECK11-NEXT: [[ADD26:%.*]] = add nsw i32 [[TMP102]], 1 19148 // CHECK11-NEXT: [[TMP103:%.*]] = zext i32 [[ADD26]] to i64 19149 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 19150 // CHECK11-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.36, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.37, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19151 // CHECK11-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 19152 // CHECK11-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED27:%.*]], label [[OMP_OFFLOAD_CONT28:%.*]] 19153 // CHECK11: omp_offload.failed27: 19154 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59(i32 [[TMP67]], i32 [[TMP69]], i32* [[TMP70]], i32* [[TMP71]], i32* [[TMP72]]) #[[ATTR2]] 19155 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT28]] 19156 // CHECK11: omp_offload.cont28: 19157 // CHECK11-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 19158 // CHECK11-NEXT: store i32 [[TMP106]], i32* [[N_CASTED29]], align 4 19159 // CHECK11-NEXT: [[TMP107:%.*]] = load i32, i32* [[N_CASTED29]], align 4 19160 // CHECK11-NEXT: [[TMP108:%.*]] = load i32*, i32** [[A]], align 4 19161 // CHECK11-NEXT: [[TMP109:%.*]] = load i32*, i32** [[B]], align 4 19162 // CHECK11-NEXT: [[TMP110:%.*]] = load i32*, i32** [[C]], align 4 19163 // CHECK11-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 19164 // CHECK11-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i32* 19165 // CHECK11-NEXT: store i32 [[TMP107]], i32* [[TMP112]], align 4 19166 // CHECK11-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 19167 // CHECK11-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i32* 19168 // CHECK11-NEXT: store i32 [[TMP107]], i32* [[TMP114]], align 4 19169 // CHECK11-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 0 19170 // CHECK11-NEXT: store i8* null, i8** [[TMP115]], align 4 19171 // CHECK11-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 1 19172 // CHECK11-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to i32** 19173 // CHECK11-NEXT: store i32* [[TMP108]], i32** [[TMP117]], align 4 19174 // CHECK11-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 1 19175 // CHECK11-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to i32** 19176 // CHECK11-NEXT: store i32* [[TMP108]], i32** [[TMP119]], align 4 19177 // CHECK11-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 1 19178 // CHECK11-NEXT: store i8* null, i8** [[TMP120]], align 4 19179 // CHECK11-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 2 19180 // CHECK11-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to i32** 19181 // CHECK11-NEXT: store i32* [[TMP109]], i32** [[TMP122]], align 4 19182 // CHECK11-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 2 19183 // CHECK11-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to i32** 19184 // CHECK11-NEXT: store i32* [[TMP109]], i32** [[TMP124]], align 4 19185 // CHECK11-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 2 19186 // CHECK11-NEXT: store i8* null, i8** [[TMP125]], align 4 19187 // CHECK11-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 3 19188 // CHECK11-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to i32** 19189 // CHECK11-NEXT: store i32* [[TMP110]], i32** [[TMP127]], align 4 19190 // CHECK11-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 3 19191 // CHECK11-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to i32** 19192 // CHECK11-NEXT: store i32* [[TMP110]], i32** [[TMP129]], align 4 19193 // CHECK11-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 3 19194 // CHECK11-NEXT: store i8* null, i8** [[TMP130]], align 4 19195 // CHECK11-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 19196 // CHECK11-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 19197 // CHECK11-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 19198 // CHECK11-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_34]], align 4 19199 // CHECK11-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_34]], align 4 19200 // CHECK11-NEXT: [[SUB36:%.*]] = sub nsw i32 [[TMP134]], 0 19201 // CHECK11-NEXT: [[DIV37:%.*]] = sdiv i32 [[SUB36]], 1 19202 // CHECK11-NEXT: [[SUB38:%.*]] = sub nsw i32 [[DIV37]], 1 19203 // CHECK11-NEXT: store i32 [[SUB38]], i32* [[DOTCAPTURE_EXPR_35]], align 4 19204 // CHECK11-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_35]], align 4 19205 // CHECK11-NEXT: [[ADD39:%.*]] = add nsw i32 [[TMP135]], 1 19206 // CHECK11-NEXT: [[TMP136:%.*]] = zext i32 [[ADD39]] to i64 19207 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 19208 // CHECK11-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.40, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.41, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19209 // CHECK11-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 19210 // CHECK11-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED40:%.*]], label [[OMP_OFFLOAD_CONT41:%.*]] 19211 // CHECK11: omp_offload.failed40: 19212 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67(i32 [[TMP107]], i32* [[TMP108]], i32* [[TMP109]], i32* [[TMP110]]) #[[ATTR2]] 19213 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT41]] 19214 // CHECK11: omp_offload.cont41: 19215 // CHECK11-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 19216 // CHECK11-NEXT: store i32 [[TMP139]], i32* [[CH_CASTED42]], align 4 19217 // CHECK11-NEXT: [[TMP140:%.*]] = load i32, i32* [[CH_CASTED42]], align 4 19218 // CHECK11-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 19219 // CHECK11-NEXT: store i32 [[TMP141]], i32* [[N_CASTED43]], align 4 19220 // CHECK11-NEXT: [[TMP142:%.*]] = load i32, i32* [[N_CASTED43]], align 4 19221 // CHECK11-NEXT: [[TMP143:%.*]] = load i32*, i32** [[A]], align 4 19222 // CHECK11-NEXT: [[TMP144:%.*]] = load i32*, i32** [[B]], align 4 19223 // CHECK11-NEXT: [[TMP145:%.*]] = load i32*, i32** [[C]], align 4 19224 // CHECK11-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 19225 // CHECK11-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i32* 19226 // CHECK11-NEXT: store i32 [[TMP140]], i32* [[TMP147]], align 4 19227 // CHECK11-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 19228 // CHECK11-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i32* 19229 // CHECK11-NEXT: store i32 [[TMP140]], i32* [[TMP149]], align 4 19230 // CHECK11-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 0 19231 // CHECK11-NEXT: store i8* null, i8** [[TMP150]], align 4 19232 // CHECK11-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 1 19233 // CHECK11-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i32* 19234 // CHECK11-NEXT: store i32 [[TMP142]], i32* [[TMP152]], align 4 19235 // CHECK11-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 1 19236 // CHECK11-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i32* 19237 // CHECK11-NEXT: store i32 [[TMP142]], i32* [[TMP154]], align 4 19238 // CHECK11-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 1 19239 // CHECK11-NEXT: store i8* null, i8** [[TMP155]], align 4 19240 // CHECK11-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 2 19241 // CHECK11-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to i32** 19242 // CHECK11-NEXT: store i32* [[TMP143]], i32** [[TMP157]], align 4 19243 // CHECK11-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 2 19244 // CHECK11-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to i32** 19245 // CHECK11-NEXT: store i32* [[TMP143]], i32** [[TMP159]], align 4 19246 // CHECK11-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 2 19247 // CHECK11-NEXT: store i8* null, i8** [[TMP160]], align 4 19248 // CHECK11-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 3 19249 // CHECK11-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to i32** 19250 // CHECK11-NEXT: store i32* [[TMP144]], i32** [[TMP162]], align 4 19251 // CHECK11-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 3 19252 // CHECK11-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to i32** 19253 // CHECK11-NEXT: store i32* [[TMP144]], i32** [[TMP164]], align 4 19254 // CHECK11-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 3 19255 // CHECK11-NEXT: store i8* null, i8** [[TMP165]], align 4 19256 // CHECK11-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 4 19257 // CHECK11-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to i32** 19258 // CHECK11-NEXT: store i32* [[TMP145]], i32** [[TMP167]], align 4 19259 // CHECK11-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 4 19260 // CHECK11-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to i32** 19261 // CHECK11-NEXT: store i32* [[TMP145]], i32** [[TMP169]], align 4 19262 // CHECK11-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 4 19263 // CHECK11-NEXT: store i8* null, i8** [[TMP170]], align 4 19264 // CHECK11-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 19265 // CHECK11-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 19266 // CHECK11-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 19267 // CHECK11-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_48]], align 4 19268 // CHECK11-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_48]], align 4 19269 // CHECK11-NEXT: [[SUB50:%.*]] = sub nsw i32 [[TMP174]], 0 19270 // CHECK11-NEXT: [[DIV51:%.*]] = sdiv i32 [[SUB50]], 1 19271 // CHECK11-NEXT: [[SUB52:%.*]] = sub nsw i32 [[DIV51]], 1 19272 // CHECK11-NEXT: store i32 [[SUB52]], i32* [[DOTCAPTURE_EXPR_49]], align 4 19273 // CHECK11-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_49]], align 4 19274 // CHECK11-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP175]], 1 19275 // CHECK11-NEXT: [[TMP176:%.*]] = zext i32 [[ADD53]] to i64 19276 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 19277 // CHECK11-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.44, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.45, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19278 // CHECK11-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 19279 // CHECK11-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED54:%.*]], label [[OMP_OFFLOAD_CONT55:%.*]] 19280 // CHECK11: omp_offload.failed54: 19281 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75(i32 [[TMP140]], i32 [[TMP142]], i32* [[TMP143]], i32* [[TMP144]], i32* [[TMP145]]) #[[ATTR2]] 19282 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT55]] 19283 // CHECK11: omp_offload.cont55: 19284 // CHECK11-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 19285 // CHECK11-NEXT: store i32 [[TMP179]], i32* [[N_CASTED56]], align 4 19286 // CHECK11-NEXT: [[TMP180:%.*]] = load i32, i32* [[N_CASTED56]], align 4 19287 // CHECK11-NEXT: [[TMP181:%.*]] = load i32*, i32** [[A]], align 4 19288 // CHECK11-NEXT: [[TMP182:%.*]] = load i32*, i32** [[B]], align 4 19289 // CHECK11-NEXT: [[TMP183:%.*]] = load i32*, i32** [[C]], align 4 19290 // CHECK11-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 19291 // CHECK11-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i32* 19292 // CHECK11-NEXT: store i32 [[TMP180]], i32* [[TMP185]], align 4 19293 // CHECK11-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 19294 // CHECK11-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i32* 19295 // CHECK11-NEXT: store i32 [[TMP180]], i32* [[TMP187]], align 4 19296 // CHECK11-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 0 19297 // CHECK11-NEXT: store i8* null, i8** [[TMP188]], align 4 19298 // CHECK11-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 1 19299 // CHECK11-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to i32** 19300 // CHECK11-NEXT: store i32* [[TMP181]], i32** [[TMP190]], align 4 19301 // CHECK11-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 1 19302 // CHECK11-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to i32** 19303 // CHECK11-NEXT: store i32* [[TMP181]], i32** [[TMP192]], align 4 19304 // CHECK11-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 1 19305 // CHECK11-NEXT: store i8* null, i8** [[TMP193]], align 4 19306 // CHECK11-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 2 19307 // CHECK11-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to i32** 19308 // CHECK11-NEXT: store i32* [[TMP182]], i32** [[TMP195]], align 4 19309 // CHECK11-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 2 19310 // CHECK11-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to i32** 19311 // CHECK11-NEXT: store i32* [[TMP182]], i32** [[TMP197]], align 4 19312 // CHECK11-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 2 19313 // CHECK11-NEXT: store i8* null, i8** [[TMP198]], align 4 19314 // CHECK11-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 3 19315 // CHECK11-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to i32** 19316 // CHECK11-NEXT: store i32* [[TMP183]], i32** [[TMP200]], align 4 19317 // CHECK11-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 3 19318 // CHECK11-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to i32** 19319 // CHECK11-NEXT: store i32* [[TMP183]], i32** [[TMP202]], align 4 19320 // CHECK11-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 3 19321 // CHECK11-NEXT: store i8* null, i8** [[TMP203]], align 4 19322 // CHECK11-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 19323 // CHECK11-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 19324 // CHECK11-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 19325 // CHECK11-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_61]], align 4 19326 // CHECK11-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_61]], align 4 19327 // CHECK11-NEXT: [[SUB63:%.*]] = sub nsw i32 [[TMP207]], 0 19328 // CHECK11-NEXT: [[DIV64:%.*]] = sdiv i32 [[SUB63]], 1 19329 // CHECK11-NEXT: [[SUB65:%.*]] = sub nsw i32 [[DIV64]], 1 19330 // CHECK11-NEXT: store i32 [[SUB65]], i32* [[DOTCAPTURE_EXPR_62]], align 4 19331 // CHECK11-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_62]], align 4 19332 // CHECK11-NEXT: [[ADD66:%.*]] = add nsw i32 [[TMP208]], 1 19333 // CHECK11-NEXT: [[TMP209:%.*]] = zext i32 [[ADD66]] to i64 19334 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 19335 // CHECK11-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.48, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.49, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19336 // CHECK11-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 19337 // CHECK11-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED67:%.*]], label [[OMP_OFFLOAD_CONT68:%.*]] 19338 // CHECK11: omp_offload.failed67: 19339 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83(i32 [[TMP180]], i32* [[TMP181]], i32* [[TMP182]], i32* [[TMP183]]) #[[ATTR2]] 19340 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT68]] 19341 // CHECK11: omp_offload.cont68: 19342 // CHECK11-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 19343 // CHECK11-NEXT: store i32 [[TMP212]], i32* [[CH_CASTED69]], align 4 19344 // CHECK11-NEXT: [[TMP213:%.*]] = load i32, i32* [[CH_CASTED69]], align 4 19345 // CHECK11-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 19346 // CHECK11-NEXT: store i32 [[TMP214]], i32* [[N_CASTED70]], align 4 19347 // CHECK11-NEXT: [[TMP215:%.*]] = load i32, i32* [[N_CASTED70]], align 4 19348 // CHECK11-NEXT: [[TMP216:%.*]] = load i32*, i32** [[A]], align 4 19349 // CHECK11-NEXT: [[TMP217:%.*]] = load i32*, i32** [[B]], align 4 19350 // CHECK11-NEXT: [[TMP218:%.*]] = load i32*, i32** [[C]], align 4 19351 // CHECK11-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 19352 // CHECK11-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i32* 19353 // CHECK11-NEXT: store i32 [[TMP213]], i32* [[TMP220]], align 4 19354 // CHECK11-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 19355 // CHECK11-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i32* 19356 // CHECK11-NEXT: store i32 [[TMP213]], i32* [[TMP222]], align 4 19357 // CHECK11-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 0 19358 // CHECK11-NEXT: store i8* null, i8** [[TMP223]], align 4 19359 // CHECK11-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 1 19360 // CHECK11-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i32* 19361 // CHECK11-NEXT: store i32 [[TMP215]], i32* [[TMP225]], align 4 19362 // CHECK11-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 1 19363 // CHECK11-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i32* 19364 // CHECK11-NEXT: store i32 [[TMP215]], i32* [[TMP227]], align 4 19365 // CHECK11-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 1 19366 // CHECK11-NEXT: store i8* null, i8** [[TMP228]], align 4 19367 // CHECK11-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 2 19368 // CHECK11-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to i32** 19369 // CHECK11-NEXT: store i32* [[TMP216]], i32** [[TMP230]], align 4 19370 // CHECK11-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 2 19371 // CHECK11-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to i32** 19372 // CHECK11-NEXT: store i32* [[TMP216]], i32** [[TMP232]], align 4 19373 // CHECK11-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 2 19374 // CHECK11-NEXT: store i8* null, i8** [[TMP233]], align 4 19375 // CHECK11-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 3 19376 // CHECK11-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to i32** 19377 // CHECK11-NEXT: store i32* [[TMP217]], i32** [[TMP235]], align 4 19378 // CHECK11-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 3 19379 // CHECK11-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to i32** 19380 // CHECK11-NEXT: store i32* [[TMP217]], i32** [[TMP237]], align 4 19381 // CHECK11-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 3 19382 // CHECK11-NEXT: store i8* null, i8** [[TMP238]], align 4 19383 // CHECK11-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 4 19384 // CHECK11-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to i32** 19385 // CHECK11-NEXT: store i32* [[TMP218]], i32** [[TMP240]], align 4 19386 // CHECK11-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 4 19387 // CHECK11-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to i32** 19388 // CHECK11-NEXT: store i32* [[TMP218]], i32** [[TMP242]], align 4 19389 // CHECK11-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 4 19390 // CHECK11-NEXT: store i8* null, i8** [[TMP243]], align 4 19391 // CHECK11-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 19392 // CHECK11-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 19393 // CHECK11-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 19394 // CHECK11-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_75]], align 4 19395 // CHECK11-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_75]], align 4 19396 // CHECK11-NEXT: [[SUB77:%.*]] = sub nsw i32 [[TMP247]], 0 19397 // CHECK11-NEXT: [[DIV78:%.*]] = sdiv i32 [[SUB77]], 1 19398 // CHECK11-NEXT: [[SUB79:%.*]] = sub nsw i32 [[DIV78]], 1 19399 // CHECK11-NEXT: store i32 [[SUB79]], i32* [[DOTCAPTURE_EXPR_76]], align 4 19400 // CHECK11-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_76]], align 4 19401 // CHECK11-NEXT: [[ADD80:%.*]] = add nsw i32 [[TMP248]], 1 19402 // CHECK11-NEXT: [[TMP249:%.*]] = zext i32 [[ADD80]] to i64 19403 // CHECK11-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 19404 // CHECK11-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.52, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.53, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 19405 // CHECK11-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 19406 // CHECK11-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED81:%.*]], label [[OMP_OFFLOAD_CONT82:%.*]] 19407 // CHECK11: omp_offload.failed81: 19408 // CHECK11-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91(i32 [[TMP213]], i32 [[TMP215]], i32* [[TMP216]], i32* [[TMP217]], i32* [[TMP218]]) #[[ATTR2]] 19409 // CHECK11-NEXT: br label [[OMP_OFFLOAD_CONT82]] 19410 // CHECK11: omp_offload.cont82: 19411 // CHECK11-NEXT: ret i32 0 19412 // 19413 // 19414 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42 19415 // CHECK11-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 19416 // CHECK11-NEXT: entry: 19417 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 19418 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 19419 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 19420 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 19421 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 19422 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 19423 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 19424 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 19425 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..26 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 19426 // CHECK11-NEXT: ret void 19427 // 19428 // 19429 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..26 19430 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 19431 // CHECK11-NEXT: entry: 19432 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 19433 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 19434 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 19435 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 19436 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 19437 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 19438 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 19439 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 19440 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 19441 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 19442 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 19443 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 19444 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 19445 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 19446 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 19447 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 19448 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 19449 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 19450 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 19451 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 19452 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 19453 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 19454 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 19455 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 19456 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 19457 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 19458 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 19459 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 19460 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19461 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 19462 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19463 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19464 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19465 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 19466 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19467 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 19468 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 19469 // CHECK11: omp.precond.then: 19470 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 19471 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19472 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 19473 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 19474 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 19475 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19476 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 19477 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 19478 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19479 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19480 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 19481 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 19482 // CHECK11: cond.true: 19483 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19484 // CHECK11-NEXT: br label [[COND_END:%.*]] 19485 // CHECK11: cond.false: 19486 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19487 // CHECK11-NEXT: br label [[COND_END]] 19488 // CHECK11: cond.end: 19489 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 19490 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 19491 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19492 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 19493 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 19494 // CHECK11: omp.inner.for.cond: 19495 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19496 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19497 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 19498 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 19499 // CHECK11: omp.inner.for.body: 19500 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19501 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19502 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..27 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 19503 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 19504 // CHECK11: omp.inner.for.inc: 19505 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19506 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 19507 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 19508 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 19509 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 19510 // CHECK11: omp.inner.for.end: 19511 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 19512 // CHECK11: omp.loop.exit: 19513 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19514 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 19515 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 19516 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 19517 // CHECK11: omp.precond.end: 19518 // CHECK11-NEXT: ret void 19519 // 19520 // 19521 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..27 19522 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 19523 // CHECK11-NEXT: entry: 19524 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 19525 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 19526 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 19527 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 19528 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 19529 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 19530 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 19531 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 19532 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 19533 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 19534 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 19535 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 19536 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 19537 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 19538 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 19539 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 19540 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 19541 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 19542 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 19543 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 19544 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 19545 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 19546 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 19547 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 19548 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 19549 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 19550 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 19551 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 19552 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 19553 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 19554 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 19555 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 19556 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19557 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 19558 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19559 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19560 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19561 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 19562 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19563 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 19564 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 19565 // CHECK11: omp.precond.then: 19566 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 19567 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19568 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 19569 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 19570 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 19571 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 19572 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 19573 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 19574 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 19575 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19576 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 19577 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 19578 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19579 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19580 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 19581 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 19582 // CHECK11: cond.true: 19583 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19584 // CHECK11-NEXT: br label [[COND_END:%.*]] 19585 // CHECK11: cond.false: 19586 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19587 // CHECK11-NEXT: br label [[COND_END]] 19588 // CHECK11: cond.end: 19589 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 19590 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 19591 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 19592 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 19593 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 19594 // CHECK11: omp.inner.for.cond: 19595 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19596 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19597 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 19598 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 19599 // CHECK11: omp.inner.for.body: 19600 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19601 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 19602 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 19603 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 19604 // CHECK11-NEXT: [[TMP20:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19605 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[TMP20]], align 4 19606 // CHECK11-NEXT: [[TMP22:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* @[[GLOB3]], i32 [[TMP21]], i32 2) 19607 // CHECK11-NEXT: [[TMP23:%.*]] = icmp ne i32 [[TMP22]], 0 19608 // CHECK11-NEXT: br i1 [[TMP23]], label [[DOTCANCEL_EXIT:%.*]], label [[DOTCANCEL_CONTINUE:%.*]] 19609 // CHECK11: .cancel.exit: 19610 // CHECK11-NEXT: br label [[CANCEL_EXIT:%.*]] 19611 // CHECK11: .cancel.continue: 19612 // CHECK11-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP2]], align 4 19613 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4 19614 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 19615 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 19616 // CHECK11-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP3]], align 4 19617 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4 19618 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 19619 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 19620 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 19621 // CHECK11-NEXT: [[TMP30:%.*]] = load i32*, i32** [[TMP1]], align 4 19622 // CHECK11-NEXT: [[TMP31:%.*]] = load i32, i32* [[I3]], align 4 19623 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i32 [[TMP31]] 19624 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 19625 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 19626 // CHECK11: omp.body.continue: 19627 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 19628 // CHECK11: omp.inner.for.inc: 19629 // CHECK11-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19630 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 19631 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 19632 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 19633 // CHECK11: omp.inner.for.end: 19634 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 19635 // CHECK11: omp.loop.exit: 19636 // CHECK11-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19637 // CHECK11-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 19638 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 19639 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 19640 // CHECK11: cancel.exit: 19641 // CHECK11-NEXT: [[TMP35:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19642 // CHECK11-NEXT: [[TMP36:%.*]] = load i32, i32* [[TMP35]], align 4 19643 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP36]]) 19644 // CHECK11-NEXT: br label [[CANCEL_CONT:%.*]] 19645 // CHECK11: omp.precond.end: 19646 // CHECK11-NEXT: br label [[CANCEL_CONT]] 19647 // CHECK11: cancel.cont: 19648 // CHECK11-NEXT: ret void 19649 // 19650 // 19651 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51 19652 // CHECK11-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 19653 // CHECK11-NEXT: entry: 19654 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 19655 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 19656 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 19657 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 19658 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 19659 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 19660 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 19661 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 19662 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 19663 // CHECK11-NEXT: ret void 19664 // 19665 // 19666 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..30 19667 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 19668 // CHECK11-NEXT: entry: 19669 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 19670 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 19671 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 19672 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 19673 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 19674 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 19675 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 19676 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 19677 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 19678 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 19679 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 19680 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 19681 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 19682 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 19683 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 19684 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 19685 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 19686 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 19687 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 19688 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 19689 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 19690 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 19691 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 19692 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 19693 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 19694 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 19695 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 19696 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 19697 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19698 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 19699 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19700 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19701 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19702 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 19703 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19704 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 19705 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 19706 // CHECK11: omp.precond.then: 19707 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 19708 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19709 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 19710 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 19711 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 19712 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19713 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 19714 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 19715 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19716 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19717 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 19718 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 19719 // CHECK11: cond.true: 19720 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19721 // CHECK11-NEXT: br label [[COND_END:%.*]] 19722 // CHECK11: cond.false: 19723 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19724 // CHECK11-NEXT: br label [[COND_END]] 19725 // CHECK11: cond.end: 19726 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 19727 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 19728 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19729 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 19730 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 19731 // CHECK11: omp.inner.for.cond: 19732 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19733 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19734 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 19735 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 19736 // CHECK11: omp.inner.for.body: 19737 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19738 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19739 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 19740 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 19741 // CHECK11: omp.inner.for.inc: 19742 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19743 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 19744 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 19745 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 19746 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 19747 // CHECK11: omp.inner.for.end: 19748 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 19749 // CHECK11: omp.loop.exit: 19750 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19751 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 19752 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 19753 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 19754 // CHECK11: omp.precond.end: 19755 // CHECK11-NEXT: ret void 19756 // 19757 // 19758 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..31 19759 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 19760 // CHECK11-NEXT: entry: 19761 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 19762 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 19763 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 19764 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 19765 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 19766 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 19767 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 19768 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 19769 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 19770 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 19771 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 19772 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 19773 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 19774 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 19775 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 19776 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 19777 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 19778 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 19779 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 19780 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 19781 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 19782 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 19783 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 19784 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 19785 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 19786 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 19787 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 19788 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 19789 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 19790 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 19791 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 19792 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 19793 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19794 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 19795 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19796 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19797 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19798 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 19799 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19800 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 19801 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 19802 // CHECK11: omp.precond.then: 19803 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 19804 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19805 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 19806 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 19807 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 19808 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 19809 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 19810 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 19811 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 19812 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19813 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 19814 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 19815 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19816 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19817 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 19818 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 19819 // CHECK11: cond.true: 19820 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19821 // CHECK11-NEXT: br label [[COND_END:%.*]] 19822 // CHECK11: cond.false: 19823 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19824 // CHECK11-NEXT: br label [[COND_END]] 19825 // CHECK11: cond.end: 19826 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 19827 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 19828 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 19829 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 19830 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 19831 // CHECK11: omp.inner.for.cond: 19832 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19833 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 19834 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 19835 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 19836 // CHECK11: omp.inner.for.body: 19837 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19838 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 19839 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 19840 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 19841 // CHECK11-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 19842 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 19843 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 19844 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 19845 // CHECK11-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 19846 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 19847 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 19848 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 19849 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 19850 // CHECK11-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 19851 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 19852 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 19853 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 19854 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 19855 // CHECK11: omp.body.continue: 19856 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 19857 // CHECK11: omp.inner.for.inc: 19858 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19859 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 19860 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 19861 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 19862 // CHECK11: omp.inner.for.end: 19863 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 19864 // CHECK11: omp.loop.exit: 19865 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19866 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 19867 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 19868 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 19869 // CHECK11: omp.precond.end: 19870 // CHECK11-NEXT: ret void 19871 // 19872 // 19873 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59 19874 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 19875 // CHECK11-NEXT: entry: 19876 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 19877 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 19878 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 19879 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 19880 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 19881 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 19882 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 19883 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 19884 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 19885 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 19886 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 19887 // CHECK11-NEXT: ret void 19888 // 19889 // 19890 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..34 19891 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 19892 // CHECK11-NEXT: entry: 19893 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 19894 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 19895 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 19896 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 19897 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 19898 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 19899 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 19900 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 19901 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 19902 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 19903 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 19904 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 19905 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 19906 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 19907 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 19908 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 19909 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 19910 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 19911 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 19912 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 19913 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 19914 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 19915 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 19916 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 19917 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 19918 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 19919 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 19920 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 19921 // CHECK11-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 19922 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 19923 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 19924 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19925 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 19926 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 19927 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 19928 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 19929 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 19930 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 19931 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 19932 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 19933 // CHECK11: omp.precond.then: 19934 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 19935 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19936 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 19937 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 19938 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 19939 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 19940 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 19941 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 19942 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 19943 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19944 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19945 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 19946 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 19947 // CHECK11: cond.true: 19948 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19949 // CHECK11-NEXT: br label [[COND_END:%.*]] 19950 // CHECK11: cond.false: 19951 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19952 // CHECK11-NEXT: br label [[COND_END]] 19953 // CHECK11: cond.end: 19954 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 19955 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 19956 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19957 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 19958 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 19959 // CHECK11: omp.inner.for.cond: 19960 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19961 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19962 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 19963 // CHECK11-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 19964 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 19965 // CHECK11: omp.inner.for.body: 19966 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19967 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19968 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]]) 19969 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 19970 // CHECK11: omp.inner.for.inc: 19971 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 19972 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 19973 // CHECK11-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 19974 // CHECK11-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 19975 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19976 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 19977 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 19978 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 19979 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19980 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 19981 // CHECK11-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 19982 // CHECK11-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 19983 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19984 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19985 // CHECK11-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 19986 // CHECK11-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 19987 // CHECK11: cond.true10: 19988 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 19989 // CHECK11-NEXT: br label [[COND_END12:%.*]] 19990 // CHECK11: cond.false11: 19991 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 19992 // CHECK11-NEXT: br label [[COND_END12]] 19993 // CHECK11: cond.end12: 19994 // CHECK11-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 19995 // CHECK11-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 19996 // CHECK11-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 19997 // CHECK11-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 19998 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 19999 // CHECK11: omp.inner.for.end: 20000 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20001 // CHECK11: omp.loop.exit: 20002 // CHECK11-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20003 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 20004 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 20005 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20006 // CHECK11: omp.precond.end: 20007 // CHECK11-NEXT: ret void 20008 // 20009 // 20010 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..35 20011 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20012 // CHECK11-NEXT: entry: 20013 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20014 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20015 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 20016 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 20017 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20018 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20019 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20020 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20021 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20022 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20023 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20024 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20025 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20026 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 20027 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 20028 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20029 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20030 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 20031 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20032 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20033 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20034 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20035 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20036 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20037 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20038 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20039 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20040 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20041 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20042 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20043 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20044 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 20045 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20046 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20047 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20048 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 20049 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20050 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20051 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20052 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20053 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20054 // CHECK11: omp.precond.then: 20055 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 20056 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20057 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 20058 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20059 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20060 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 20061 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 20062 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20063 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20064 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20065 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 20066 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20067 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20068 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20069 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 20070 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20071 // CHECK11: cond.true: 20072 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20073 // CHECK11-NEXT: br label [[COND_END:%.*]] 20074 // CHECK11: cond.false: 20075 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20076 // CHECK11-NEXT: br label [[COND_END]] 20077 // CHECK11: cond.end: 20078 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 20079 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 20080 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20081 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 20082 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20083 // CHECK11: omp.inner.for.cond: 20084 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20085 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20086 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 20087 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20088 // CHECK11: omp.inner.for.body: 20089 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20090 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 20091 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 20092 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 20093 // CHECK11-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 20094 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 20095 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 20096 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 20097 // CHECK11-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 20098 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 20099 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 20100 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 20101 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 20102 // CHECK11-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 20103 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 20104 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 20105 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 20106 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 20107 // CHECK11: omp.body.continue: 20108 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20109 // CHECK11: omp.inner.for.inc: 20110 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20111 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 20112 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 20113 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20114 // CHECK11: omp.inner.for.end: 20115 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20116 // CHECK11: omp.loop.exit: 20117 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20118 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 20119 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 20120 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20121 // CHECK11: omp.precond.end: 20122 // CHECK11-NEXT: ret void 20123 // 20124 // 20125 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67 20126 // CHECK11-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 20127 // CHECK11-NEXT: entry: 20128 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 20129 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 20130 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 20131 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 20132 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 20133 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 20134 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 20135 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 20136 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..38 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 20137 // CHECK11-NEXT: ret void 20138 // 20139 // 20140 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..38 20141 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20142 // CHECK11-NEXT: entry: 20143 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20144 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20145 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20146 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20147 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20148 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20149 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20150 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20151 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20152 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20153 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20154 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 20155 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 20156 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20157 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20158 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 20159 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20160 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20161 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20162 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20163 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20164 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20165 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20166 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20167 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20168 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20169 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20170 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 20171 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20172 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20173 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20174 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 20175 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20176 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20177 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20178 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20179 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20180 // CHECK11: omp.precond.then: 20181 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 20182 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20183 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 20184 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20185 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20186 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20187 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 20188 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20189 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20190 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20191 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 20192 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20193 // CHECK11: cond.true: 20194 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20195 // CHECK11-NEXT: br label [[COND_END:%.*]] 20196 // CHECK11: cond.false: 20197 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20198 // CHECK11-NEXT: br label [[COND_END]] 20199 // CHECK11: cond.end: 20200 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 20201 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 20202 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20203 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 20204 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20205 // CHECK11: omp.inner.for.cond: 20206 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20207 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20208 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 20209 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20210 // CHECK11: omp.inner.for.body: 20211 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20212 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20213 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 20214 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20215 // CHECK11: omp.inner.for.inc: 20216 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20217 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20218 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 20219 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 20220 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20221 // CHECK11: omp.inner.for.end: 20222 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20223 // CHECK11: omp.loop.exit: 20224 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20225 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 20226 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 20227 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20228 // CHECK11: omp.precond.end: 20229 // CHECK11-NEXT: ret void 20230 // 20231 // 20232 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..39 20233 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20234 // CHECK11-NEXT: entry: 20235 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20236 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20237 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 20238 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 20239 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20240 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20241 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20242 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20243 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20244 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20245 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20246 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20247 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20248 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 20249 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 20250 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20251 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20252 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 20253 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20254 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20255 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20256 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20257 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20258 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20259 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20260 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20261 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20262 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20263 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20264 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20265 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20266 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 20267 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20268 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20269 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20270 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 20271 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20272 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20273 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20274 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20275 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20276 // CHECK11: omp.precond.then: 20277 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 20278 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20279 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 20280 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20281 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20282 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 20283 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 20284 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20285 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20286 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20287 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 20288 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20289 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20290 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20291 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 20292 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20293 // CHECK11: cond.true: 20294 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20295 // CHECK11-NEXT: br label [[COND_END:%.*]] 20296 // CHECK11: cond.false: 20297 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20298 // CHECK11-NEXT: br label [[COND_END]] 20299 // CHECK11: cond.end: 20300 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 20301 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 20302 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20303 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 20304 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20305 // CHECK11: omp.inner.for.cond: 20306 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20307 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20308 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 20309 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20310 // CHECK11: omp.inner.for.body: 20311 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20312 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 20313 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 20314 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 20315 // CHECK11-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 20316 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 20317 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 20318 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 20319 // CHECK11-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 20320 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 20321 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 20322 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 20323 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 20324 // CHECK11-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 20325 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 20326 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 20327 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 20328 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 20329 // CHECK11: omp.body.continue: 20330 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20331 // CHECK11: omp.inner.for.inc: 20332 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20333 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 20334 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 20335 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20336 // CHECK11: omp.inner.for.end: 20337 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20338 // CHECK11: omp.loop.exit: 20339 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20340 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 20341 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 20342 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20343 // CHECK11: omp.precond.end: 20344 // CHECK11-NEXT: ret void 20345 // 20346 // 20347 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75 20348 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 20349 // CHECK11-NEXT: entry: 20350 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 20351 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 20352 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 20353 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 20354 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 20355 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 20356 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 20357 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 20358 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 20359 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 20360 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..42 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 20361 // CHECK11-NEXT: ret void 20362 // 20363 // 20364 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..42 20365 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20366 // CHECK11-NEXT: entry: 20367 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20368 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20369 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 20370 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20371 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20372 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20373 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20374 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20375 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20376 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20377 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20378 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 20379 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20380 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 20381 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 20382 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20383 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20384 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 20385 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 20386 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20387 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20388 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 20389 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20390 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20391 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20392 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20393 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 20394 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20395 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20396 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20397 // CHECK11-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20398 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 20399 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 20400 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 20401 // CHECK11-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20402 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20403 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 20404 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20405 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 20406 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 20407 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20408 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20409 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 20410 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20411 // CHECK11: omp.precond.then: 20412 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 20413 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20414 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 20415 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20416 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20417 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20418 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 20419 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20420 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20421 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20422 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 20423 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20424 // CHECK11: cond.true: 20425 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20426 // CHECK11-NEXT: br label [[COND_END:%.*]] 20427 // CHECK11: cond.false: 20428 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20429 // CHECK11-NEXT: br label [[COND_END]] 20430 // CHECK11: cond.end: 20431 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 20432 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 20433 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20434 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 20435 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20436 // CHECK11: omp.inner.for.cond: 20437 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20438 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20439 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 20440 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20441 // CHECK11: omp.inner.for.body: 20442 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20443 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20444 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20445 // CHECK11-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 20446 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 20447 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**, i32)* @.omp_outlined..43 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i32 [[TMP22]]) 20448 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20449 // CHECK11: omp.inner.for.inc: 20450 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20451 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20452 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 20453 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 20454 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20455 // CHECK11: omp.inner.for.end: 20456 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20457 // CHECK11: omp.loop.exit: 20458 // CHECK11-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20459 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 20460 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 20461 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20462 // CHECK11: omp.precond.end: 20463 // CHECK11-NEXT: ret void 20464 // 20465 // 20466 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..43 20467 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 20468 // CHECK11-NEXT: entry: 20469 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20470 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20471 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 20472 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 20473 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20474 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20475 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20476 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20477 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 20478 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20479 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20480 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20481 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 20482 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20483 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 20484 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 20485 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20486 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20487 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 20488 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20489 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20490 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20491 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20492 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20493 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20494 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20495 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20496 // CHECK11-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 20497 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20498 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20499 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20500 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20501 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20502 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20503 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20504 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20505 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20506 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 20507 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 20508 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20509 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20510 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20511 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20512 // CHECK11: omp.precond.then: 20513 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 20514 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20515 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 20516 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20517 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20518 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 20519 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 20520 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20521 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20522 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 20523 // CHECK11-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20524 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 20525 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 20526 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 20527 // CHECK11: omp.dispatch.cond: 20528 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20529 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20530 // CHECK11-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 20531 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20532 // CHECK11: cond.true: 20533 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20534 // CHECK11-NEXT: br label [[COND_END:%.*]] 20535 // CHECK11: cond.false: 20536 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20537 // CHECK11-NEXT: br label [[COND_END]] 20538 // CHECK11: cond.end: 20539 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 20540 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 20541 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20542 // CHECK11-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 20543 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20544 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20545 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 20546 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 20547 // CHECK11: omp.dispatch.body: 20548 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20549 // CHECK11: omp.inner.for.cond: 20550 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20551 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20552 // CHECK11-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 20553 // CHECK11-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20554 // CHECK11: omp.inner.for.body: 20555 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20556 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 20557 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 20558 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 20559 // CHECK11-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP2]], align 4 20560 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 20561 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 20562 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 20563 // CHECK11-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP3]], align 4 20564 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 20565 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 20566 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 20567 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP25]], [[TMP28]] 20568 // CHECK11-NEXT: [[TMP29:%.*]] = load i32*, i32** [[TMP1]], align 4 20569 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 20570 // CHECK11-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP29]], i32 [[TMP30]] 20571 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX10]], align 4 20572 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 20573 // CHECK11: omp.body.continue: 20574 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20575 // CHECK11: omp.inner.for.inc: 20576 // CHECK11-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20577 // CHECK11-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP31]], 1 20578 // CHECK11-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 20579 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20580 // CHECK11: omp.inner.for.end: 20581 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 20582 // CHECK11: omp.dispatch.inc: 20583 // CHECK11-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20584 // CHECK11-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20585 // CHECK11-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 20586 // CHECK11-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 20587 // CHECK11-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20588 // CHECK11-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20589 // CHECK11-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 20590 // CHECK11-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 20591 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 20592 // CHECK11: omp.dispatch.end: 20593 // CHECK11-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20594 // CHECK11-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 20595 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 20596 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20597 // CHECK11: omp.precond.end: 20598 // CHECK11-NEXT: ret void 20599 // 20600 // 20601 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83 20602 // CHECK11-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 20603 // CHECK11-NEXT: entry: 20604 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 20605 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 20606 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 20607 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 20608 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 20609 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 20610 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 20611 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 20612 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..46 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 20613 // CHECK11-NEXT: ret void 20614 // 20615 // 20616 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..46 20617 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20618 // CHECK11-NEXT: entry: 20619 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20620 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20621 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20622 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20623 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20624 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20625 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20626 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20627 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20628 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20629 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20630 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 20631 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 20632 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20633 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20634 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 20635 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20636 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20637 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20638 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20639 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20640 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20641 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20642 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20643 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20644 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20645 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20646 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 20647 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20648 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20649 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20650 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 20651 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20652 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20653 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20654 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20655 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20656 // CHECK11: omp.precond.then: 20657 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 20658 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20659 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 20660 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20661 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20662 // CHECK11-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20663 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 20664 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20665 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20666 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20667 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 20668 // CHECK11-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20669 // CHECK11: cond.true: 20670 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20671 // CHECK11-NEXT: br label [[COND_END:%.*]] 20672 // CHECK11: cond.false: 20673 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20674 // CHECK11-NEXT: br label [[COND_END]] 20675 // CHECK11: cond.end: 20676 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 20677 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 20678 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20679 // CHECK11-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 20680 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20681 // CHECK11: omp.inner.for.cond: 20682 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20683 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20684 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 20685 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20686 // CHECK11: omp.inner.for.body: 20687 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20688 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20689 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..47 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 20690 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20691 // CHECK11: omp.inner.for.inc: 20692 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20693 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20694 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 20695 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 20696 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20697 // CHECK11: omp.inner.for.end: 20698 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20699 // CHECK11: omp.loop.exit: 20700 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20701 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 20702 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 20703 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20704 // CHECK11: omp.precond.end: 20705 // CHECK11-NEXT: ret void 20706 // 20707 // 20708 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..47 20709 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20710 // CHECK11-NEXT: entry: 20711 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20712 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20713 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 20714 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 20715 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20716 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20717 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20718 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20719 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20720 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20721 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20722 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20723 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20724 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 20725 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 20726 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20727 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20728 // CHECK11-NEXT: [[I3:%.*]] = alloca i32, align 4 20729 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20730 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20731 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20732 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20733 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20734 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20735 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20736 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20737 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20738 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20739 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20740 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20741 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20742 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 20743 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20744 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20745 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20746 // CHECK11-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 20747 // CHECK11-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20748 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20749 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20750 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20751 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20752 // CHECK11: omp.precond.then: 20753 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 20754 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20755 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 20756 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20757 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20758 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 20759 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 20760 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20761 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20762 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20763 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20764 // CHECK11-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20765 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 20766 // CHECK11-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 20767 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 20768 // CHECK11: omp.dispatch.cond: 20769 // CHECK11-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20770 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 20771 // CHECK11-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 20772 // CHECK11-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 20773 // CHECK11-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 20774 // CHECK11: omp.dispatch.body: 20775 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20776 // CHECK11-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 20777 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20778 // CHECK11: omp.inner.for.cond: 20779 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 20780 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !25 20781 // CHECK11-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 20782 // CHECK11-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20783 // CHECK11: omp.inner.for.body: 20784 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 20785 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 20786 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 20787 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !25 20788 // CHECK11-NEXT: [[TMP21:%.*]] = load i32*, i32** [[TMP2]], align 4, !llvm.access.group !25 20789 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 20790 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP21]], i32 [[TMP22]] 20791 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !25 20792 // CHECK11-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP3]], align 4, !llvm.access.group !25 20793 // CHECK11-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 20794 // CHECK11-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 20795 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4, !llvm.access.group !25 20796 // CHECK11-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP26]] 20797 // CHECK11-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP1]], align 4, !llvm.access.group !25 20798 // CHECK11-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 20799 // CHECK11-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 20800 // CHECK11-NEXT: store i32 [[ADD6]], i32* [[ARRAYIDX7]], align 4, !llvm.access.group !25 20801 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 20802 // CHECK11: omp.body.continue: 20803 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20804 // CHECK11: omp.inner.for.inc: 20805 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 20806 // CHECK11-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP29]], 1 20807 // CHECK11-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 20808 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP26:![0-9]+]] 20809 // CHECK11: omp.inner.for.end: 20810 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 20811 // CHECK11: omp.dispatch.inc: 20812 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 20813 // CHECK11: omp.dispatch.end: 20814 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20815 // CHECK11: omp.precond.end: 20816 // CHECK11-NEXT: ret void 20817 // 20818 // 20819 // CHECK11-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91 20820 // CHECK11-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 20821 // CHECK11-NEXT: entry: 20822 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 20823 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 20824 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 20825 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 20826 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 20827 // CHECK11-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 20828 // CHECK11-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 20829 // CHECK11-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 20830 // CHECK11-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 20831 // CHECK11-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 20832 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..50 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 20833 // CHECK11-NEXT: ret void 20834 // 20835 // 20836 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..50 20837 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 20838 // CHECK11-NEXT: entry: 20839 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20840 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20841 // CHECK11-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 20842 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20843 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20844 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20845 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20846 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 20847 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20848 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20849 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20850 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 20851 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20852 // CHECK11-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 20853 // CHECK11-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 20854 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20855 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20856 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 20857 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 20858 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20859 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20860 // CHECK11-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 20861 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20862 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20863 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20864 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20865 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 20866 // CHECK11-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20867 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20868 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20869 // CHECK11-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20870 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 20871 // CHECK11-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 20872 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 20873 // CHECK11-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20874 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20875 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 20876 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20877 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 20878 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 20879 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20880 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20881 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 20882 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20883 // CHECK11: omp.precond.then: 20884 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 20885 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20886 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 20887 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20888 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20889 // CHECK11-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20890 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 20891 // CHECK11-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 20892 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20893 // CHECK11-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20894 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 20895 // CHECK11-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 20896 // CHECK11: cond.true: 20897 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20898 // CHECK11-NEXT: br label [[COND_END:%.*]] 20899 // CHECK11: cond.false: 20900 // CHECK11-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20901 // CHECK11-NEXT: br label [[COND_END]] 20902 // CHECK11: cond.end: 20903 // CHECK11-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 20904 // CHECK11-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 20905 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20906 // CHECK11-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 20907 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 20908 // CHECK11: omp.inner.for.cond: 20909 // CHECK11-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20910 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20911 // CHECK11-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 20912 // CHECK11-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 20913 // CHECK11: omp.inner.for.body: 20914 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 20915 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 20916 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 20917 // CHECK11-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 20918 // CHECK11-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 20919 // CHECK11-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**, i32)* @.omp_outlined..51 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i32 [[TMP22]]) 20920 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 20921 // CHECK11: omp.inner.for.inc: 20922 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 20923 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 20924 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 20925 // CHECK11-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 20926 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]] 20927 // CHECK11: omp.inner.for.end: 20928 // CHECK11-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 20929 // CHECK11: omp.loop.exit: 20930 // CHECK11-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20931 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 20932 // CHECK11-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 20933 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 20934 // CHECK11: omp.precond.end: 20935 // CHECK11-NEXT: ret void 20936 // 20937 // 20938 // CHECK11-LABEL: define {{[^@]+}}@.omp_outlined..51 20939 // CHECK11-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 20940 // CHECK11-NEXT: entry: 20941 // CHECK11-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 20942 // CHECK11-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 20943 // CHECK11-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 20944 // CHECK11-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 20945 // CHECK11-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 20946 // CHECK11-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 20947 // CHECK11-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 20948 // CHECK11-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 20949 // CHECK11-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 20950 // CHECK11-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 20951 // CHECK11-NEXT: [[TMP:%.*]] = alloca i32, align 4 20952 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 20953 // CHECK11-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 20954 // CHECK11-NEXT: [[I:%.*]] = alloca i32, align 4 20955 // CHECK11-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 20956 // CHECK11-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 20957 // CHECK11-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 20958 // CHECK11-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 20959 // CHECK11-NEXT: [[I4:%.*]] = alloca i32, align 4 20960 // CHECK11-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 20961 // CHECK11-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 20962 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20963 // CHECK11-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20964 // CHECK11-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 20965 // CHECK11-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 20966 // CHECK11-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 20967 // CHECK11-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 20968 // CHECK11-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 20969 // CHECK11-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 20970 // CHECK11-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 20971 // CHECK11-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 20972 // CHECK11-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 20973 // CHECK11-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 20974 // CHECK11-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 20975 // CHECK11-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20976 // CHECK11-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 20977 // CHECK11-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 20978 // CHECK11-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 20979 // CHECK11-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 20980 // CHECK11-NEXT: store i32 0, i32* [[I]], align 4 20981 // CHECK11-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 20982 // CHECK11-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 20983 // CHECK11-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 20984 // CHECK11: omp.precond.then: 20985 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 20986 // CHECK11-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 20987 // CHECK11-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 20988 // CHECK11-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 20989 // CHECK11-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 20990 // CHECK11-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 20991 // CHECK11-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 20992 // CHECK11-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 20993 // CHECK11-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 20994 // CHECK11-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 20995 // CHECK11-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 20996 // CHECK11-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 20997 // CHECK11-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 20998 // CHECK11-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 20999 // CHECK11-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 21000 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 21001 // CHECK11: omp.dispatch.cond: 21002 // CHECK11-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21003 // CHECK11-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 21004 // CHECK11-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 21005 // CHECK11-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 21006 // CHECK11-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 21007 // CHECK11: omp.dispatch.body: 21008 // CHECK11-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 21009 // CHECK11-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 21010 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 21011 // CHECK11: omp.inner.for.cond: 21012 // CHECK11-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 21013 // CHECK11-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !28 21014 // CHECK11-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 21015 // CHECK11-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 21016 // CHECK11: omp.inner.for.body: 21017 // CHECK11-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 21018 // CHECK11-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 21019 // CHECK11-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 21020 // CHECK11-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !28 21021 // CHECK11-NEXT: [[TMP22:%.*]] = load i32*, i32** [[TMP2]], align 4, !llvm.access.group !28 21022 // CHECK11-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 21023 // CHECK11-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP22]], i32 [[TMP23]] 21024 // CHECK11-NEXT: [[TMP24:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !28 21025 // CHECK11-NEXT: [[TMP25:%.*]] = load i32*, i32** [[TMP3]], align 4, !llvm.access.group !28 21026 // CHECK11-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 21027 // CHECK11-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP25]], i32 [[TMP26]] 21028 // CHECK11-NEXT: [[TMP27:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4, !llvm.access.group !28 21029 // CHECK11-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP24]], [[TMP27]] 21030 // CHECK11-NEXT: [[TMP28:%.*]] = load i32*, i32** [[TMP1]], align 4, !llvm.access.group !28 21031 // CHECK11-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 21032 // CHECK11-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP28]], i32 [[TMP29]] 21033 // CHECK11-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4, !llvm.access.group !28 21034 // CHECK11-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 21035 // CHECK11: omp.body.continue: 21036 // CHECK11-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 21037 // CHECK11: omp.inner.for.inc: 21038 // CHECK11-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 21039 // CHECK11-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP30]], 1 21040 // CHECK11-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 21041 // CHECK11-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP29:![0-9]+]] 21042 // CHECK11: omp.inner.for.end: 21043 // CHECK11-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 21044 // CHECK11: omp.dispatch.inc: 21045 // CHECK11-NEXT: br label [[OMP_DISPATCH_COND]] 21046 // CHECK11: omp.dispatch.end: 21047 // CHECK11-NEXT: br label [[OMP_PRECOND_END]] 21048 // CHECK11: omp.precond.end: 21049 // CHECK11-NEXT: ret void 21050 // 21051 // 21052 // CHECK11-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 21053 // CHECK11-SAME: () #[[ATTR4:[0-9]+]] { 21054 // CHECK11-NEXT: entry: 21055 // CHECK11-NEXT: call void @__tgt_register_requires(i64 1) 21056 // CHECK11-NEXT: ret void 21057 // 21058 // 21059 // CHECK12-LABEL: define {{[^@]+}}@main 21060 // CHECK12-SAME: () #[[ATTR0:[0-9]+]] { 21061 // CHECK12-NEXT: entry: 21062 // CHECK12-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 21063 // CHECK12-NEXT: [[A:%.*]] = alloca double*, align 4 21064 // CHECK12-NEXT: [[B:%.*]] = alloca double*, align 4 21065 // CHECK12-NEXT: [[C:%.*]] = alloca double*, align 4 21066 // CHECK12-NEXT: [[N:%.*]] = alloca i32, align 4 21067 // CHECK12-NEXT: [[CH:%.*]] = alloca i32, align 4 21068 // CHECK12-NEXT: [[N_CASTED:%.*]] = alloca i32, align 4 21069 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 4 21070 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 4 21071 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 4 21072 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 21073 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 21074 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 21075 // CHECK12-NEXT: [[N_CASTED3:%.*]] = alloca i32, align 4 21076 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS4:%.*]] = alloca [4 x i8*], align 4 21077 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS5:%.*]] = alloca [4 x i8*], align 4 21078 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS6:%.*]] = alloca [4 x i8*], align 4 21079 // CHECK12-NEXT: [[_TMP7:%.*]] = alloca i32, align 4 21080 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_8:%.*]] = alloca i32, align 4 21081 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 21082 // CHECK12-NEXT: [[CH_CASTED:%.*]] = alloca i32, align 4 21083 // CHECK12-NEXT: [[N_CASTED16:%.*]] = alloca i32, align 4 21084 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS17:%.*]] = alloca [5 x i8*], align 4 21085 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS18:%.*]] = alloca [5 x i8*], align 4 21086 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS19:%.*]] = alloca [5 x i8*], align 4 21087 // CHECK12-NEXT: [[_TMP20:%.*]] = alloca i32, align 4 21088 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_21:%.*]] = alloca i32, align 4 21089 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_22:%.*]] = alloca i32, align 4 21090 // CHECK12-NEXT: [[N_CASTED29:%.*]] = alloca i32, align 4 21091 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS30:%.*]] = alloca [4 x i8*], align 4 21092 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS31:%.*]] = alloca [4 x i8*], align 4 21093 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS32:%.*]] = alloca [4 x i8*], align 4 21094 // CHECK12-NEXT: [[_TMP33:%.*]] = alloca i32, align 4 21095 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_34:%.*]] = alloca i32, align 4 21096 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_35:%.*]] = alloca i32, align 4 21097 // CHECK12-NEXT: [[CH_CASTED42:%.*]] = alloca i32, align 4 21098 // CHECK12-NEXT: [[N_CASTED43:%.*]] = alloca i32, align 4 21099 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS44:%.*]] = alloca [5 x i8*], align 4 21100 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS45:%.*]] = alloca [5 x i8*], align 4 21101 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS46:%.*]] = alloca [5 x i8*], align 4 21102 // CHECK12-NEXT: [[_TMP47:%.*]] = alloca i32, align 4 21103 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_48:%.*]] = alloca i32, align 4 21104 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_49:%.*]] = alloca i32, align 4 21105 // CHECK12-NEXT: [[N_CASTED56:%.*]] = alloca i32, align 4 21106 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS57:%.*]] = alloca [4 x i8*], align 4 21107 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS58:%.*]] = alloca [4 x i8*], align 4 21108 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS59:%.*]] = alloca [4 x i8*], align 4 21109 // CHECK12-NEXT: [[_TMP60:%.*]] = alloca i32, align 4 21110 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_61:%.*]] = alloca i32, align 4 21111 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_62:%.*]] = alloca i32, align 4 21112 // CHECK12-NEXT: [[CH_CASTED69:%.*]] = alloca i32, align 4 21113 // CHECK12-NEXT: [[N_CASTED70:%.*]] = alloca i32, align 4 21114 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS71:%.*]] = alloca [5 x i8*], align 4 21115 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS72:%.*]] = alloca [5 x i8*], align 4 21116 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS73:%.*]] = alloca [5 x i8*], align 4 21117 // CHECK12-NEXT: [[_TMP74:%.*]] = alloca i32, align 4 21118 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 21119 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_76:%.*]] = alloca i32, align 4 21120 // CHECK12-NEXT: store i32 0, i32* [[RETVAL]], align 4 21121 // CHECK12-NEXT: store i32 10000, i32* [[N]], align 4 21122 // CHECK12-NEXT: store i32 100, i32* [[CH]], align 4 21123 // CHECK12-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 21124 // CHECK12-NEXT: store i32 [[TMP0]], i32* [[N_CASTED]], align 4 21125 // CHECK12-NEXT: [[TMP1:%.*]] = load i32, i32* [[N_CASTED]], align 4 21126 // CHECK12-NEXT: [[TMP2:%.*]] = load double*, double** [[A]], align 4 21127 // CHECK12-NEXT: [[TMP3:%.*]] = load double*, double** [[B]], align 4 21128 // CHECK12-NEXT: [[TMP4:%.*]] = load double*, double** [[C]], align 4 21129 // CHECK12-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 21130 // CHECK12-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i32* 21131 // CHECK12-NEXT: store i32 [[TMP1]], i32* [[TMP6]], align 4 21132 // CHECK12-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 21133 // CHECK12-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i32* 21134 // CHECK12-NEXT: store i32 [[TMP1]], i32* [[TMP8]], align 4 21135 // CHECK12-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 0 21136 // CHECK12-NEXT: store i8* null, i8** [[TMP9]], align 4 21137 // CHECK12-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 21138 // CHECK12-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to double** 21139 // CHECK12-NEXT: store double* [[TMP2]], double** [[TMP11]], align 4 21140 // CHECK12-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 21141 // CHECK12-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to double** 21142 // CHECK12-NEXT: store double* [[TMP2]], double** [[TMP13]], align 4 21143 // CHECK12-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 1 21144 // CHECK12-NEXT: store i8* null, i8** [[TMP14]], align 4 21145 // CHECK12-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 21146 // CHECK12-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to double** 21147 // CHECK12-NEXT: store double* [[TMP3]], double** [[TMP16]], align 4 21148 // CHECK12-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 21149 // CHECK12-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to double** 21150 // CHECK12-NEXT: store double* [[TMP3]], double** [[TMP18]], align 4 21151 // CHECK12-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 2 21152 // CHECK12-NEXT: store i8* null, i8** [[TMP19]], align 4 21153 // CHECK12-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 21154 // CHECK12-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to double** 21155 // CHECK12-NEXT: store double* [[TMP4]], double** [[TMP21]], align 4 21156 // CHECK12-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 21157 // CHECK12-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to double** 21158 // CHECK12-NEXT: store double* [[TMP4]], double** [[TMP23]], align 4 21159 // CHECK12-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 3 21160 // CHECK12-NEXT: store i8* null, i8** [[TMP24]], align 4 21161 // CHECK12-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 21162 // CHECK12-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 21163 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 21164 // CHECK12-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 21165 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21166 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 21167 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 21168 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 21169 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 21170 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21171 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 21172 // CHECK12-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 21173 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3:[0-9]+]], i64 -1, i64 [[TMP30]]) 21174 // CHECK12-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21175 // CHECK12-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 21176 // CHECK12-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 21177 // CHECK12: omp_offload.failed: 21178 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369(i32 [[TMP1]], double* [[TMP2]], double* [[TMP3]], double* [[TMP4]]) #[[ATTR2:[0-9]+]] 21179 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT]] 21180 // CHECK12: omp_offload.cont: 21181 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 21182 // CHECK12-NEXT: store i32 [[TMP33]], i32* [[N_CASTED3]], align 4 21183 // CHECK12-NEXT: [[TMP34:%.*]] = load i32, i32* [[N_CASTED3]], align 4 21184 // CHECK12-NEXT: [[TMP35:%.*]] = load double*, double** [[A]], align 4 21185 // CHECK12-NEXT: [[TMP36:%.*]] = load double*, double** [[B]], align 4 21186 // CHECK12-NEXT: [[TMP37:%.*]] = load double*, double** [[C]], align 4 21187 // CHECK12-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 21188 // CHECK12-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i32* 21189 // CHECK12-NEXT: store i32 [[TMP34]], i32* [[TMP39]], align 4 21190 // CHECK12-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 21191 // CHECK12-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i32* 21192 // CHECK12-NEXT: store i32 [[TMP34]], i32* [[TMP41]], align 4 21193 // CHECK12-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 0 21194 // CHECK12-NEXT: store i8* null, i8** [[TMP42]], align 4 21195 // CHECK12-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 1 21196 // CHECK12-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to double** 21197 // CHECK12-NEXT: store double* [[TMP35]], double** [[TMP44]], align 4 21198 // CHECK12-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 1 21199 // CHECK12-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to double** 21200 // CHECK12-NEXT: store double* [[TMP35]], double** [[TMP46]], align 4 21201 // CHECK12-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 1 21202 // CHECK12-NEXT: store i8* null, i8** [[TMP47]], align 4 21203 // CHECK12-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 2 21204 // CHECK12-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to double** 21205 // CHECK12-NEXT: store double* [[TMP36]], double** [[TMP49]], align 4 21206 // CHECK12-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 2 21207 // CHECK12-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to double** 21208 // CHECK12-NEXT: store double* [[TMP36]], double** [[TMP51]], align 4 21209 // CHECK12-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 2 21210 // CHECK12-NEXT: store i8* null, i8** [[TMP52]], align 4 21211 // CHECK12-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 3 21212 // CHECK12-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to double** 21213 // CHECK12-NEXT: store double* [[TMP37]], double** [[TMP54]], align 4 21214 // CHECK12-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 3 21215 // CHECK12-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to double** 21216 // CHECK12-NEXT: store double* [[TMP37]], double** [[TMP56]], align 4 21217 // CHECK12-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 3 21218 // CHECK12-NEXT: store i8* null, i8** [[TMP57]], align 4 21219 // CHECK12-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 21220 // CHECK12-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 21221 // CHECK12-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 21222 // CHECK12-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_8]], align 4 21223 // CHECK12-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_8]], align 4 21224 // CHECK12-NEXT: [[SUB10:%.*]] = sub nsw i32 [[TMP61]], 0 21225 // CHECK12-NEXT: [[DIV11:%.*]] = sdiv i32 [[SUB10]], 1 21226 // CHECK12-NEXT: [[SUB12:%.*]] = sub nsw i32 [[DIV11]], 1 21227 // CHECK12-NEXT: store i32 [[SUB12]], i32* [[DOTCAPTURE_EXPR_9]], align 4 21228 // CHECK12-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 21229 // CHECK12-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP62]], 1 21230 // CHECK12-NEXT: [[TMP63:%.*]] = zext i32 [[ADD13]] to i64 21231 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 21232 // CHECK12-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.4, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.5, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21233 // CHECK12-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 21234 // CHECK12-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED14:%.*]], label [[OMP_OFFLOAD_CONT15:%.*]] 21235 // CHECK12: omp_offload.failed14: 21236 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408(i32 [[TMP34]], double* [[TMP35]], double* [[TMP36]], double* [[TMP37]]) #[[ATTR2]] 21237 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT15]] 21238 // CHECK12: omp_offload.cont15: 21239 // CHECK12-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 21240 // CHECK12-NEXT: store i32 [[TMP66]], i32* [[CH_CASTED]], align 4 21241 // CHECK12-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH_CASTED]], align 4 21242 // CHECK12-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 21243 // CHECK12-NEXT: store i32 [[TMP68]], i32* [[N_CASTED16]], align 4 21244 // CHECK12-NEXT: [[TMP69:%.*]] = load i32, i32* [[N_CASTED16]], align 4 21245 // CHECK12-NEXT: [[TMP70:%.*]] = load double*, double** [[A]], align 4 21246 // CHECK12-NEXT: [[TMP71:%.*]] = load double*, double** [[B]], align 4 21247 // CHECK12-NEXT: [[TMP72:%.*]] = load double*, double** [[C]], align 4 21248 // CHECK12-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 21249 // CHECK12-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i32* 21250 // CHECK12-NEXT: store i32 [[TMP67]], i32* [[TMP74]], align 4 21251 // CHECK12-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 21252 // CHECK12-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i32* 21253 // CHECK12-NEXT: store i32 [[TMP67]], i32* [[TMP76]], align 4 21254 // CHECK12-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 0 21255 // CHECK12-NEXT: store i8* null, i8** [[TMP77]], align 4 21256 // CHECK12-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 1 21257 // CHECK12-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i32* 21258 // CHECK12-NEXT: store i32 [[TMP69]], i32* [[TMP79]], align 4 21259 // CHECK12-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 1 21260 // CHECK12-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i32* 21261 // CHECK12-NEXT: store i32 [[TMP69]], i32* [[TMP81]], align 4 21262 // CHECK12-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 1 21263 // CHECK12-NEXT: store i8* null, i8** [[TMP82]], align 4 21264 // CHECK12-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 2 21265 // CHECK12-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to double** 21266 // CHECK12-NEXT: store double* [[TMP70]], double** [[TMP84]], align 4 21267 // CHECK12-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 2 21268 // CHECK12-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to double** 21269 // CHECK12-NEXT: store double* [[TMP70]], double** [[TMP86]], align 4 21270 // CHECK12-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 2 21271 // CHECK12-NEXT: store i8* null, i8** [[TMP87]], align 4 21272 // CHECK12-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 3 21273 // CHECK12-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to double** 21274 // CHECK12-NEXT: store double* [[TMP71]], double** [[TMP89]], align 4 21275 // CHECK12-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 3 21276 // CHECK12-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to double** 21277 // CHECK12-NEXT: store double* [[TMP71]], double** [[TMP91]], align 4 21278 // CHECK12-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 3 21279 // CHECK12-NEXT: store i8* null, i8** [[TMP92]], align 4 21280 // CHECK12-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 4 21281 // CHECK12-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to double** 21282 // CHECK12-NEXT: store double* [[TMP72]], double** [[TMP94]], align 4 21283 // CHECK12-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 4 21284 // CHECK12-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to double** 21285 // CHECK12-NEXT: store double* [[TMP72]], double** [[TMP96]], align 4 21286 // CHECK12-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 4 21287 // CHECK12-NEXT: store i8* null, i8** [[TMP97]], align 4 21288 // CHECK12-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 21289 // CHECK12-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 21290 // CHECK12-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 21291 // CHECK12-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_21]], align 4 21292 // CHECK12-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_21]], align 4 21293 // CHECK12-NEXT: [[SUB23:%.*]] = sub nsw i32 [[TMP101]], 0 21294 // CHECK12-NEXT: [[DIV24:%.*]] = sdiv i32 [[SUB23]], 1 21295 // CHECK12-NEXT: [[SUB25:%.*]] = sub nsw i32 [[DIV24]], 1 21296 // CHECK12-NEXT: store i32 [[SUB25]], i32* [[DOTCAPTURE_EXPR_22]], align 4 21297 // CHECK12-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_22]], align 4 21298 // CHECK12-NEXT: [[ADD26:%.*]] = add nsw i32 [[TMP102]], 1 21299 // CHECK12-NEXT: [[TMP103:%.*]] = zext i32 [[ADD26]] to i64 21300 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 21301 // CHECK12-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.8, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.9, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21302 // CHECK12-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 21303 // CHECK12-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED27:%.*]], label [[OMP_OFFLOAD_CONT28:%.*]] 21304 // CHECK12: omp_offload.failed27: 21305 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447(i32 [[TMP67]], i32 [[TMP69]], double* [[TMP70]], double* [[TMP71]], double* [[TMP72]]) #[[ATTR2]] 21306 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT28]] 21307 // CHECK12: omp_offload.cont28: 21308 // CHECK12-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 21309 // CHECK12-NEXT: store i32 [[TMP106]], i32* [[N_CASTED29]], align 4 21310 // CHECK12-NEXT: [[TMP107:%.*]] = load i32, i32* [[N_CASTED29]], align 4 21311 // CHECK12-NEXT: [[TMP108:%.*]] = load double*, double** [[A]], align 4 21312 // CHECK12-NEXT: [[TMP109:%.*]] = load double*, double** [[B]], align 4 21313 // CHECK12-NEXT: [[TMP110:%.*]] = load double*, double** [[C]], align 4 21314 // CHECK12-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 21315 // CHECK12-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i32* 21316 // CHECK12-NEXT: store i32 [[TMP107]], i32* [[TMP112]], align 4 21317 // CHECK12-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 21318 // CHECK12-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i32* 21319 // CHECK12-NEXT: store i32 [[TMP107]], i32* [[TMP114]], align 4 21320 // CHECK12-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 0 21321 // CHECK12-NEXT: store i8* null, i8** [[TMP115]], align 4 21322 // CHECK12-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 1 21323 // CHECK12-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to double** 21324 // CHECK12-NEXT: store double* [[TMP108]], double** [[TMP117]], align 4 21325 // CHECK12-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 1 21326 // CHECK12-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to double** 21327 // CHECK12-NEXT: store double* [[TMP108]], double** [[TMP119]], align 4 21328 // CHECK12-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 1 21329 // CHECK12-NEXT: store i8* null, i8** [[TMP120]], align 4 21330 // CHECK12-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 2 21331 // CHECK12-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to double** 21332 // CHECK12-NEXT: store double* [[TMP109]], double** [[TMP122]], align 4 21333 // CHECK12-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 2 21334 // CHECK12-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to double** 21335 // CHECK12-NEXT: store double* [[TMP109]], double** [[TMP124]], align 4 21336 // CHECK12-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 2 21337 // CHECK12-NEXT: store i8* null, i8** [[TMP125]], align 4 21338 // CHECK12-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 3 21339 // CHECK12-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to double** 21340 // CHECK12-NEXT: store double* [[TMP110]], double** [[TMP127]], align 4 21341 // CHECK12-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 3 21342 // CHECK12-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to double** 21343 // CHECK12-NEXT: store double* [[TMP110]], double** [[TMP129]], align 4 21344 // CHECK12-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 3 21345 // CHECK12-NEXT: store i8* null, i8** [[TMP130]], align 4 21346 // CHECK12-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 21347 // CHECK12-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 21348 // CHECK12-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 21349 // CHECK12-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_34]], align 4 21350 // CHECK12-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_34]], align 4 21351 // CHECK12-NEXT: [[SUB36:%.*]] = sub nsw i32 [[TMP134]], 0 21352 // CHECK12-NEXT: [[DIV37:%.*]] = sdiv i32 [[SUB36]], 1 21353 // CHECK12-NEXT: [[SUB38:%.*]] = sub nsw i32 [[DIV37]], 1 21354 // CHECK12-NEXT: store i32 [[SUB38]], i32* [[DOTCAPTURE_EXPR_35]], align 4 21355 // CHECK12-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_35]], align 4 21356 // CHECK12-NEXT: [[ADD39:%.*]] = add nsw i32 [[TMP135]], 1 21357 // CHECK12-NEXT: [[TMP136:%.*]] = zext i32 [[ADD39]] to i64 21358 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 21359 // CHECK12-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.12, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.13, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21360 // CHECK12-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 21361 // CHECK12-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED40:%.*]], label [[OMP_OFFLOAD_CONT41:%.*]] 21362 // CHECK12: omp_offload.failed40: 21363 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478(i32 [[TMP107]], double* [[TMP108]], double* [[TMP109]], double* [[TMP110]]) #[[ATTR2]] 21364 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT41]] 21365 // CHECK12: omp_offload.cont41: 21366 // CHECK12-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 21367 // CHECK12-NEXT: store i32 [[TMP139]], i32* [[CH_CASTED42]], align 4 21368 // CHECK12-NEXT: [[TMP140:%.*]] = load i32, i32* [[CH_CASTED42]], align 4 21369 // CHECK12-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 21370 // CHECK12-NEXT: store i32 [[TMP141]], i32* [[N_CASTED43]], align 4 21371 // CHECK12-NEXT: [[TMP142:%.*]] = load i32, i32* [[N_CASTED43]], align 4 21372 // CHECK12-NEXT: [[TMP143:%.*]] = load double*, double** [[A]], align 4 21373 // CHECK12-NEXT: [[TMP144:%.*]] = load double*, double** [[B]], align 4 21374 // CHECK12-NEXT: [[TMP145:%.*]] = load double*, double** [[C]], align 4 21375 // CHECK12-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 21376 // CHECK12-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i32* 21377 // CHECK12-NEXT: store i32 [[TMP140]], i32* [[TMP147]], align 4 21378 // CHECK12-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 21379 // CHECK12-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i32* 21380 // CHECK12-NEXT: store i32 [[TMP140]], i32* [[TMP149]], align 4 21381 // CHECK12-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 0 21382 // CHECK12-NEXT: store i8* null, i8** [[TMP150]], align 4 21383 // CHECK12-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 1 21384 // CHECK12-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i32* 21385 // CHECK12-NEXT: store i32 [[TMP142]], i32* [[TMP152]], align 4 21386 // CHECK12-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 1 21387 // CHECK12-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i32* 21388 // CHECK12-NEXT: store i32 [[TMP142]], i32* [[TMP154]], align 4 21389 // CHECK12-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 1 21390 // CHECK12-NEXT: store i8* null, i8** [[TMP155]], align 4 21391 // CHECK12-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 2 21392 // CHECK12-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to double** 21393 // CHECK12-NEXT: store double* [[TMP143]], double** [[TMP157]], align 4 21394 // CHECK12-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 2 21395 // CHECK12-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to double** 21396 // CHECK12-NEXT: store double* [[TMP143]], double** [[TMP159]], align 4 21397 // CHECK12-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 2 21398 // CHECK12-NEXT: store i8* null, i8** [[TMP160]], align 4 21399 // CHECK12-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 3 21400 // CHECK12-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to double** 21401 // CHECK12-NEXT: store double* [[TMP144]], double** [[TMP162]], align 4 21402 // CHECK12-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 3 21403 // CHECK12-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to double** 21404 // CHECK12-NEXT: store double* [[TMP144]], double** [[TMP164]], align 4 21405 // CHECK12-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 3 21406 // CHECK12-NEXT: store i8* null, i8** [[TMP165]], align 4 21407 // CHECK12-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 4 21408 // CHECK12-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to double** 21409 // CHECK12-NEXT: store double* [[TMP145]], double** [[TMP167]], align 4 21410 // CHECK12-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 4 21411 // CHECK12-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to double** 21412 // CHECK12-NEXT: store double* [[TMP145]], double** [[TMP169]], align 4 21413 // CHECK12-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 4 21414 // CHECK12-NEXT: store i8* null, i8** [[TMP170]], align 4 21415 // CHECK12-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 21416 // CHECK12-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 21417 // CHECK12-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 21418 // CHECK12-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_48]], align 4 21419 // CHECK12-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_48]], align 4 21420 // CHECK12-NEXT: [[SUB50:%.*]] = sub nsw i32 [[TMP174]], 0 21421 // CHECK12-NEXT: [[DIV51:%.*]] = sdiv i32 [[SUB50]], 1 21422 // CHECK12-NEXT: [[SUB52:%.*]] = sub nsw i32 [[DIV51]], 1 21423 // CHECK12-NEXT: store i32 [[SUB52]], i32* [[DOTCAPTURE_EXPR_49]], align 4 21424 // CHECK12-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_49]], align 4 21425 // CHECK12-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP175]], 1 21426 // CHECK12-NEXT: [[TMP176:%.*]] = zext i32 [[ADD53]] to i64 21427 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 21428 // CHECK12-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.16, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.17, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21429 // CHECK12-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 21430 // CHECK12-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED54:%.*]], label [[OMP_OFFLOAD_CONT55:%.*]] 21431 // CHECK12: omp_offload.failed54: 21432 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506(i32 [[TMP140]], i32 [[TMP142]], double* [[TMP143]], double* [[TMP144]], double* [[TMP145]]) #[[ATTR2]] 21433 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT55]] 21434 // CHECK12: omp_offload.cont55: 21435 // CHECK12-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 21436 // CHECK12-NEXT: store i32 [[TMP179]], i32* [[N_CASTED56]], align 4 21437 // CHECK12-NEXT: [[TMP180:%.*]] = load i32, i32* [[N_CASTED56]], align 4 21438 // CHECK12-NEXT: [[TMP181:%.*]] = load double*, double** [[A]], align 4 21439 // CHECK12-NEXT: [[TMP182:%.*]] = load double*, double** [[B]], align 4 21440 // CHECK12-NEXT: [[TMP183:%.*]] = load double*, double** [[C]], align 4 21441 // CHECK12-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 21442 // CHECK12-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i32* 21443 // CHECK12-NEXT: store i32 [[TMP180]], i32* [[TMP185]], align 4 21444 // CHECK12-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 21445 // CHECK12-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i32* 21446 // CHECK12-NEXT: store i32 [[TMP180]], i32* [[TMP187]], align 4 21447 // CHECK12-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 0 21448 // CHECK12-NEXT: store i8* null, i8** [[TMP188]], align 4 21449 // CHECK12-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 1 21450 // CHECK12-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to double** 21451 // CHECK12-NEXT: store double* [[TMP181]], double** [[TMP190]], align 4 21452 // CHECK12-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 1 21453 // CHECK12-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to double** 21454 // CHECK12-NEXT: store double* [[TMP181]], double** [[TMP192]], align 4 21455 // CHECK12-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 1 21456 // CHECK12-NEXT: store i8* null, i8** [[TMP193]], align 4 21457 // CHECK12-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 2 21458 // CHECK12-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to double** 21459 // CHECK12-NEXT: store double* [[TMP182]], double** [[TMP195]], align 4 21460 // CHECK12-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 2 21461 // CHECK12-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to double** 21462 // CHECK12-NEXT: store double* [[TMP182]], double** [[TMP197]], align 4 21463 // CHECK12-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 2 21464 // CHECK12-NEXT: store i8* null, i8** [[TMP198]], align 4 21465 // CHECK12-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 3 21466 // CHECK12-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to double** 21467 // CHECK12-NEXT: store double* [[TMP183]], double** [[TMP200]], align 4 21468 // CHECK12-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 3 21469 // CHECK12-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to double** 21470 // CHECK12-NEXT: store double* [[TMP183]], double** [[TMP202]], align 4 21471 // CHECK12-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 3 21472 // CHECK12-NEXT: store i8* null, i8** [[TMP203]], align 4 21473 // CHECK12-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 21474 // CHECK12-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 21475 // CHECK12-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 21476 // CHECK12-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_61]], align 4 21477 // CHECK12-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_61]], align 4 21478 // CHECK12-NEXT: [[SUB63:%.*]] = sub nsw i32 [[TMP207]], 0 21479 // CHECK12-NEXT: [[DIV64:%.*]] = sdiv i32 [[SUB63]], 1 21480 // CHECK12-NEXT: [[SUB65:%.*]] = sub nsw i32 [[DIV64]], 1 21481 // CHECK12-NEXT: store i32 [[SUB65]], i32* [[DOTCAPTURE_EXPR_62]], align 4 21482 // CHECK12-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_62]], align 4 21483 // CHECK12-NEXT: [[ADD66:%.*]] = add nsw i32 [[TMP208]], 1 21484 // CHECK12-NEXT: [[TMP209:%.*]] = zext i32 [[ADD66]] to i64 21485 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 21486 // CHECK12-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.20, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.21, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21487 // CHECK12-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 21488 // CHECK12-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED67:%.*]], label [[OMP_OFFLOAD_CONT68:%.*]] 21489 // CHECK12: omp_offload.failed67: 21490 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536(i32 [[TMP180]], double* [[TMP181]], double* [[TMP182]], double* [[TMP183]]) #[[ATTR2]] 21491 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT68]] 21492 // CHECK12: omp_offload.cont68: 21493 // CHECK12-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 21494 // CHECK12-NEXT: store i32 [[TMP212]], i32* [[CH_CASTED69]], align 4 21495 // CHECK12-NEXT: [[TMP213:%.*]] = load i32, i32* [[CH_CASTED69]], align 4 21496 // CHECK12-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 21497 // CHECK12-NEXT: store i32 [[TMP214]], i32* [[N_CASTED70]], align 4 21498 // CHECK12-NEXT: [[TMP215:%.*]] = load i32, i32* [[N_CASTED70]], align 4 21499 // CHECK12-NEXT: [[TMP216:%.*]] = load double*, double** [[A]], align 4 21500 // CHECK12-NEXT: [[TMP217:%.*]] = load double*, double** [[B]], align 4 21501 // CHECK12-NEXT: [[TMP218:%.*]] = load double*, double** [[C]], align 4 21502 // CHECK12-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 21503 // CHECK12-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i32* 21504 // CHECK12-NEXT: store i32 [[TMP213]], i32* [[TMP220]], align 4 21505 // CHECK12-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 21506 // CHECK12-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i32* 21507 // CHECK12-NEXT: store i32 [[TMP213]], i32* [[TMP222]], align 4 21508 // CHECK12-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 0 21509 // CHECK12-NEXT: store i8* null, i8** [[TMP223]], align 4 21510 // CHECK12-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 1 21511 // CHECK12-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i32* 21512 // CHECK12-NEXT: store i32 [[TMP215]], i32* [[TMP225]], align 4 21513 // CHECK12-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 1 21514 // CHECK12-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i32* 21515 // CHECK12-NEXT: store i32 [[TMP215]], i32* [[TMP227]], align 4 21516 // CHECK12-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 1 21517 // CHECK12-NEXT: store i8* null, i8** [[TMP228]], align 4 21518 // CHECK12-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 2 21519 // CHECK12-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to double** 21520 // CHECK12-NEXT: store double* [[TMP216]], double** [[TMP230]], align 4 21521 // CHECK12-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 2 21522 // CHECK12-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to double** 21523 // CHECK12-NEXT: store double* [[TMP216]], double** [[TMP232]], align 4 21524 // CHECK12-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 2 21525 // CHECK12-NEXT: store i8* null, i8** [[TMP233]], align 4 21526 // CHECK12-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 3 21527 // CHECK12-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to double** 21528 // CHECK12-NEXT: store double* [[TMP217]], double** [[TMP235]], align 4 21529 // CHECK12-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 3 21530 // CHECK12-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to double** 21531 // CHECK12-NEXT: store double* [[TMP217]], double** [[TMP237]], align 4 21532 // CHECK12-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 3 21533 // CHECK12-NEXT: store i8* null, i8** [[TMP238]], align 4 21534 // CHECK12-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 4 21535 // CHECK12-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to double** 21536 // CHECK12-NEXT: store double* [[TMP218]], double** [[TMP240]], align 4 21537 // CHECK12-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 4 21538 // CHECK12-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to double** 21539 // CHECK12-NEXT: store double* [[TMP218]], double** [[TMP242]], align 4 21540 // CHECK12-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 4 21541 // CHECK12-NEXT: store i8* null, i8** [[TMP243]], align 4 21542 // CHECK12-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 21543 // CHECK12-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 21544 // CHECK12-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 21545 // CHECK12-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_75]], align 4 21546 // CHECK12-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_75]], align 4 21547 // CHECK12-NEXT: [[SUB77:%.*]] = sub nsw i32 [[TMP247]], 0 21548 // CHECK12-NEXT: [[DIV78:%.*]] = sdiv i32 [[SUB77]], 1 21549 // CHECK12-NEXT: [[SUB79:%.*]] = sub nsw i32 [[DIV78]], 1 21550 // CHECK12-NEXT: store i32 [[SUB79]], i32* [[DOTCAPTURE_EXPR_76]], align 4 21551 // CHECK12-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_76]], align 4 21552 // CHECK12-NEXT: [[ADD80:%.*]] = add nsw i32 [[TMP248]], 1 21553 // CHECK12-NEXT: [[TMP249:%.*]] = zext i32 [[ADD80]] to i64 21554 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 21555 // CHECK12-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.24, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.25, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 21556 // CHECK12-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 21557 // CHECK12-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED81:%.*]], label [[OMP_OFFLOAD_CONT82:%.*]] 21558 // CHECK12: omp_offload.failed81: 21559 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562(i32 [[TMP213]], i32 [[TMP215]], double* [[TMP216]], double* [[TMP217]], double* [[TMP218]]) #[[ATTR2]] 21560 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT82]] 21561 // CHECK12: omp_offload.cont82: 21562 // CHECK12-NEXT: [[CALL:%.*]] = call i32 @_Z5tmainIiET_v() 21563 // CHECK12-NEXT: ret i32 [[CALL]] 21564 // 21565 // 21566 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l369 21567 // CHECK12-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1:[0-9]+]] { 21568 // CHECK12-NEXT: entry: 21569 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 21570 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 21571 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 21572 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 21573 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 21574 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 21575 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 21576 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 21577 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 21578 // CHECK12-NEXT: ret void 21579 // 21580 // 21581 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined. 21582 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 21583 // CHECK12-NEXT: entry: 21584 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 21585 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 21586 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 21587 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 21588 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 21589 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 21590 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 21591 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 21592 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 21593 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 21594 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 21595 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 21596 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 21597 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 21598 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 21599 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 21600 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 21601 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 21602 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 21603 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 21604 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 21605 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 21606 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 21607 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 21608 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 21609 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 21610 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 21611 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 21612 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21613 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 21614 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 21615 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 21616 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 21617 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 21618 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21619 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 21620 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 21621 // CHECK12: omp.precond.then: 21622 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 21623 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21624 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 21625 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 21626 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 21627 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21628 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 21629 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1:[0-9]+]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 21630 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21631 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21632 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 21633 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 21634 // CHECK12: cond.true: 21635 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21636 // CHECK12-NEXT: br label [[COND_END:%.*]] 21637 // CHECK12: cond.false: 21638 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21639 // CHECK12-NEXT: br label [[COND_END]] 21640 // CHECK12: cond.end: 21641 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 21642 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 21643 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 21644 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 21645 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 21646 // CHECK12: omp.inner.for.cond: 21647 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21648 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21649 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 21650 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 21651 // CHECK12: omp.inner.for.body: 21652 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 21653 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21654 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 21655 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 21656 // CHECK12: omp.inner.for.inc: 21657 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21658 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 21659 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 21660 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 21661 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 21662 // CHECK12: omp.inner.for.end: 21663 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 21664 // CHECK12: omp.loop.exit: 21665 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21666 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 21667 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 21668 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 21669 // CHECK12: omp.precond.end: 21670 // CHECK12-NEXT: ret void 21671 // 21672 // 21673 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..1 21674 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 21675 // CHECK12-NEXT: entry: 21676 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 21677 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 21678 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 21679 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 21680 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 21681 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 21682 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 21683 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 21684 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 21685 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 21686 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 21687 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 21688 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 21689 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 21690 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 21691 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 21692 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 21693 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 21694 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 21695 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 21696 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 21697 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 21698 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 21699 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 21700 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 21701 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 21702 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 21703 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 21704 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 21705 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 21706 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 21707 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 21708 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21709 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 21710 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 21711 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 21712 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 21713 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 21714 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21715 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 21716 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 21717 // CHECK12: omp.precond.then: 21718 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 21719 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21720 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 21721 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 21722 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 21723 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 21724 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 21725 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 21726 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 21727 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21728 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 21729 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 21730 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21731 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21732 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 21733 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 21734 // CHECK12: cond.true: 21735 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21736 // CHECK12-NEXT: br label [[COND_END:%.*]] 21737 // CHECK12: cond.false: 21738 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21739 // CHECK12-NEXT: br label [[COND_END]] 21740 // CHECK12: cond.end: 21741 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 21742 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 21743 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 21744 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 21745 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 21746 // CHECK12: omp.inner.for.cond: 21747 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21748 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21749 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 21750 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 21751 // CHECK12: omp.inner.for.body: 21752 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21753 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 21754 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 21755 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 21756 // CHECK12-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 21757 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 21758 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 21759 // CHECK12-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 21760 // CHECK12-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 21761 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 21762 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 21763 // CHECK12-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 21764 // CHECK12-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 21765 // CHECK12-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 21766 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 21767 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 21768 // CHECK12-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 21769 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 21770 // CHECK12: omp.body.continue: 21771 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 21772 // CHECK12: omp.inner.for.inc: 21773 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21774 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 21775 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 21776 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 21777 // CHECK12: omp.inner.for.end: 21778 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 21779 // CHECK12: omp.loop.exit: 21780 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21781 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 21782 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 21783 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 21784 // CHECK12: omp.precond.end: 21785 // CHECK12-NEXT: ret void 21786 // 21787 // 21788 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l408 21789 // CHECK12-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 21790 // CHECK12-NEXT: entry: 21791 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 21792 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 21793 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 21794 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 21795 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 21796 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 21797 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 21798 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 21799 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 21800 // CHECK12-NEXT: ret void 21801 // 21802 // 21803 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..2 21804 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 21805 // CHECK12-NEXT: entry: 21806 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 21807 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 21808 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 21809 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 21810 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 21811 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 21812 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 21813 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 21814 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 21815 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 21816 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 21817 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 21818 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 21819 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 21820 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 21821 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 21822 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 21823 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 21824 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 21825 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 21826 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 21827 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 21828 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 21829 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 21830 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 21831 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 21832 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 21833 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 21834 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21835 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 21836 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 21837 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 21838 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 21839 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 21840 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21841 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 21842 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 21843 // CHECK12: omp.precond.then: 21844 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 21845 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21846 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 21847 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 21848 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 21849 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21850 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 21851 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 21852 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21853 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21854 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 21855 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 21856 // CHECK12: cond.true: 21857 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21858 // CHECK12-NEXT: br label [[COND_END:%.*]] 21859 // CHECK12: cond.false: 21860 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21861 // CHECK12-NEXT: br label [[COND_END]] 21862 // CHECK12: cond.end: 21863 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 21864 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 21865 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 21866 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 21867 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 21868 // CHECK12: omp.inner.for.cond: 21869 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21870 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21871 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 21872 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 21873 // CHECK12: omp.inner.for.body: 21874 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 21875 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 21876 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 21877 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 21878 // CHECK12: omp.inner.for.inc: 21879 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21880 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 21881 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 21882 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 21883 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 21884 // CHECK12: omp.inner.for.end: 21885 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 21886 // CHECK12: omp.loop.exit: 21887 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21888 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 21889 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 21890 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 21891 // CHECK12: omp.precond.end: 21892 // CHECK12-NEXT: ret void 21893 // 21894 // 21895 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..3 21896 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 21897 // CHECK12-NEXT: entry: 21898 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 21899 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 21900 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 21901 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 21902 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 21903 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 21904 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 21905 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 21906 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 21907 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 21908 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 21909 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 21910 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 21911 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 21912 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 21913 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 21914 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 21915 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 21916 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 21917 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 21918 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 21919 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 21920 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 21921 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 21922 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 21923 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 21924 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 21925 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 21926 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 21927 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 21928 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 21929 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 21930 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21931 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 21932 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 21933 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 21934 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 21935 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 21936 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 21937 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 21938 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 21939 // CHECK12: omp.precond.then: 21940 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 21941 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21942 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 21943 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 21944 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 21945 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 21946 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 21947 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 21948 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 21949 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 21950 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 21951 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 21952 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21953 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21954 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 21955 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 21956 // CHECK12: cond.true: 21957 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 21958 // CHECK12-NEXT: br label [[COND_END:%.*]] 21959 // CHECK12: cond.false: 21960 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21961 // CHECK12-NEXT: br label [[COND_END]] 21962 // CHECK12: cond.end: 21963 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 21964 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 21965 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 21966 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 21967 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 21968 // CHECK12: omp.inner.for.cond: 21969 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21970 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 21971 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 21972 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 21973 // CHECK12: omp.inner.for.body: 21974 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21975 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 21976 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 21977 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 21978 // CHECK12-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 21979 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 21980 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 21981 // CHECK12-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 21982 // CHECK12-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 21983 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 21984 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 21985 // CHECK12-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 21986 // CHECK12-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 21987 // CHECK12-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 21988 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 21989 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 21990 // CHECK12-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 21991 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 21992 // CHECK12: omp.body.continue: 21993 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 21994 // CHECK12: omp.inner.for.inc: 21995 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 21996 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 21997 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 21998 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 21999 // CHECK12: omp.inner.for.end: 22000 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22001 // CHECK12: omp.loop.exit: 22002 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22003 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 22004 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 22005 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22006 // CHECK12: omp.precond.end: 22007 // CHECK12-NEXT: ret void 22008 // 22009 // 22010 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l447 22011 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 22012 // CHECK12-NEXT: entry: 22013 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 22014 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 22015 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 22016 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 22017 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 22018 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 22019 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 22020 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 22021 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 22022 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 22023 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 22024 // CHECK12-NEXT: ret void 22025 // 22026 // 22027 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..6 22028 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22029 // CHECK12-NEXT: entry: 22030 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22031 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22032 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 22033 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22034 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22035 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22036 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22037 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22038 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22039 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22040 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22041 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22042 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 22043 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 22044 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22045 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22046 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22047 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22048 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22049 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 22050 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22051 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22052 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22053 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22054 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 22055 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22056 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 22057 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 22058 // CHECK12-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 22059 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 22060 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 22061 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22062 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 22063 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22064 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22065 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22066 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22067 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22068 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 22069 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22070 // CHECK12: omp.precond.then: 22071 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 22072 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22073 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 22074 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22075 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22076 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 22077 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22078 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 22079 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 22080 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22081 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22082 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 22083 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22084 // CHECK12: cond.true: 22085 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22086 // CHECK12-NEXT: br label [[COND_END:%.*]] 22087 // CHECK12: cond.false: 22088 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22089 // CHECK12-NEXT: br label [[COND_END]] 22090 // CHECK12: cond.end: 22091 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 22092 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 22093 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22094 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 22095 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22096 // CHECK12: omp.inner.for.cond: 22097 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22098 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22099 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 22100 // CHECK12-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 22101 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22102 // CHECK12: omp.inner.for.body: 22103 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22104 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22105 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]]) 22106 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22107 // CHECK12: omp.inner.for.inc: 22108 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22109 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22110 // CHECK12-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 22111 // CHECK12-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 22112 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22113 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22114 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 22115 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 22116 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22117 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22118 // CHECK12-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 22119 // CHECK12-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 22120 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22121 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22122 // CHECK12-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 22123 // CHECK12-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 22124 // CHECK12: cond.true10: 22125 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22126 // CHECK12-NEXT: br label [[COND_END12:%.*]] 22127 // CHECK12: cond.false11: 22128 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22129 // CHECK12-NEXT: br label [[COND_END12]] 22130 // CHECK12: cond.end12: 22131 // CHECK12-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 22132 // CHECK12-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 22133 // CHECK12-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22134 // CHECK12-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 22135 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22136 // CHECK12: omp.inner.for.end: 22137 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22138 // CHECK12: omp.loop.exit: 22139 // CHECK12-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22140 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 22141 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 22142 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22143 // CHECK12: omp.precond.end: 22144 // CHECK12-NEXT: ret void 22145 // 22146 // 22147 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..7 22148 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22149 // CHECK12-NEXT: entry: 22150 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22151 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22152 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 22153 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 22154 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22155 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22156 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22157 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22158 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22159 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22160 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22161 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22162 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22163 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 22164 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 22165 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22166 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22167 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22168 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22169 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22170 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22171 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22172 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22173 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22174 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22175 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22176 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22177 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22178 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22179 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22180 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22181 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 22182 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22183 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22184 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22185 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22186 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22187 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22188 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22189 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22190 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22191 // CHECK12: omp.precond.then: 22192 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 22193 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22194 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 22195 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22196 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22197 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 22198 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 22199 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22200 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22201 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22202 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 22203 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 22204 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22205 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22206 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 22207 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22208 // CHECK12: cond.true: 22209 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22210 // CHECK12-NEXT: br label [[COND_END:%.*]] 22211 // CHECK12: cond.false: 22212 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22213 // CHECK12-NEXT: br label [[COND_END]] 22214 // CHECK12: cond.end: 22215 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 22216 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 22217 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22218 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 22219 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22220 // CHECK12: omp.inner.for.cond: 22221 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22222 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22223 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 22224 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22225 // CHECK12: omp.inner.for.body: 22226 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22227 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 22228 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 22229 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 22230 // CHECK12-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 22231 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 22232 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 22233 // CHECK12-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 22234 // CHECK12-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 22235 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 22236 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 22237 // CHECK12-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 22238 // CHECK12-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 22239 // CHECK12-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 22240 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 22241 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 22242 // CHECK12-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 22243 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 22244 // CHECK12: omp.body.continue: 22245 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22246 // CHECK12: omp.inner.for.inc: 22247 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22248 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 22249 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 22250 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22251 // CHECK12: omp.inner.for.end: 22252 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22253 // CHECK12: omp.loop.exit: 22254 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22255 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 22256 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 22257 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22258 // CHECK12: omp.precond.end: 22259 // CHECK12-NEXT: ret void 22260 // 22261 // 22262 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l478 22263 // CHECK12-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 22264 // CHECK12-NEXT: entry: 22265 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 22266 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 22267 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 22268 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 22269 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 22270 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 22271 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 22272 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 22273 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..10 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 22274 // CHECK12-NEXT: ret void 22275 // 22276 // 22277 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..10 22278 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22279 // CHECK12-NEXT: entry: 22280 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22281 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22282 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22283 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22284 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22285 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22286 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22287 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22288 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22289 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22290 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22291 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 22292 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 22293 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22294 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22295 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22296 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22297 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22298 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22299 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22300 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22301 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22302 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22303 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22304 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22305 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22306 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22307 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 22308 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22309 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22310 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22311 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22312 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22313 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22314 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22315 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22316 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22317 // CHECK12: omp.precond.then: 22318 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 22319 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22320 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 22321 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22322 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22323 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22324 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 22325 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 22326 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22327 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22328 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 22329 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22330 // CHECK12: cond.true: 22331 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22332 // CHECK12-NEXT: br label [[COND_END:%.*]] 22333 // CHECK12: cond.false: 22334 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22335 // CHECK12-NEXT: br label [[COND_END]] 22336 // CHECK12: cond.end: 22337 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 22338 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 22339 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22340 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 22341 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22342 // CHECK12: omp.inner.for.cond: 22343 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22344 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22345 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 22346 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22347 // CHECK12: omp.inner.for.body: 22348 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22349 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22350 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..11 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 22351 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22352 // CHECK12: omp.inner.for.inc: 22353 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22354 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22355 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 22356 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 22357 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22358 // CHECK12: omp.inner.for.end: 22359 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22360 // CHECK12: omp.loop.exit: 22361 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22362 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 22363 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 22364 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22365 // CHECK12: omp.precond.end: 22366 // CHECK12-NEXT: ret void 22367 // 22368 // 22369 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..11 22370 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22371 // CHECK12-NEXT: entry: 22372 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22373 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22374 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 22375 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 22376 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22377 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22378 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22379 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22380 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22381 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22382 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22383 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22384 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22385 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 22386 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 22387 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22388 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22389 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22390 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22391 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22392 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22393 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22394 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22395 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22396 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22397 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22398 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22399 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22400 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22401 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22402 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22403 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 22404 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22405 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22406 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22407 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22408 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22409 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22410 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22411 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22412 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22413 // CHECK12: omp.precond.then: 22414 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 22415 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22416 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 22417 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22418 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22419 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 22420 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 22421 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22422 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22423 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22424 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 22425 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 22426 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22427 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22428 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 22429 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22430 // CHECK12: cond.true: 22431 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22432 // CHECK12-NEXT: br label [[COND_END:%.*]] 22433 // CHECK12: cond.false: 22434 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22435 // CHECK12-NEXT: br label [[COND_END]] 22436 // CHECK12: cond.end: 22437 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 22438 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 22439 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22440 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 22441 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22442 // CHECK12: omp.inner.for.cond: 22443 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22444 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22445 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 22446 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22447 // CHECK12: omp.inner.for.body: 22448 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22449 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 22450 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 22451 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 22452 // CHECK12-NEXT: [[TMP20:%.*]] = load double*, double** [[TMP2]], align 4 22453 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 22454 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP20]], i32 [[TMP21]] 22455 // CHECK12-NEXT: [[TMP22:%.*]] = load double, double* [[ARRAYIDX]], align 4 22456 // CHECK12-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP3]], align 4 22457 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 22458 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 22459 // CHECK12-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX6]], align 4 22460 // CHECK12-NEXT: [[ADD7:%.*]] = fadd double [[TMP22]], [[TMP25]] 22461 // CHECK12-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP1]], align 4 22462 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 22463 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 22464 // CHECK12-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4 22465 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 22466 // CHECK12: omp.body.continue: 22467 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22468 // CHECK12: omp.inner.for.inc: 22469 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22470 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 22471 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 22472 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22473 // CHECK12: omp.inner.for.end: 22474 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22475 // CHECK12: omp.loop.exit: 22476 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22477 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 22478 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 22479 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22480 // CHECK12: omp.precond.end: 22481 // CHECK12-NEXT: ret void 22482 // 22483 // 22484 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l506 22485 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 22486 // CHECK12-NEXT: entry: 22487 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 22488 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 22489 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 22490 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 22491 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 22492 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 22493 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 22494 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 22495 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 22496 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 22497 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 22498 // CHECK12-NEXT: ret void 22499 // 22500 // 22501 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..14 22502 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22503 // CHECK12-NEXT: entry: 22504 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22505 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22506 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 22507 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22508 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22509 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22510 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22511 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22512 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22513 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22514 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22515 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 22516 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22517 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 22518 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 22519 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22520 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22521 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 22522 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 22523 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22524 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22525 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 22526 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22527 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22528 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22529 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22530 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 22531 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22532 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 22533 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 22534 // CHECK12-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 22535 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 22536 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 22537 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 22538 // CHECK12-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22539 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22540 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 22541 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22542 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 22543 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 22544 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22545 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22546 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 22547 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22548 // CHECK12: omp.precond.then: 22549 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 22550 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 22551 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 22552 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22553 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22554 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22555 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 22556 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 22557 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22558 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 22559 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 22560 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22561 // CHECK12: cond.true: 22562 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 22563 // CHECK12-NEXT: br label [[COND_END:%.*]] 22564 // CHECK12: cond.false: 22565 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22566 // CHECK12-NEXT: br label [[COND_END]] 22567 // CHECK12: cond.end: 22568 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 22569 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 22570 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22571 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 22572 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22573 // CHECK12: omp.inner.for.cond: 22574 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22575 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22576 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 22577 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22578 // CHECK12: omp.inner.for.body: 22579 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22580 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22581 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22582 // CHECK12-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 22583 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 22584 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 22585 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22586 // CHECK12: omp.inner.for.inc: 22587 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22588 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22589 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 22590 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 22591 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22592 // CHECK12: omp.inner.for.end: 22593 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22594 // CHECK12: omp.loop.exit: 22595 // CHECK12-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22596 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 22597 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 22598 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22599 // CHECK12: omp.precond.end: 22600 // CHECK12-NEXT: ret void 22601 // 22602 // 22603 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..15 22604 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 22605 // CHECK12-NEXT: entry: 22606 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22607 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22608 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 22609 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 22610 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22611 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22612 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22613 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22614 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 22615 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22616 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22617 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22618 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 22619 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22620 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 22621 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 22622 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22623 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22624 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 22625 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22626 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22627 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22628 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22629 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22630 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22631 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22632 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22633 // CHECK12-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 22634 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22635 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22636 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22637 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22638 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22639 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22640 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22641 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22642 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22643 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 22644 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 22645 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22646 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22647 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22648 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22649 // CHECK12: omp.precond.then: 22650 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 22651 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 22652 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 22653 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22654 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22655 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 22656 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 22657 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22658 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22659 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 22660 // CHECK12-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22661 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 22662 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 22663 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 22664 // CHECK12: omp.dispatch.cond: 22665 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22666 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22667 // CHECK12-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 22668 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22669 // CHECK12: cond.true: 22670 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22671 // CHECK12-NEXT: br label [[COND_END:%.*]] 22672 // CHECK12: cond.false: 22673 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22674 // CHECK12-NEXT: br label [[COND_END]] 22675 // CHECK12: cond.end: 22676 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 22677 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 22678 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22679 // CHECK12-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 22680 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22681 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22682 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 22683 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 22684 // CHECK12: omp.dispatch.body: 22685 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22686 // CHECK12: omp.inner.for.cond: 22687 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22688 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22689 // CHECK12-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 22690 // CHECK12-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22691 // CHECK12: omp.inner.for.body: 22692 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22693 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 22694 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 22695 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 22696 // CHECK12-NEXT: [[TMP23:%.*]] = load double*, double** [[TMP2]], align 4 22697 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 22698 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP23]], i32 [[TMP24]] 22699 // CHECK12-NEXT: [[TMP25:%.*]] = load double, double* [[ARRAYIDX]], align 4 22700 // CHECK12-NEXT: [[TMP26:%.*]] = load double*, double** [[TMP3]], align 4 22701 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 22702 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP26]], i32 [[TMP27]] 22703 // CHECK12-NEXT: [[TMP28:%.*]] = load double, double* [[ARRAYIDX8]], align 4 22704 // CHECK12-NEXT: [[ADD9:%.*]] = fadd double [[TMP25]], [[TMP28]] 22705 // CHECK12-NEXT: [[TMP29:%.*]] = load double*, double** [[TMP1]], align 4 22706 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 22707 // CHECK12-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP29]], i32 [[TMP30]] 22708 // CHECK12-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 22709 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 22710 // CHECK12: omp.body.continue: 22711 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22712 // CHECK12: omp.inner.for.inc: 22713 // CHECK12-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22714 // CHECK12-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP31]], 1 22715 // CHECK12-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 22716 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22717 // CHECK12: omp.inner.for.end: 22718 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 22719 // CHECK12: omp.dispatch.inc: 22720 // CHECK12-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22721 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22722 // CHECK12-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 22723 // CHECK12-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 22724 // CHECK12-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22725 // CHECK12-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22726 // CHECK12-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 22727 // CHECK12-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 22728 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 22729 // CHECK12: omp.dispatch.end: 22730 // CHECK12-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22731 // CHECK12-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 22732 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 22733 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22734 // CHECK12: omp.precond.end: 22735 // CHECK12-NEXT: ret void 22736 // 22737 // 22738 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l536 22739 // CHECK12-SAME: (i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 22740 // CHECK12-NEXT: entry: 22741 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 22742 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 22743 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 22744 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 22745 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 22746 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 22747 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 22748 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 22749 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 22750 // CHECK12-NEXT: ret void 22751 // 22752 // 22753 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..18 22754 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22755 // CHECK12-NEXT: entry: 22756 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22757 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22758 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22759 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22760 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22761 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22762 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22763 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22764 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22765 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22766 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22767 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 22768 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 22769 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22770 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22771 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22772 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22773 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22774 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22775 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22776 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22777 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22778 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22779 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22780 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22781 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22782 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22783 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 22784 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22785 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22786 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22787 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22788 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22789 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22790 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22791 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22792 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22793 // CHECK12: omp.precond.then: 22794 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 22795 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22796 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 22797 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22798 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22799 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22800 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 22801 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 22802 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22803 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22804 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 22805 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 22806 // CHECK12: cond.true: 22807 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22808 // CHECK12-NEXT: br label [[COND_END:%.*]] 22809 // CHECK12: cond.false: 22810 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22811 // CHECK12-NEXT: br label [[COND_END]] 22812 // CHECK12: cond.end: 22813 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 22814 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 22815 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22816 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 22817 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22818 // CHECK12: omp.inner.for.cond: 22819 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22820 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22821 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 22822 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22823 // CHECK12: omp.inner.for.body: 22824 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 22825 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 22826 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], double** [[TMP1]], double** [[TMP2]], double** [[TMP3]]) 22827 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22828 // CHECK12: omp.inner.for.inc: 22829 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 22830 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 22831 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 22832 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 22833 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 22834 // CHECK12: omp.inner.for.end: 22835 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 22836 // CHECK12: omp.loop.exit: 22837 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22838 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 22839 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 22840 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22841 // CHECK12: omp.precond.end: 22842 // CHECK12-NEXT: ret void 22843 // 22844 // 22845 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..19 22846 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22847 // CHECK12-NEXT: entry: 22848 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22849 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22850 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 22851 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 22852 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22853 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22854 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22855 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22856 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22857 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22858 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22859 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22860 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22861 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 22862 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 22863 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22864 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22865 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 22866 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22867 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22868 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22869 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22870 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22871 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 22872 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 22873 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 22874 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 22875 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 22876 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 22877 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 22878 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 22879 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 22880 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22881 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 22882 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 22883 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 22884 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 22885 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 22886 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 22887 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 22888 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 22889 // CHECK12: omp.precond.then: 22890 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 22891 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 22892 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 22893 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 22894 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 22895 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 22896 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 22897 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 22898 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 22899 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22900 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 22901 // CHECK12-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22902 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 22903 // CHECK12-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 22904 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 22905 // CHECK12: omp.dispatch.cond: 22906 // CHECK12-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 22907 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 22908 // CHECK12-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 22909 // CHECK12-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 22910 // CHECK12-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 22911 // CHECK12: omp.dispatch.body: 22912 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 22913 // CHECK12-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 22914 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 22915 // CHECK12: omp.inner.for.cond: 22916 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 22917 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !19 22918 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 22919 // CHECK12-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 22920 // CHECK12: omp.inner.for.body: 22921 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 22922 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 22923 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 22924 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !19 22925 // CHECK12-NEXT: [[TMP21:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !19 22926 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 22927 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP21]], i32 [[TMP22]] 22928 // CHECK12-NEXT: [[TMP23:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !19 22929 // CHECK12-NEXT: [[TMP24:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !19 22930 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 22931 // CHECK12-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 22932 // CHECK12-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX5]], align 4, !llvm.access.group !19 22933 // CHECK12-NEXT: [[ADD6:%.*]] = fadd double [[TMP23]], [[TMP26]] 22934 // CHECK12-NEXT: [[TMP27:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !19 22935 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !19 22936 // CHECK12-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 22937 // CHECK12-NEXT: store double [[ADD6]], double* [[ARRAYIDX7]], align 4, !llvm.access.group !19 22938 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 22939 // CHECK12: omp.body.continue: 22940 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 22941 // CHECK12: omp.inner.for.inc: 22942 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 22943 // CHECK12-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP29]], 1 22944 // CHECK12-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !19 22945 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP20:![0-9]+]] 22946 // CHECK12: omp.inner.for.end: 22947 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 22948 // CHECK12: omp.dispatch.inc: 22949 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 22950 // CHECK12: omp.dispatch.end: 22951 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 22952 // CHECK12: omp.precond.end: 22953 // CHECK12-NEXT: ret void 22954 // 22955 // 22956 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}_main_l562 22957 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], double* [[A:%.*]], double* [[B:%.*]], double* [[C:%.*]]) #[[ATTR1]] { 22958 // CHECK12-NEXT: entry: 22959 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 22960 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 22961 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double*, align 4 22962 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double*, align 4 22963 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double*, align 4 22964 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 22965 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 22966 // CHECK12-NEXT: store double* [[A]], double** [[A_ADDR]], align 4 22967 // CHECK12-NEXT: store double* [[B]], double** [[B_ADDR]], align 4 22968 // CHECK12-NEXT: store double* [[C]], double** [[C_ADDR]], align 4 22969 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, double**, double**, double**)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], double** [[A_ADDR]], double** [[B_ADDR]], double** [[C_ADDR]]) 22970 // CHECK12-NEXT: ret void 22971 // 22972 // 22973 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..22 22974 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 22975 // CHECK12-NEXT: entry: 22976 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 22977 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 22978 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 22979 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 22980 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 22981 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 22982 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 22983 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 22984 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 22985 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 22986 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 22987 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 22988 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 22989 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 22990 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 22991 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 22992 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 22993 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 22994 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 22995 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 22996 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 22997 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 22998 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 22999 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 23000 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 23001 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 23002 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 23003 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 23004 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[A_ADDR]], align 4 23005 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[B_ADDR]], align 4 23006 // CHECK12-NEXT: [[TMP4:%.*]] = load double**, double*** [[C_ADDR]], align 4 23007 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 23008 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 23009 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 23010 // CHECK12-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23011 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23012 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 23013 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23014 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 23015 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 23016 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 23017 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23018 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 23019 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 23020 // CHECK12: omp.precond.then: 23021 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 23022 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 23023 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 23024 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 23025 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 23026 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23027 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 23028 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 23029 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23030 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 23031 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 23032 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 23033 // CHECK12: cond.true: 23034 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 23035 // CHECK12-NEXT: br label [[COND_END:%.*]] 23036 // CHECK12: cond.false: 23037 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23038 // CHECK12-NEXT: br label [[COND_END]] 23039 // CHECK12: cond.end: 23040 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 23041 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 23042 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 23043 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 23044 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 23045 // CHECK12: omp.inner.for.cond: 23046 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23047 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23048 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 23049 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 23050 // CHECK12: omp.inner.for.body: 23051 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 23052 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23053 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23054 // CHECK12-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 23055 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 23056 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, double**, double**, double**, i32)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], double** [[TMP2]], double** [[TMP3]], double** [[TMP4]], i32 [[TMP22]]) 23057 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 23058 // CHECK12: omp.inner.for.inc: 23059 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23060 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 23061 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 23062 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 23063 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 23064 // CHECK12: omp.inner.for.end: 23065 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 23066 // CHECK12: omp.loop.exit: 23067 // CHECK12-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23068 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 23069 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 23070 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 23071 // CHECK12: omp.precond.end: 23072 // CHECK12-NEXT: ret void 23073 // 23074 // 23075 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..23 23076 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], double** nonnull align 4 dereferenceable(4) [[A:%.*]], double** nonnull align 4 dereferenceable(4) [[B:%.*]], double** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 23077 // CHECK12-NEXT: entry: 23078 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 23079 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 23080 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 23081 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 23082 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 23083 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca double**, align 4 23084 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca double**, align 4 23085 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca double**, align 4 23086 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 23087 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 23088 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 23089 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 23090 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 23091 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 23092 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 23093 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 23094 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 23095 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 23096 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 23097 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 23098 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 23099 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 23100 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 23101 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 23102 // CHECK12-NEXT: store double** [[A]], double*** [[A_ADDR]], align 4 23103 // CHECK12-NEXT: store double** [[B]], double*** [[B_ADDR]], align 4 23104 // CHECK12-NEXT: store double** [[C]], double*** [[C_ADDR]], align 4 23105 // CHECK12-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 23106 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 23107 // CHECK12-NEXT: [[TMP1:%.*]] = load double**, double*** [[A_ADDR]], align 4 23108 // CHECK12-NEXT: [[TMP2:%.*]] = load double**, double*** [[B_ADDR]], align 4 23109 // CHECK12-NEXT: [[TMP3:%.*]] = load double**, double*** [[C_ADDR]], align 4 23110 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 23111 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23112 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23113 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 23114 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23115 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 23116 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 23117 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 23118 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23119 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 23120 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 23121 // CHECK12: omp.precond.then: 23122 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 23123 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 23124 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 23125 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 23126 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 23127 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 23128 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 23129 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 23130 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 23131 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 23132 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 23133 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 23134 // CHECK12-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23135 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 23136 // CHECK12-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 23137 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 23138 // CHECK12: omp.dispatch.cond: 23139 // CHECK12-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23140 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 23141 // CHECK12-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 23142 // CHECK12-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 23143 // CHECK12-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 23144 // CHECK12: omp.dispatch.body: 23145 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 23146 // CHECK12-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 23147 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 23148 // CHECK12: omp.inner.for.cond: 23149 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 23150 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !22 23151 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 23152 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 23153 // CHECK12: omp.inner.for.body: 23154 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 23155 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 23156 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 23157 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !22 23158 // CHECK12-NEXT: [[TMP22:%.*]] = load double*, double** [[TMP2]], align 4, !llvm.access.group !22 23159 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 23160 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP22]], i32 [[TMP23]] 23161 // CHECK12-NEXT: [[TMP24:%.*]] = load double, double* [[ARRAYIDX]], align 4, !llvm.access.group !22 23162 // CHECK12-NEXT: [[TMP25:%.*]] = load double*, double** [[TMP3]], align 4, !llvm.access.group !22 23163 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 23164 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds double, double* [[TMP25]], i32 [[TMP26]] 23165 // CHECK12-NEXT: [[TMP27:%.*]] = load double, double* [[ARRAYIDX6]], align 4, !llvm.access.group !22 23166 // CHECK12-NEXT: [[ADD7:%.*]] = fadd double [[TMP24]], [[TMP27]] 23167 // CHECK12-NEXT: [[TMP28:%.*]] = load double*, double** [[TMP1]], align 4, !llvm.access.group !22 23168 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !22 23169 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP28]], i32 [[TMP29]] 23170 // CHECK12-NEXT: store double [[ADD7]], double* [[ARRAYIDX8]], align 4, !llvm.access.group !22 23171 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 23172 // CHECK12: omp.body.continue: 23173 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 23174 // CHECK12: omp.inner.for.inc: 23175 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 23176 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP30]], 1 23177 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !22 23178 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP23:![0-9]+]] 23179 // CHECK12: omp.inner.for.end: 23180 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 23181 // CHECK12: omp.dispatch.inc: 23182 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 23183 // CHECK12: omp.dispatch.end: 23184 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 23185 // CHECK12: omp.precond.end: 23186 // CHECK12-NEXT: ret void 23187 // 23188 // 23189 // CHECK12-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 23190 // CHECK12-SAME: () #[[ATTR3:[0-9]+]] comdat { 23191 // CHECK12-NEXT: entry: 23192 // CHECK12-NEXT: [[A:%.*]] = alloca i32*, align 4 23193 // CHECK12-NEXT: [[B:%.*]] = alloca i32*, align 4 23194 // CHECK12-NEXT: [[C:%.*]] = alloca i32*, align 4 23195 // CHECK12-NEXT: [[N:%.*]] = alloca i32, align 4 23196 // CHECK12-NEXT: [[CH:%.*]] = alloca i32, align 4 23197 // CHECK12-NEXT: [[N_CASTED:%.*]] = alloca i32, align 4 23198 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [4 x i8*], align 4 23199 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [4 x i8*], align 4 23200 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [4 x i8*], align 4 23201 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 23202 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 23203 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 23204 // CHECK12-NEXT: [[N_CASTED3:%.*]] = alloca i32, align 4 23205 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS4:%.*]] = alloca [4 x i8*], align 4 23206 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS5:%.*]] = alloca [4 x i8*], align 4 23207 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS6:%.*]] = alloca [4 x i8*], align 4 23208 // CHECK12-NEXT: [[_TMP7:%.*]] = alloca i32, align 4 23209 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_8:%.*]] = alloca i32, align 4 23210 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_9:%.*]] = alloca i32, align 4 23211 // CHECK12-NEXT: [[CH_CASTED:%.*]] = alloca i32, align 4 23212 // CHECK12-NEXT: [[N_CASTED16:%.*]] = alloca i32, align 4 23213 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS17:%.*]] = alloca [5 x i8*], align 4 23214 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS18:%.*]] = alloca [5 x i8*], align 4 23215 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS19:%.*]] = alloca [5 x i8*], align 4 23216 // CHECK12-NEXT: [[_TMP20:%.*]] = alloca i32, align 4 23217 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_21:%.*]] = alloca i32, align 4 23218 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_22:%.*]] = alloca i32, align 4 23219 // CHECK12-NEXT: [[N_CASTED29:%.*]] = alloca i32, align 4 23220 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS30:%.*]] = alloca [4 x i8*], align 4 23221 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS31:%.*]] = alloca [4 x i8*], align 4 23222 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS32:%.*]] = alloca [4 x i8*], align 4 23223 // CHECK12-NEXT: [[_TMP33:%.*]] = alloca i32, align 4 23224 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_34:%.*]] = alloca i32, align 4 23225 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_35:%.*]] = alloca i32, align 4 23226 // CHECK12-NEXT: [[CH_CASTED42:%.*]] = alloca i32, align 4 23227 // CHECK12-NEXT: [[N_CASTED43:%.*]] = alloca i32, align 4 23228 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS44:%.*]] = alloca [5 x i8*], align 4 23229 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS45:%.*]] = alloca [5 x i8*], align 4 23230 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS46:%.*]] = alloca [5 x i8*], align 4 23231 // CHECK12-NEXT: [[_TMP47:%.*]] = alloca i32, align 4 23232 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_48:%.*]] = alloca i32, align 4 23233 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_49:%.*]] = alloca i32, align 4 23234 // CHECK12-NEXT: [[N_CASTED56:%.*]] = alloca i32, align 4 23235 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS57:%.*]] = alloca [4 x i8*], align 4 23236 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS58:%.*]] = alloca [4 x i8*], align 4 23237 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS59:%.*]] = alloca [4 x i8*], align 4 23238 // CHECK12-NEXT: [[_TMP60:%.*]] = alloca i32, align 4 23239 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_61:%.*]] = alloca i32, align 4 23240 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_62:%.*]] = alloca i32, align 4 23241 // CHECK12-NEXT: [[CH_CASTED69:%.*]] = alloca i32, align 4 23242 // CHECK12-NEXT: [[N_CASTED70:%.*]] = alloca i32, align 4 23243 // CHECK12-NEXT: [[DOTOFFLOAD_BASEPTRS71:%.*]] = alloca [5 x i8*], align 4 23244 // CHECK12-NEXT: [[DOTOFFLOAD_PTRS72:%.*]] = alloca [5 x i8*], align 4 23245 // CHECK12-NEXT: [[DOTOFFLOAD_MAPPERS73:%.*]] = alloca [5 x i8*], align 4 23246 // CHECK12-NEXT: [[_TMP74:%.*]] = alloca i32, align 4 23247 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 23248 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_76:%.*]] = alloca i32, align 4 23249 // CHECK12-NEXT: store i32 10000, i32* [[N]], align 4 23250 // CHECK12-NEXT: store i32 100, i32* [[CH]], align 4 23251 // CHECK12-NEXT: [[TMP0:%.*]] = load i32, i32* [[N]], align 4 23252 // CHECK12-NEXT: store i32 [[TMP0]], i32* [[N_CASTED]], align 4 23253 // CHECK12-NEXT: [[TMP1:%.*]] = load i32, i32* [[N_CASTED]], align 4 23254 // CHECK12-NEXT: [[TMP2:%.*]] = load i32*, i32** [[A]], align 4 23255 // CHECK12-NEXT: [[TMP3:%.*]] = load i32*, i32** [[B]], align 4 23256 // CHECK12-NEXT: [[TMP4:%.*]] = load i32*, i32** [[C]], align 4 23257 // CHECK12-NEXT: [[TMP5:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 23258 // CHECK12-NEXT: [[TMP6:%.*]] = bitcast i8** [[TMP5]] to i32* 23259 // CHECK12-NEXT: store i32 [[TMP1]], i32* [[TMP6]], align 4 23260 // CHECK12-NEXT: [[TMP7:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 23261 // CHECK12-NEXT: [[TMP8:%.*]] = bitcast i8** [[TMP7]] to i32* 23262 // CHECK12-NEXT: store i32 [[TMP1]], i32* [[TMP8]], align 4 23263 // CHECK12-NEXT: [[TMP9:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 0 23264 // CHECK12-NEXT: store i8* null, i8** [[TMP9]], align 4 23265 // CHECK12-NEXT: [[TMP10:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 1 23266 // CHECK12-NEXT: [[TMP11:%.*]] = bitcast i8** [[TMP10]] to i32** 23267 // CHECK12-NEXT: store i32* [[TMP2]], i32** [[TMP11]], align 4 23268 // CHECK12-NEXT: [[TMP12:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 1 23269 // CHECK12-NEXT: [[TMP13:%.*]] = bitcast i8** [[TMP12]] to i32** 23270 // CHECK12-NEXT: store i32* [[TMP2]], i32** [[TMP13]], align 4 23271 // CHECK12-NEXT: [[TMP14:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 1 23272 // CHECK12-NEXT: store i8* null, i8** [[TMP14]], align 4 23273 // CHECK12-NEXT: [[TMP15:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 2 23274 // CHECK12-NEXT: [[TMP16:%.*]] = bitcast i8** [[TMP15]] to i32** 23275 // CHECK12-NEXT: store i32* [[TMP3]], i32** [[TMP16]], align 4 23276 // CHECK12-NEXT: [[TMP17:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 2 23277 // CHECK12-NEXT: [[TMP18:%.*]] = bitcast i8** [[TMP17]] to i32** 23278 // CHECK12-NEXT: store i32* [[TMP3]], i32** [[TMP18]], align 4 23279 // CHECK12-NEXT: [[TMP19:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 2 23280 // CHECK12-NEXT: store i8* null, i8** [[TMP19]], align 4 23281 // CHECK12-NEXT: [[TMP20:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 3 23282 // CHECK12-NEXT: [[TMP21:%.*]] = bitcast i8** [[TMP20]] to i32** 23283 // CHECK12-NEXT: store i32* [[TMP4]], i32** [[TMP21]], align 4 23284 // CHECK12-NEXT: [[TMP22:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 3 23285 // CHECK12-NEXT: [[TMP23:%.*]] = bitcast i8** [[TMP22]] to i32** 23286 // CHECK12-NEXT: store i32* [[TMP4]], i32** [[TMP23]], align 4 23287 // CHECK12-NEXT: [[TMP24:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS]], i32 0, i32 3 23288 // CHECK12-NEXT: store i8* null, i8** [[TMP24]], align 4 23289 // CHECK12-NEXT: [[TMP25:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0 23290 // CHECK12-NEXT: [[TMP26:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS]], i32 0, i32 0 23291 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[N]], align 4 23292 // CHECK12-NEXT: store i32 [[TMP27]], i32* [[DOTCAPTURE_EXPR_]], align 4 23293 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23294 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP28]], 0 23295 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23296 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 23297 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23298 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23299 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP29]], 1 23300 // CHECK12-NEXT: [[TMP30:%.*]] = zext i32 [[ADD]] to i64 23301 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP30]]) 23302 // CHECK12-NEXT: [[TMP31:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42.region_id, i32 4, i8** [[TMP25]], i8** [[TMP26]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.28, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.29, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23303 // CHECK12-NEXT: [[TMP32:%.*]] = icmp ne i32 [[TMP31]], 0 23304 // CHECK12-NEXT: br i1 [[TMP32]], label [[OMP_OFFLOAD_FAILED:%.*]], label [[OMP_OFFLOAD_CONT:%.*]] 23305 // CHECK12: omp_offload.failed: 23306 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42(i32 [[TMP1]], i32* [[TMP2]], i32* [[TMP3]], i32* [[TMP4]]) #[[ATTR2]] 23307 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT]] 23308 // CHECK12: omp_offload.cont: 23309 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[N]], align 4 23310 // CHECK12-NEXT: store i32 [[TMP33]], i32* [[N_CASTED3]], align 4 23311 // CHECK12-NEXT: [[TMP34:%.*]] = load i32, i32* [[N_CASTED3]], align 4 23312 // CHECK12-NEXT: [[TMP35:%.*]] = load i32*, i32** [[A]], align 4 23313 // CHECK12-NEXT: [[TMP36:%.*]] = load i32*, i32** [[B]], align 4 23314 // CHECK12-NEXT: [[TMP37:%.*]] = load i32*, i32** [[C]], align 4 23315 // CHECK12-NEXT: [[TMP38:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 23316 // CHECK12-NEXT: [[TMP39:%.*]] = bitcast i8** [[TMP38]] to i32* 23317 // CHECK12-NEXT: store i32 [[TMP34]], i32* [[TMP39]], align 4 23318 // CHECK12-NEXT: [[TMP40:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 23319 // CHECK12-NEXT: [[TMP41:%.*]] = bitcast i8** [[TMP40]] to i32* 23320 // CHECK12-NEXT: store i32 [[TMP34]], i32* [[TMP41]], align 4 23321 // CHECK12-NEXT: [[TMP42:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 0 23322 // CHECK12-NEXT: store i8* null, i8** [[TMP42]], align 4 23323 // CHECK12-NEXT: [[TMP43:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 1 23324 // CHECK12-NEXT: [[TMP44:%.*]] = bitcast i8** [[TMP43]] to i32** 23325 // CHECK12-NEXT: store i32* [[TMP35]], i32** [[TMP44]], align 4 23326 // CHECK12-NEXT: [[TMP45:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 1 23327 // CHECK12-NEXT: [[TMP46:%.*]] = bitcast i8** [[TMP45]] to i32** 23328 // CHECK12-NEXT: store i32* [[TMP35]], i32** [[TMP46]], align 4 23329 // CHECK12-NEXT: [[TMP47:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 1 23330 // CHECK12-NEXT: store i8* null, i8** [[TMP47]], align 4 23331 // CHECK12-NEXT: [[TMP48:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 2 23332 // CHECK12-NEXT: [[TMP49:%.*]] = bitcast i8** [[TMP48]] to i32** 23333 // CHECK12-NEXT: store i32* [[TMP36]], i32** [[TMP49]], align 4 23334 // CHECK12-NEXT: [[TMP50:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 2 23335 // CHECK12-NEXT: [[TMP51:%.*]] = bitcast i8** [[TMP50]] to i32** 23336 // CHECK12-NEXT: store i32* [[TMP36]], i32** [[TMP51]], align 4 23337 // CHECK12-NEXT: [[TMP52:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 2 23338 // CHECK12-NEXT: store i8* null, i8** [[TMP52]], align 4 23339 // CHECK12-NEXT: [[TMP53:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 3 23340 // CHECK12-NEXT: [[TMP54:%.*]] = bitcast i8** [[TMP53]] to i32** 23341 // CHECK12-NEXT: store i32* [[TMP37]], i32** [[TMP54]], align 4 23342 // CHECK12-NEXT: [[TMP55:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 3 23343 // CHECK12-NEXT: [[TMP56:%.*]] = bitcast i8** [[TMP55]] to i32** 23344 // CHECK12-NEXT: store i32* [[TMP37]], i32** [[TMP56]], align 4 23345 // CHECK12-NEXT: [[TMP57:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS6]], i32 0, i32 3 23346 // CHECK12-NEXT: store i8* null, i8** [[TMP57]], align 4 23347 // CHECK12-NEXT: [[TMP58:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS4]], i32 0, i32 0 23348 // CHECK12-NEXT: [[TMP59:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS5]], i32 0, i32 0 23349 // CHECK12-NEXT: [[TMP60:%.*]] = load i32, i32* [[N]], align 4 23350 // CHECK12-NEXT: store i32 [[TMP60]], i32* [[DOTCAPTURE_EXPR_8]], align 4 23351 // CHECK12-NEXT: [[TMP61:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_8]], align 4 23352 // CHECK12-NEXT: [[SUB10:%.*]] = sub nsw i32 [[TMP61]], 0 23353 // CHECK12-NEXT: [[DIV11:%.*]] = sdiv i32 [[SUB10]], 1 23354 // CHECK12-NEXT: [[SUB12:%.*]] = sub nsw i32 [[DIV11]], 1 23355 // CHECK12-NEXT: store i32 [[SUB12]], i32* [[DOTCAPTURE_EXPR_9]], align 4 23356 // CHECK12-NEXT: [[TMP62:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_9]], align 4 23357 // CHECK12-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP62]], 1 23358 // CHECK12-NEXT: [[TMP63:%.*]] = zext i32 [[ADD13]] to i64 23359 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP63]]) 23360 // CHECK12-NEXT: [[TMP64:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51.region_id, i32 4, i8** [[TMP58]], i8** [[TMP59]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.32, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.33, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23361 // CHECK12-NEXT: [[TMP65:%.*]] = icmp ne i32 [[TMP64]], 0 23362 // CHECK12-NEXT: br i1 [[TMP65]], label [[OMP_OFFLOAD_FAILED14:%.*]], label [[OMP_OFFLOAD_CONT15:%.*]] 23363 // CHECK12: omp_offload.failed14: 23364 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51(i32 [[TMP34]], i32* [[TMP35]], i32* [[TMP36]], i32* [[TMP37]]) #[[ATTR2]] 23365 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT15]] 23366 // CHECK12: omp_offload.cont15: 23367 // CHECK12-NEXT: [[TMP66:%.*]] = load i32, i32* [[CH]], align 4 23368 // CHECK12-NEXT: store i32 [[TMP66]], i32* [[CH_CASTED]], align 4 23369 // CHECK12-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH_CASTED]], align 4 23370 // CHECK12-NEXT: [[TMP68:%.*]] = load i32, i32* [[N]], align 4 23371 // CHECK12-NEXT: store i32 [[TMP68]], i32* [[N_CASTED16]], align 4 23372 // CHECK12-NEXT: [[TMP69:%.*]] = load i32, i32* [[N_CASTED16]], align 4 23373 // CHECK12-NEXT: [[TMP70:%.*]] = load i32*, i32** [[A]], align 4 23374 // CHECK12-NEXT: [[TMP71:%.*]] = load i32*, i32** [[B]], align 4 23375 // CHECK12-NEXT: [[TMP72:%.*]] = load i32*, i32** [[C]], align 4 23376 // CHECK12-NEXT: [[TMP73:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 23377 // CHECK12-NEXT: [[TMP74:%.*]] = bitcast i8** [[TMP73]] to i32* 23378 // CHECK12-NEXT: store i32 [[TMP67]], i32* [[TMP74]], align 4 23379 // CHECK12-NEXT: [[TMP75:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 23380 // CHECK12-NEXT: [[TMP76:%.*]] = bitcast i8** [[TMP75]] to i32* 23381 // CHECK12-NEXT: store i32 [[TMP67]], i32* [[TMP76]], align 4 23382 // CHECK12-NEXT: [[TMP77:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 0 23383 // CHECK12-NEXT: store i8* null, i8** [[TMP77]], align 4 23384 // CHECK12-NEXT: [[TMP78:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 1 23385 // CHECK12-NEXT: [[TMP79:%.*]] = bitcast i8** [[TMP78]] to i32* 23386 // CHECK12-NEXT: store i32 [[TMP69]], i32* [[TMP79]], align 4 23387 // CHECK12-NEXT: [[TMP80:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 1 23388 // CHECK12-NEXT: [[TMP81:%.*]] = bitcast i8** [[TMP80]] to i32* 23389 // CHECK12-NEXT: store i32 [[TMP69]], i32* [[TMP81]], align 4 23390 // CHECK12-NEXT: [[TMP82:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 1 23391 // CHECK12-NEXT: store i8* null, i8** [[TMP82]], align 4 23392 // CHECK12-NEXT: [[TMP83:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 2 23393 // CHECK12-NEXT: [[TMP84:%.*]] = bitcast i8** [[TMP83]] to i32** 23394 // CHECK12-NEXT: store i32* [[TMP70]], i32** [[TMP84]], align 4 23395 // CHECK12-NEXT: [[TMP85:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 2 23396 // CHECK12-NEXT: [[TMP86:%.*]] = bitcast i8** [[TMP85]] to i32** 23397 // CHECK12-NEXT: store i32* [[TMP70]], i32** [[TMP86]], align 4 23398 // CHECK12-NEXT: [[TMP87:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 2 23399 // CHECK12-NEXT: store i8* null, i8** [[TMP87]], align 4 23400 // CHECK12-NEXT: [[TMP88:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 3 23401 // CHECK12-NEXT: [[TMP89:%.*]] = bitcast i8** [[TMP88]] to i32** 23402 // CHECK12-NEXT: store i32* [[TMP71]], i32** [[TMP89]], align 4 23403 // CHECK12-NEXT: [[TMP90:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 3 23404 // CHECK12-NEXT: [[TMP91:%.*]] = bitcast i8** [[TMP90]] to i32** 23405 // CHECK12-NEXT: store i32* [[TMP71]], i32** [[TMP91]], align 4 23406 // CHECK12-NEXT: [[TMP92:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 3 23407 // CHECK12-NEXT: store i8* null, i8** [[TMP92]], align 4 23408 // CHECK12-NEXT: [[TMP93:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 4 23409 // CHECK12-NEXT: [[TMP94:%.*]] = bitcast i8** [[TMP93]] to i32** 23410 // CHECK12-NEXT: store i32* [[TMP72]], i32** [[TMP94]], align 4 23411 // CHECK12-NEXT: [[TMP95:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 4 23412 // CHECK12-NEXT: [[TMP96:%.*]] = bitcast i8** [[TMP95]] to i32** 23413 // CHECK12-NEXT: store i32* [[TMP72]], i32** [[TMP96]], align 4 23414 // CHECK12-NEXT: [[TMP97:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS19]], i32 0, i32 4 23415 // CHECK12-NEXT: store i8* null, i8** [[TMP97]], align 4 23416 // CHECK12-NEXT: [[TMP98:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS17]], i32 0, i32 0 23417 // CHECK12-NEXT: [[TMP99:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS18]], i32 0, i32 0 23418 // CHECK12-NEXT: [[TMP100:%.*]] = load i32, i32* [[N]], align 4 23419 // CHECK12-NEXT: store i32 [[TMP100]], i32* [[DOTCAPTURE_EXPR_21]], align 4 23420 // CHECK12-NEXT: [[TMP101:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_21]], align 4 23421 // CHECK12-NEXT: [[SUB23:%.*]] = sub nsw i32 [[TMP101]], 0 23422 // CHECK12-NEXT: [[DIV24:%.*]] = sdiv i32 [[SUB23]], 1 23423 // CHECK12-NEXT: [[SUB25:%.*]] = sub nsw i32 [[DIV24]], 1 23424 // CHECK12-NEXT: store i32 [[SUB25]], i32* [[DOTCAPTURE_EXPR_22]], align 4 23425 // CHECK12-NEXT: [[TMP102:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_22]], align 4 23426 // CHECK12-NEXT: [[ADD26:%.*]] = add nsw i32 [[TMP102]], 1 23427 // CHECK12-NEXT: [[TMP103:%.*]] = zext i32 [[ADD26]] to i64 23428 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP103]]) 23429 // CHECK12-NEXT: [[TMP104:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59.region_id, i32 5, i8** [[TMP98]], i8** [[TMP99]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.36, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.37, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23430 // CHECK12-NEXT: [[TMP105:%.*]] = icmp ne i32 [[TMP104]], 0 23431 // CHECK12-NEXT: br i1 [[TMP105]], label [[OMP_OFFLOAD_FAILED27:%.*]], label [[OMP_OFFLOAD_CONT28:%.*]] 23432 // CHECK12: omp_offload.failed27: 23433 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59(i32 [[TMP67]], i32 [[TMP69]], i32* [[TMP70]], i32* [[TMP71]], i32* [[TMP72]]) #[[ATTR2]] 23434 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT28]] 23435 // CHECK12: omp_offload.cont28: 23436 // CHECK12-NEXT: [[TMP106:%.*]] = load i32, i32* [[N]], align 4 23437 // CHECK12-NEXT: store i32 [[TMP106]], i32* [[N_CASTED29]], align 4 23438 // CHECK12-NEXT: [[TMP107:%.*]] = load i32, i32* [[N_CASTED29]], align 4 23439 // CHECK12-NEXT: [[TMP108:%.*]] = load i32*, i32** [[A]], align 4 23440 // CHECK12-NEXT: [[TMP109:%.*]] = load i32*, i32** [[B]], align 4 23441 // CHECK12-NEXT: [[TMP110:%.*]] = load i32*, i32** [[C]], align 4 23442 // CHECK12-NEXT: [[TMP111:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 23443 // CHECK12-NEXT: [[TMP112:%.*]] = bitcast i8** [[TMP111]] to i32* 23444 // CHECK12-NEXT: store i32 [[TMP107]], i32* [[TMP112]], align 4 23445 // CHECK12-NEXT: [[TMP113:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 23446 // CHECK12-NEXT: [[TMP114:%.*]] = bitcast i8** [[TMP113]] to i32* 23447 // CHECK12-NEXT: store i32 [[TMP107]], i32* [[TMP114]], align 4 23448 // CHECK12-NEXT: [[TMP115:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 0 23449 // CHECK12-NEXT: store i8* null, i8** [[TMP115]], align 4 23450 // CHECK12-NEXT: [[TMP116:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 1 23451 // CHECK12-NEXT: [[TMP117:%.*]] = bitcast i8** [[TMP116]] to i32** 23452 // CHECK12-NEXT: store i32* [[TMP108]], i32** [[TMP117]], align 4 23453 // CHECK12-NEXT: [[TMP118:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 1 23454 // CHECK12-NEXT: [[TMP119:%.*]] = bitcast i8** [[TMP118]] to i32** 23455 // CHECK12-NEXT: store i32* [[TMP108]], i32** [[TMP119]], align 4 23456 // CHECK12-NEXT: [[TMP120:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 1 23457 // CHECK12-NEXT: store i8* null, i8** [[TMP120]], align 4 23458 // CHECK12-NEXT: [[TMP121:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 2 23459 // CHECK12-NEXT: [[TMP122:%.*]] = bitcast i8** [[TMP121]] to i32** 23460 // CHECK12-NEXT: store i32* [[TMP109]], i32** [[TMP122]], align 4 23461 // CHECK12-NEXT: [[TMP123:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 2 23462 // CHECK12-NEXT: [[TMP124:%.*]] = bitcast i8** [[TMP123]] to i32** 23463 // CHECK12-NEXT: store i32* [[TMP109]], i32** [[TMP124]], align 4 23464 // CHECK12-NEXT: [[TMP125:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 2 23465 // CHECK12-NEXT: store i8* null, i8** [[TMP125]], align 4 23466 // CHECK12-NEXT: [[TMP126:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 3 23467 // CHECK12-NEXT: [[TMP127:%.*]] = bitcast i8** [[TMP126]] to i32** 23468 // CHECK12-NEXT: store i32* [[TMP110]], i32** [[TMP127]], align 4 23469 // CHECK12-NEXT: [[TMP128:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 3 23470 // CHECK12-NEXT: [[TMP129:%.*]] = bitcast i8** [[TMP128]] to i32** 23471 // CHECK12-NEXT: store i32* [[TMP110]], i32** [[TMP129]], align 4 23472 // CHECK12-NEXT: [[TMP130:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS32]], i32 0, i32 3 23473 // CHECK12-NEXT: store i8* null, i8** [[TMP130]], align 4 23474 // CHECK12-NEXT: [[TMP131:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS30]], i32 0, i32 0 23475 // CHECK12-NEXT: [[TMP132:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS31]], i32 0, i32 0 23476 // CHECK12-NEXT: [[TMP133:%.*]] = load i32, i32* [[N]], align 4 23477 // CHECK12-NEXT: store i32 [[TMP133]], i32* [[DOTCAPTURE_EXPR_34]], align 4 23478 // CHECK12-NEXT: [[TMP134:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_34]], align 4 23479 // CHECK12-NEXT: [[SUB36:%.*]] = sub nsw i32 [[TMP134]], 0 23480 // CHECK12-NEXT: [[DIV37:%.*]] = sdiv i32 [[SUB36]], 1 23481 // CHECK12-NEXT: [[SUB38:%.*]] = sub nsw i32 [[DIV37]], 1 23482 // CHECK12-NEXT: store i32 [[SUB38]], i32* [[DOTCAPTURE_EXPR_35]], align 4 23483 // CHECK12-NEXT: [[TMP135:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_35]], align 4 23484 // CHECK12-NEXT: [[ADD39:%.*]] = add nsw i32 [[TMP135]], 1 23485 // CHECK12-NEXT: [[TMP136:%.*]] = zext i32 [[ADD39]] to i64 23486 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP136]]) 23487 // CHECK12-NEXT: [[TMP137:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67.region_id, i32 4, i8** [[TMP131]], i8** [[TMP132]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.40, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.41, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23488 // CHECK12-NEXT: [[TMP138:%.*]] = icmp ne i32 [[TMP137]], 0 23489 // CHECK12-NEXT: br i1 [[TMP138]], label [[OMP_OFFLOAD_FAILED40:%.*]], label [[OMP_OFFLOAD_CONT41:%.*]] 23490 // CHECK12: omp_offload.failed40: 23491 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67(i32 [[TMP107]], i32* [[TMP108]], i32* [[TMP109]], i32* [[TMP110]]) #[[ATTR2]] 23492 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT41]] 23493 // CHECK12: omp_offload.cont41: 23494 // CHECK12-NEXT: [[TMP139:%.*]] = load i32, i32* [[CH]], align 4 23495 // CHECK12-NEXT: store i32 [[TMP139]], i32* [[CH_CASTED42]], align 4 23496 // CHECK12-NEXT: [[TMP140:%.*]] = load i32, i32* [[CH_CASTED42]], align 4 23497 // CHECK12-NEXT: [[TMP141:%.*]] = load i32, i32* [[N]], align 4 23498 // CHECK12-NEXT: store i32 [[TMP141]], i32* [[N_CASTED43]], align 4 23499 // CHECK12-NEXT: [[TMP142:%.*]] = load i32, i32* [[N_CASTED43]], align 4 23500 // CHECK12-NEXT: [[TMP143:%.*]] = load i32*, i32** [[A]], align 4 23501 // CHECK12-NEXT: [[TMP144:%.*]] = load i32*, i32** [[B]], align 4 23502 // CHECK12-NEXT: [[TMP145:%.*]] = load i32*, i32** [[C]], align 4 23503 // CHECK12-NEXT: [[TMP146:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 23504 // CHECK12-NEXT: [[TMP147:%.*]] = bitcast i8** [[TMP146]] to i32* 23505 // CHECK12-NEXT: store i32 [[TMP140]], i32* [[TMP147]], align 4 23506 // CHECK12-NEXT: [[TMP148:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 23507 // CHECK12-NEXT: [[TMP149:%.*]] = bitcast i8** [[TMP148]] to i32* 23508 // CHECK12-NEXT: store i32 [[TMP140]], i32* [[TMP149]], align 4 23509 // CHECK12-NEXT: [[TMP150:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 0 23510 // CHECK12-NEXT: store i8* null, i8** [[TMP150]], align 4 23511 // CHECK12-NEXT: [[TMP151:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 1 23512 // CHECK12-NEXT: [[TMP152:%.*]] = bitcast i8** [[TMP151]] to i32* 23513 // CHECK12-NEXT: store i32 [[TMP142]], i32* [[TMP152]], align 4 23514 // CHECK12-NEXT: [[TMP153:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 1 23515 // CHECK12-NEXT: [[TMP154:%.*]] = bitcast i8** [[TMP153]] to i32* 23516 // CHECK12-NEXT: store i32 [[TMP142]], i32* [[TMP154]], align 4 23517 // CHECK12-NEXT: [[TMP155:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 1 23518 // CHECK12-NEXT: store i8* null, i8** [[TMP155]], align 4 23519 // CHECK12-NEXT: [[TMP156:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 2 23520 // CHECK12-NEXT: [[TMP157:%.*]] = bitcast i8** [[TMP156]] to i32** 23521 // CHECK12-NEXT: store i32* [[TMP143]], i32** [[TMP157]], align 4 23522 // CHECK12-NEXT: [[TMP158:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 2 23523 // CHECK12-NEXT: [[TMP159:%.*]] = bitcast i8** [[TMP158]] to i32** 23524 // CHECK12-NEXT: store i32* [[TMP143]], i32** [[TMP159]], align 4 23525 // CHECK12-NEXT: [[TMP160:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 2 23526 // CHECK12-NEXT: store i8* null, i8** [[TMP160]], align 4 23527 // CHECK12-NEXT: [[TMP161:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 3 23528 // CHECK12-NEXT: [[TMP162:%.*]] = bitcast i8** [[TMP161]] to i32** 23529 // CHECK12-NEXT: store i32* [[TMP144]], i32** [[TMP162]], align 4 23530 // CHECK12-NEXT: [[TMP163:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 3 23531 // CHECK12-NEXT: [[TMP164:%.*]] = bitcast i8** [[TMP163]] to i32** 23532 // CHECK12-NEXT: store i32* [[TMP144]], i32** [[TMP164]], align 4 23533 // CHECK12-NEXT: [[TMP165:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 3 23534 // CHECK12-NEXT: store i8* null, i8** [[TMP165]], align 4 23535 // CHECK12-NEXT: [[TMP166:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 4 23536 // CHECK12-NEXT: [[TMP167:%.*]] = bitcast i8** [[TMP166]] to i32** 23537 // CHECK12-NEXT: store i32* [[TMP145]], i32** [[TMP167]], align 4 23538 // CHECK12-NEXT: [[TMP168:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 4 23539 // CHECK12-NEXT: [[TMP169:%.*]] = bitcast i8** [[TMP168]] to i32** 23540 // CHECK12-NEXT: store i32* [[TMP145]], i32** [[TMP169]], align 4 23541 // CHECK12-NEXT: [[TMP170:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS46]], i32 0, i32 4 23542 // CHECK12-NEXT: store i8* null, i8** [[TMP170]], align 4 23543 // CHECK12-NEXT: [[TMP171:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS44]], i32 0, i32 0 23544 // CHECK12-NEXT: [[TMP172:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS45]], i32 0, i32 0 23545 // CHECK12-NEXT: [[TMP173:%.*]] = load i32, i32* [[N]], align 4 23546 // CHECK12-NEXT: store i32 [[TMP173]], i32* [[DOTCAPTURE_EXPR_48]], align 4 23547 // CHECK12-NEXT: [[TMP174:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_48]], align 4 23548 // CHECK12-NEXT: [[SUB50:%.*]] = sub nsw i32 [[TMP174]], 0 23549 // CHECK12-NEXT: [[DIV51:%.*]] = sdiv i32 [[SUB50]], 1 23550 // CHECK12-NEXT: [[SUB52:%.*]] = sub nsw i32 [[DIV51]], 1 23551 // CHECK12-NEXT: store i32 [[SUB52]], i32* [[DOTCAPTURE_EXPR_49]], align 4 23552 // CHECK12-NEXT: [[TMP175:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_49]], align 4 23553 // CHECK12-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP175]], 1 23554 // CHECK12-NEXT: [[TMP176:%.*]] = zext i32 [[ADD53]] to i64 23555 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP176]]) 23556 // CHECK12-NEXT: [[TMP177:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75.region_id, i32 5, i8** [[TMP171]], i8** [[TMP172]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.44, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.45, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23557 // CHECK12-NEXT: [[TMP178:%.*]] = icmp ne i32 [[TMP177]], 0 23558 // CHECK12-NEXT: br i1 [[TMP178]], label [[OMP_OFFLOAD_FAILED54:%.*]], label [[OMP_OFFLOAD_CONT55:%.*]] 23559 // CHECK12: omp_offload.failed54: 23560 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75(i32 [[TMP140]], i32 [[TMP142]], i32* [[TMP143]], i32* [[TMP144]], i32* [[TMP145]]) #[[ATTR2]] 23561 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT55]] 23562 // CHECK12: omp_offload.cont55: 23563 // CHECK12-NEXT: [[TMP179:%.*]] = load i32, i32* [[N]], align 4 23564 // CHECK12-NEXT: store i32 [[TMP179]], i32* [[N_CASTED56]], align 4 23565 // CHECK12-NEXT: [[TMP180:%.*]] = load i32, i32* [[N_CASTED56]], align 4 23566 // CHECK12-NEXT: [[TMP181:%.*]] = load i32*, i32** [[A]], align 4 23567 // CHECK12-NEXT: [[TMP182:%.*]] = load i32*, i32** [[B]], align 4 23568 // CHECK12-NEXT: [[TMP183:%.*]] = load i32*, i32** [[C]], align 4 23569 // CHECK12-NEXT: [[TMP184:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 23570 // CHECK12-NEXT: [[TMP185:%.*]] = bitcast i8** [[TMP184]] to i32* 23571 // CHECK12-NEXT: store i32 [[TMP180]], i32* [[TMP185]], align 4 23572 // CHECK12-NEXT: [[TMP186:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 23573 // CHECK12-NEXT: [[TMP187:%.*]] = bitcast i8** [[TMP186]] to i32* 23574 // CHECK12-NEXT: store i32 [[TMP180]], i32* [[TMP187]], align 4 23575 // CHECK12-NEXT: [[TMP188:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 0 23576 // CHECK12-NEXT: store i8* null, i8** [[TMP188]], align 4 23577 // CHECK12-NEXT: [[TMP189:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 1 23578 // CHECK12-NEXT: [[TMP190:%.*]] = bitcast i8** [[TMP189]] to i32** 23579 // CHECK12-NEXT: store i32* [[TMP181]], i32** [[TMP190]], align 4 23580 // CHECK12-NEXT: [[TMP191:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 1 23581 // CHECK12-NEXT: [[TMP192:%.*]] = bitcast i8** [[TMP191]] to i32** 23582 // CHECK12-NEXT: store i32* [[TMP181]], i32** [[TMP192]], align 4 23583 // CHECK12-NEXT: [[TMP193:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 1 23584 // CHECK12-NEXT: store i8* null, i8** [[TMP193]], align 4 23585 // CHECK12-NEXT: [[TMP194:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 2 23586 // CHECK12-NEXT: [[TMP195:%.*]] = bitcast i8** [[TMP194]] to i32** 23587 // CHECK12-NEXT: store i32* [[TMP182]], i32** [[TMP195]], align 4 23588 // CHECK12-NEXT: [[TMP196:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 2 23589 // CHECK12-NEXT: [[TMP197:%.*]] = bitcast i8** [[TMP196]] to i32** 23590 // CHECK12-NEXT: store i32* [[TMP182]], i32** [[TMP197]], align 4 23591 // CHECK12-NEXT: [[TMP198:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 2 23592 // CHECK12-NEXT: store i8* null, i8** [[TMP198]], align 4 23593 // CHECK12-NEXT: [[TMP199:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 3 23594 // CHECK12-NEXT: [[TMP200:%.*]] = bitcast i8** [[TMP199]] to i32** 23595 // CHECK12-NEXT: store i32* [[TMP183]], i32** [[TMP200]], align 4 23596 // CHECK12-NEXT: [[TMP201:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 3 23597 // CHECK12-NEXT: [[TMP202:%.*]] = bitcast i8** [[TMP201]] to i32** 23598 // CHECK12-NEXT: store i32* [[TMP183]], i32** [[TMP202]], align 4 23599 // CHECK12-NEXT: [[TMP203:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_MAPPERS59]], i32 0, i32 3 23600 // CHECK12-NEXT: store i8* null, i8** [[TMP203]], align 4 23601 // CHECK12-NEXT: [[TMP204:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_BASEPTRS57]], i32 0, i32 0 23602 // CHECK12-NEXT: [[TMP205:%.*]] = getelementptr inbounds [4 x i8*], [4 x i8*]* [[DOTOFFLOAD_PTRS58]], i32 0, i32 0 23603 // CHECK12-NEXT: [[TMP206:%.*]] = load i32, i32* [[N]], align 4 23604 // CHECK12-NEXT: store i32 [[TMP206]], i32* [[DOTCAPTURE_EXPR_61]], align 4 23605 // CHECK12-NEXT: [[TMP207:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_61]], align 4 23606 // CHECK12-NEXT: [[SUB63:%.*]] = sub nsw i32 [[TMP207]], 0 23607 // CHECK12-NEXT: [[DIV64:%.*]] = sdiv i32 [[SUB63]], 1 23608 // CHECK12-NEXT: [[SUB65:%.*]] = sub nsw i32 [[DIV64]], 1 23609 // CHECK12-NEXT: store i32 [[SUB65]], i32* [[DOTCAPTURE_EXPR_62]], align 4 23610 // CHECK12-NEXT: [[TMP208:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_62]], align 4 23611 // CHECK12-NEXT: [[ADD66:%.*]] = add nsw i32 [[TMP208]], 1 23612 // CHECK12-NEXT: [[TMP209:%.*]] = zext i32 [[ADD66]] to i64 23613 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP209]]) 23614 // CHECK12-NEXT: [[TMP210:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83.region_id, i32 4, i8** [[TMP204]], i8** [[TMP205]], i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_sizes.48, i32 0, i32 0), i64* getelementptr inbounds ([4 x i64], [4 x i64]* @.offload_maptypes.49, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23615 // CHECK12-NEXT: [[TMP211:%.*]] = icmp ne i32 [[TMP210]], 0 23616 // CHECK12-NEXT: br i1 [[TMP211]], label [[OMP_OFFLOAD_FAILED67:%.*]], label [[OMP_OFFLOAD_CONT68:%.*]] 23617 // CHECK12: omp_offload.failed67: 23618 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83(i32 [[TMP180]], i32* [[TMP181]], i32* [[TMP182]], i32* [[TMP183]]) #[[ATTR2]] 23619 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT68]] 23620 // CHECK12: omp_offload.cont68: 23621 // CHECK12-NEXT: [[TMP212:%.*]] = load i32, i32* [[CH]], align 4 23622 // CHECK12-NEXT: store i32 [[TMP212]], i32* [[CH_CASTED69]], align 4 23623 // CHECK12-NEXT: [[TMP213:%.*]] = load i32, i32* [[CH_CASTED69]], align 4 23624 // CHECK12-NEXT: [[TMP214:%.*]] = load i32, i32* [[N]], align 4 23625 // CHECK12-NEXT: store i32 [[TMP214]], i32* [[N_CASTED70]], align 4 23626 // CHECK12-NEXT: [[TMP215:%.*]] = load i32, i32* [[N_CASTED70]], align 4 23627 // CHECK12-NEXT: [[TMP216:%.*]] = load i32*, i32** [[A]], align 4 23628 // CHECK12-NEXT: [[TMP217:%.*]] = load i32*, i32** [[B]], align 4 23629 // CHECK12-NEXT: [[TMP218:%.*]] = load i32*, i32** [[C]], align 4 23630 // CHECK12-NEXT: [[TMP219:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 23631 // CHECK12-NEXT: [[TMP220:%.*]] = bitcast i8** [[TMP219]] to i32* 23632 // CHECK12-NEXT: store i32 [[TMP213]], i32* [[TMP220]], align 4 23633 // CHECK12-NEXT: [[TMP221:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 23634 // CHECK12-NEXT: [[TMP222:%.*]] = bitcast i8** [[TMP221]] to i32* 23635 // CHECK12-NEXT: store i32 [[TMP213]], i32* [[TMP222]], align 4 23636 // CHECK12-NEXT: [[TMP223:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 0 23637 // CHECK12-NEXT: store i8* null, i8** [[TMP223]], align 4 23638 // CHECK12-NEXT: [[TMP224:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 1 23639 // CHECK12-NEXT: [[TMP225:%.*]] = bitcast i8** [[TMP224]] to i32* 23640 // CHECK12-NEXT: store i32 [[TMP215]], i32* [[TMP225]], align 4 23641 // CHECK12-NEXT: [[TMP226:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 1 23642 // CHECK12-NEXT: [[TMP227:%.*]] = bitcast i8** [[TMP226]] to i32* 23643 // CHECK12-NEXT: store i32 [[TMP215]], i32* [[TMP227]], align 4 23644 // CHECK12-NEXT: [[TMP228:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 1 23645 // CHECK12-NEXT: store i8* null, i8** [[TMP228]], align 4 23646 // CHECK12-NEXT: [[TMP229:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 2 23647 // CHECK12-NEXT: [[TMP230:%.*]] = bitcast i8** [[TMP229]] to i32** 23648 // CHECK12-NEXT: store i32* [[TMP216]], i32** [[TMP230]], align 4 23649 // CHECK12-NEXT: [[TMP231:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 2 23650 // CHECK12-NEXT: [[TMP232:%.*]] = bitcast i8** [[TMP231]] to i32** 23651 // CHECK12-NEXT: store i32* [[TMP216]], i32** [[TMP232]], align 4 23652 // CHECK12-NEXT: [[TMP233:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 2 23653 // CHECK12-NEXT: store i8* null, i8** [[TMP233]], align 4 23654 // CHECK12-NEXT: [[TMP234:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 3 23655 // CHECK12-NEXT: [[TMP235:%.*]] = bitcast i8** [[TMP234]] to i32** 23656 // CHECK12-NEXT: store i32* [[TMP217]], i32** [[TMP235]], align 4 23657 // CHECK12-NEXT: [[TMP236:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 3 23658 // CHECK12-NEXT: [[TMP237:%.*]] = bitcast i8** [[TMP236]] to i32** 23659 // CHECK12-NEXT: store i32* [[TMP217]], i32** [[TMP237]], align 4 23660 // CHECK12-NEXT: [[TMP238:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 3 23661 // CHECK12-NEXT: store i8* null, i8** [[TMP238]], align 4 23662 // CHECK12-NEXT: [[TMP239:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 4 23663 // CHECK12-NEXT: [[TMP240:%.*]] = bitcast i8** [[TMP239]] to i32** 23664 // CHECK12-NEXT: store i32* [[TMP218]], i32** [[TMP240]], align 4 23665 // CHECK12-NEXT: [[TMP241:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 4 23666 // CHECK12-NEXT: [[TMP242:%.*]] = bitcast i8** [[TMP241]] to i32** 23667 // CHECK12-NEXT: store i32* [[TMP218]], i32** [[TMP242]], align 4 23668 // CHECK12-NEXT: [[TMP243:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_MAPPERS73]], i32 0, i32 4 23669 // CHECK12-NEXT: store i8* null, i8** [[TMP243]], align 4 23670 // CHECK12-NEXT: [[TMP244:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_BASEPTRS71]], i32 0, i32 0 23671 // CHECK12-NEXT: [[TMP245:%.*]] = getelementptr inbounds [5 x i8*], [5 x i8*]* [[DOTOFFLOAD_PTRS72]], i32 0, i32 0 23672 // CHECK12-NEXT: [[TMP246:%.*]] = load i32, i32* [[N]], align 4 23673 // CHECK12-NEXT: store i32 [[TMP246]], i32* [[DOTCAPTURE_EXPR_75]], align 4 23674 // CHECK12-NEXT: [[TMP247:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_75]], align 4 23675 // CHECK12-NEXT: [[SUB77:%.*]] = sub nsw i32 [[TMP247]], 0 23676 // CHECK12-NEXT: [[DIV78:%.*]] = sdiv i32 [[SUB77]], 1 23677 // CHECK12-NEXT: [[SUB79:%.*]] = sub nsw i32 [[DIV78]], 1 23678 // CHECK12-NEXT: store i32 [[SUB79]], i32* [[DOTCAPTURE_EXPR_76]], align 4 23679 // CHECK12-NEXT: [[TMP248:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_76]], align 4 23680 // CHECK12-NEXT: [[ADD80:%.*]] = add nsw i32 [[TMP248]], 1 23681 // CHECK12-NEXT: [[TMP249:%.*]] = zext i32 [[ADD80]] to i64 23682 // CHECK12-NEXT: call void @__kmpc_push_target_tripcount_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i64 [[TMP249]]) 23683 // CHECK12-NEXT: [[TMP250:%.*]] = call i32 @__tgt_target_teams_mapper(%struct.ident_t* @[[GLOB3]], i64 -1, i8* @.{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91.region_id, i32 5, i8** [[TMP244]], i8** [[TMP245]], i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_sizes.52, i32 0, i32 0), i64* getelementptr inbounds ([5 x i64], [5 x i64]* @.offload_maptypes.53, i32 0, i32 0), i8** null, i8** null, i32 0, i32 0) 23684 // CHECK12-NEXT: [[TMP251:%.*]] = icmp ne i32 [[TMP250]], 0 23685 // CHECK12-NEXT: br i1 [[TMP251]], label [[OMP_OFFLOAD_FAILED81:%.*]], label [[OMP_OFFLOAD_CONT82:%.*]] 23686 // CHECK12: omp_offload.failed81: 23687 // CHECK12-NEXT: call void @{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91(i32 [[TMP213]], i32 [[TMP215]], i32* [[TMP216]], i32* [[TMP217]], i32* [[TMP218]]) #[[ATTR2]] 23688 // CHECK12-NEXT: br label [[OMP_OFFLOAD_CONT82]] 23689 // CHECK12: omp_offload.cont82: 23690 // CHECK12-NEXT: ret i32 0 23691 // 23692 // 23693 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l42 23694 // CHECK12-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 23695 // CHECK12-NEXT: entry: 23696 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 23697 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 23698 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 23699 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 23700 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 23701 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 23702 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 23703 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 23704 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..26 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 23705 // CHECK12-NEXT: ret void 23706 // 23707 // 23708 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..26 23709 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 23710 // CHECK12-NEXT: entry: 23711 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 23712 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 23713 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 23714 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 23715 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 23716 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 23717 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 23718 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 23719 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 23720 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 23721 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 23722 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 23723 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 23724 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 23725 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 23726 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 23727 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 23728 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 23729 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 23730 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 23731 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 23732 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 23733 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 23734 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 23735 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 23736 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 23737 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 23738 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 23739 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23740 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 23741 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23742 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 23743 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23744 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 23745 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23746 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 23747 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 23748 // CHECK12: omp.precond.then: 23749 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 23750 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23751 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 23752 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 23753 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 23754 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23755 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 23756 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 23757 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23758 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23759 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 23760 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 23761 // CHECK12: cond.true: 23762 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23763 // CHECK12-NEXT: br label [[COND_END:%.*]] 23764 // CHECK12: cond.false: 23765 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23766 // CHECK12-NEXT: br label [[COND_END]] 23767 // CHECK12: cond.end: 23768 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 23769 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 23770 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 23771 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 23772 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 23773 // CHECK12: omp.inner.for.cond: 23774 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23775 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23776 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 23777 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 23778 // CHECK12: omp.inner.for.body: 23779 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 23780 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23781 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..27 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 23782 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 23783 // CHECK12: omp.inner.for.inc: 23784 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23785 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 23786 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 23787 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 23788 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 23789 // CHECK12: omp.inner.for.end: 23790 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 23791 // CHECK12: omp.loop.exit: 23792 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23793 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 23794 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 23795 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 23796 // CHECK12: omp.precond.end: 23797 // CHECK12-NEXT: ret void 23798 // 23799 // 23800 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..27 23801 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 23802 // CHECK12-NEXT: entry: 23803 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 23804 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 23805 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 23806 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 23807 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 23808 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 23809 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 23810 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 23811 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 23812 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 23813 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 23814 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 23815 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 23816 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 23817 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 23818 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 23819 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 23820 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 23821 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 23822 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 23823 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 23824 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 23825 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 23826 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 23827 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 23828 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 23829 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 23830 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 23831 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 23832 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 23833 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 23834 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 23835 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23836 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 23837 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23838 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 23839 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23840 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 23841 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23842 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 23843 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 23844 // CHECK12: omp.precond.then: 23845 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 23846 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23847 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 23848 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 23849 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 23850 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 23851 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 23852 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 23853 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 23854 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23855 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 23856 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 23857 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 23858 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23859 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 23860 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 23861 // CHECK12: cond.true: 23862 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23863 // CHECK12-NEXT: br label [[COND_END:%.*]] 23864 // CHECK12: cond.false: 23865 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 23866 // CHECK12-NEXT: br label [[COND_END]] 23867 // CHECK12: cond.end: 23868 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 23869 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 23870 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 23871 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 23872 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 23873 // CHECK12: omp.inner.for.cond: 23874 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23875 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 23876 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 23877 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 23878 // CHECK12: omp.inner.for.body: 23879 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23880 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 23881 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 23882 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 23883 // CHECK12-NEXT: [[TMP20:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23884 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[TMP20]], align 4 23885 // CHECK12-NEXT: [[TMP22:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* @[[GLOB3]], i32 [[TMP21]], i32 2) 23886 // CHECK12-NEXT: [[TMP23:%.*]] = icmp ne i32 [[TMP22]], 0 23887 // CHECK12-NEXT: br i1 [[TMP23]], label [[DOTCANCEL_EXIT:%.*]], label [[DOTCANCEL_CONTINUE:%.*]] 23888 // CHECK12: .cancel.exit: 23889 // CHECK12-NEXT: br label [[CANCEL_EXIT:%.*]] 23890 // CHECK12: .cancel.continue: 23891 // CHECK12-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP2]], align 4 23892 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4 23893 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 23894 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 23895 // CHECK12-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP3]], align 4 23896 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4 23897 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 23898 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 23899 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 23900 // CHECK12-NEXT: [[TMP30:%.*]] = load i32*, i32** [[TMP1]], align 4 23901 // CHECK12-NEXT: [[TMP31:%.*]] = load i32, i32* [[I3]], align 4 23902 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i32 [[TMP31]] 23903 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 23904 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 23905 // CHECK12: omp.body.continue: 23906 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 23907 // CHECK12: omp.inner.for.inc: 23908 // CHECK12-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 23909 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP32]], 1 23910 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 23911 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 23912 // CHECK12: omp.inner.for.end: 23913 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 23914 // CHECK12: omp.loop.exit: 23915 // CHECK12-NEXT: [[TMP33:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23916 // CHECK12-NEXT: [[TMP34:%.*]] = load i32, i32* [[TMP33]], align 4 23917 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP34]]) 23918 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 23919 // CHECK12: cancel.exit: 23920 // CHECK12-NEXT: [[TMP35:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23921 // CHECK12-NEXT: [[TMP36:%.*]] = load i32, i32* [[TMP35]], align 4 23922 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP36]]) 23923 // CHECK12-NEXT: br label [[CANCEL_CONT:%.*]] 23924 // CHECK12: omp.precond.end: 23925 // CHECK12-NEXT: br label [[CANCEL_CONT]] 23926 // CHECK12: cancel.cont: 23927 // CHECK12-NEXT: ret void 23928 // 23929 // 23930 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l51 23931 // CHECK12-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 23932 // CHECK12-NEXT: entry: 23933 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 23934 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 23935 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 23936 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 23937 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 23938 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 23939 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 23940 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 23941 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 23942 // CHECK12-NEXT: ret void 23943 // 23944 // 23945 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..30 23946 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 23947 // CHECK12-NEXT: entry: 23948 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 23949 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 23950 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 23951 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 23952 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 23953 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 23954 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 23955 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 23956 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 23957 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 23958 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 23959 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 23960 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 23961 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 23962 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 23963 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 23964 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 23965 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 23966 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 23967 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 23968 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 23969 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 23970 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 23971 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 23972 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 23973 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 23974 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 23975 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 23976 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23977 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 23978 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 23979 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 23980 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 23981 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 23982 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 23983 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 23984 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 23985 // CHECK12: omp.precond.then: 23986 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 23987 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23988 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 23989 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 23990 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 23991 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 23992 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 23993 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 23994 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 23995 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 23996 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 23997 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 23998 // CHECK12: cond.true: 23999 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24000 // CHECK12-NEXT: br label [[COND_END:%.*]] 24001 // CHECK12: cond.false: 24002 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24003 // CHECK12-NEXT: br label [[COND_END]] 24004 // CHECK12: cond.end: 24005 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 24006 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 24007 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24008 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 24009 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24010 // CHECK12: omp.inner.for.cond: 24011 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24012 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24013 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 24014 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24015 // CHECK12: omp.inner.for.body: 24016 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24017 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24018 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 24019 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24020 // CHECK12: omp.inner.for.inc: 24021 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24022 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24023 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 24024 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 24025 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24026 // CHECK12: omp.inner.for.end: 24027 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24028 // CHECK12: omp.loop.exit: 24029 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24030 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 24031 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 24032 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24033 // CHECK12: omp.precond.end: 24034 // CHECK12-NEXT: ret void 24035 // 24036 // 24037 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..31 24038 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24039 // CHECK12-NEXT: entry: 24040 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24041 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24042 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 24043 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 24044 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24045 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24046 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24047 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24048 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24049 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24050 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24051 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24052 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24053 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 24054 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 24055 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24056 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24057 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24058 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24059 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24060 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24061 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24062 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24063 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24064 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24065 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24066 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24067 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24068 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24069 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24070 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24071 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 24072 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24073 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24074 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24075 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24076 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24077 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24078 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24079 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24080 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24081 // CHECK12: omp.precond.then: 24082 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 24083 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24084 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 24085 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24086 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24087 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 24088 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 24089 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24090 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24091 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24092 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 24093 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24094 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24095 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24096 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 24097 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24098 // CHECK12: cond.true: 24099 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24100 // CHECK12-NEXT: br label [[COND_END:%.*]] 24101 // CHECK12: cond.false: 24102 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24103 // CHECK12-NEXT: br label [[COND_END]] 24104 // CHECK12: cond.end: 24105 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 24106 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 24107 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 24108 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 24109 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24110 // CHECK12: omp.inner.for.cond: 24111 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24112 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24113 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 24114 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24115 // CHECK12: omp.inner.for.body: 24116 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24117 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 24118 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 24119 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 24120 // CHECK12-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 24121 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 24122 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 24123 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 24124 // CHECK12-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 24125 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 24126 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 24127 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 24128 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 24129 // CHECK12-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 24130 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 24131 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 24132 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 24133 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 24134 // CHECK12: omp.body.continue: 24135 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24136 // CHECK12: omp.inner.for.inc: 24137 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24138 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 24139 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 24140 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24141 // CHECK12: omp.inner.for.end: 24142 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24143 // CHECK12: omp.loop.exit: 24144 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24145 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 24146 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 24147 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24148 // CHECK12: omp.precond.end: 24149 // CHECK12-NEXT: ret void 24150 // 24151 // 24152 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l59 24153 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 24154 // CHECK12-NEXT: entry: 24155 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 24156 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 24157 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 24158 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 24159 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 24160 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 24161 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 24162 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 24163 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 24164 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 24165 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 24166 // CHECK12-NEXT: ret void 24167 // 24168 // 24169 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..34 24170 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24171 // CHECK12-NEXT: entry: 24172 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24173 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24174 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 24175 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24176 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24177 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24178 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24179 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24180 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24181 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24182 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24183 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24184 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 24185 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 24186 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24187 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24188 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24189 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24190 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24191 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 24192 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24193 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24194 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24195 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24196 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 24197 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24198 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24199 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24200 // CHECK12-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24201 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP1]], align 4 24202 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 24203 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24204 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP6]], 0 24205 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24206 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24207 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24208 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24209 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24210 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP7]] 24211 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24212 // CHECK12: omp.precond.then: 24213 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 24214 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24215 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_COMB_UB]], align 4 24216 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24217 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24218 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP0]], align 4 24219 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24220 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 24221 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 91, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP9]]) 24222 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24223 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24224 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 24225 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24226 // CHECK12: cond.true: 24227 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24228 // CHECK12-NEXT: br label [[COND_END:%.*]] 24229 // CHECK12: cond.false: 24230 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24231 // CHECK12-NEXT: br label [[COND_END]] 24232 // CHECK12: cond.end: 24233 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 24234 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 24235 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24236 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 24237 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24238 // CHECK12: omp.inner.for.cond: 24239 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24240 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24241 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP18]], 1 24242 // CHECK12-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP17]], [[ADD]] 24243 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24244 // CHECK12: omp.inner.for.body: 24245 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24246 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24247 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]]) 24248 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24249 // CHECK12: omp.inner.for.inc: 24250 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24251 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24252 // CHECK12-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP21]], [[TMP22]] 24253 // CHECK12-NEXT: store i32 [[ADD6]], i32* [[DOTOMP_IV]], align 4 24254 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24255 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24256 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 24257 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[DOTOMP_COMB_LB]], align 4 24258 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24259 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24260 // CHECK12-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP25]], [[TMP26]] 24261 // CHECK12-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_COMB_UB]], align 4 24262 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24263 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24264 // CHECK12-NEXT: [[CMP9:%.*]] = icmp sgt i32 [[TMP27]], [[TMP28]] 24265 // CHECK12-NEXT: br i1 [[CMP9]], label [[COND_TRUE10:%.*]], label [[COND_FALSE11:%.*]] 24266 // CHECK12: cond.true10: 24267 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24268 // CHECK12-NEXT: br label [[COND_END12:%.*]] 24269 // CHECK12: cond.false11: 24270 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24271 // CHECK12-NEXT: br label [[COND_END12]] 24272 // CHECK12: cond.end12: 24273 // CHECK12-NEXT: [[COND13:%.*]] = phi i32 [ [[TMP29]], [[COND_TRUE10]] ], [ [[TMP30]], [[COND_FALSE11]] ] 24274 // CHECK12-NEXT: store i32 [[COND13]], i32* [[DOTOMP_COMB_UB]], align 4 24275 // CHECK12-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24276 // CHECK12-NEXT: store i32 [[TMP31]], i32* [[DOTOMP_IV]], align 4 24277 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24278 // CHECK12: omp.inner.for.end: 24279 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24280 // CHECK12: omp.loop.exit: 24281 // CHECK12-NEXT: [[TMP32:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24282 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[TMP32]], align 4 24283 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP33]]) 24284 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24285 // CHECK12: omp.precond.end: 24286 // CHECK12-NEXT: ret void 24287 // 24288 // 24289 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..35 24290 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24291 // CHECK12-NEXT: entry: 24292 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24293 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24294 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 24295 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 24296 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24297 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24298 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24299 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24300 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24301 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24302 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24303 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24304 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24305 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 24306 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 24307 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24308 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24309 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24310 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24311 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24312 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24313 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24314 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24315 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24316 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24317 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24318 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24319 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24320 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24321 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24322 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24323 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 24324 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24325 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24326 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24327 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24328 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24329 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24330 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24331 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24332 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24333 // CHECK12: omp.precond.then: 24334 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 24335 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24336 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 24337 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24338 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24339 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 24340 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 24341 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24342 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24343 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24344 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 24345 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24346 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24347 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24348 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 24349 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24350 // CHECK12: cond.true: 24351 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24352 // CHECK12-NEXT: br label [[COND_END:%.*]] 24353 // CHECK12: cond.false: 24354 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24355 // CHECK12-NEXT: br label [[COND_END]] 24356 // CHECK12: cond.end: 24357 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 24358 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 24359 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 24360 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 24361 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24362 // CHECK12: omp.inner.for.cond: 24363 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24364 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24365 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 24366 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24367 // CHECK12: omp.inner.for.body: 24368 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24369 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 24370 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 24371 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 24372 // CHECK12-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 24373 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 24374 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 24375 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 24376 // CHECK12-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 24377 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 24378 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 24379 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 24380 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 24381 // CHECK12-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 24382 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 24383 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 24384 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 24385 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 24386 // CHECK12: omp.body.continue: 24387 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24388 // CHECK12: omp.inner.for.inc: 24389 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24390 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 24391 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 24392 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24393 // CHECK12: omp.inner.for.end: 24394 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24395 // CHECK12: omp.loop.exit: 24396 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24397 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 24398 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 24399 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24400 // CHECK12: omp.precond.end: 24401 // CHECK12-NEXT: ret void 24402 // 24403 // 24404 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l67 24405 // CHECK12-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 24406 // CHECK12-NEXT: entry: 24407 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 24408 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 24409 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 24410 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 24411 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 24412 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 24413 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 24414 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 24415 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..38 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 24416 // CHECK12-NEXT: ret void 24417 // 24418 // 24419 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..38 24420 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24421 // CHECK12-NEXT: entry: 24422 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24423 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24424 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24425 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24426 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24427 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24428 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24429 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24430 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24431 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24432 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24433 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 24434 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 24435 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24436 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24437 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24438 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24439 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24440 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24441 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24442 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24443 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24444 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24445 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24446 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24447 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24448 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24449 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 24450 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24451 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24452 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24453 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24454 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24455 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24456 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24457 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24458 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24459 // CHECK12: omp.precond.then: 24460 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 24461 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24462 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 24463 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24464 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24465 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24466 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 24467 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24468 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24469 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24470 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 24471 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24472 // CHECK12: cond.true: 24473 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24474 // CHECK12-NEXT: br label [[COND_END:%.*]] 24475 // CHECK12: cond.false: 24476 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24477 // CHECK12-NEXT: br label [[COND_END]] 24478 // CHECK12: cond.end: 24479 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 24480 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 24481 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24482 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 24483 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24484 // CHECK12: omp.inner.for.cond: 24485 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24486 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24487 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 24488 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24489 // CHECK12: omp.inner.for.body: 24490 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24491 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24492 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 24493 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24494 // CHECK12: omp.inner.for.inc: 24495 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24496 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24497 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 24498 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 24499 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24500 // CHECK12: omp.inner.for.end: 24501 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24502 // CHECK12: omp.loop.exit: 24503 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24504 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 24505 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 24506 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24507 // CHECK12: omp.precond.end: 24508 // CHECK12-NEXT: ret void 24509 // 24510 // 24511 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..39 24512 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24513 // CHECK12-NEXT: entry: 24514 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24515 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24516 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 24517 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 24518 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24519 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24520 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24521 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24522 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24523 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24524 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24525 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24526 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24527 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 24528 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 24529 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24530 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24531 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24532 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24533 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24534 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24535 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24536 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24537 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24538 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24539 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24540 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24541 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24542 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24543 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24544 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24545 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 24546 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24547 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24548 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24549 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24550 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24551 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24552 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24553 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24554 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24555 // CHECK12: omp.precond.then: 24556 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 24557 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24558 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 24559 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24560 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24561 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 24562 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 24563 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24564 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24565 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24566 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 24567 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP11]], i32 34, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24568 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24569 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24570 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 24571 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24572 // CHECK12: cond.true: 24573 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24574 // CHECK12-NEXT: br label [[COND_END:%.*]] 24575 // CHECK12: cond.false: 24576 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24577 // CHECK12-NEXT: br label [[COND_END]] 24578 // CHECK12: cond.end: 24579 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 24580 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 24581 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 24582 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 24583 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24584 // CHECK12: omp.inner.for.cond: 24585 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24586 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24587 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 24588 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24589 // CHECK12: omp.inner.for.body: 24590 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24591 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP19]], 1 24592 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 24593 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4 24594 // CHECK12-NEXT: [[TMP20:%.*]] = load i32*, i32** [[TMP2]], align 4 24595 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 24596 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP20]], i32 [[TMP21]] 24597 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 24598 // CHECK12-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP3]], align 4 24599 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I3]], align 4 24600 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 24601 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4 24602 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP22]], [[TMP25]] 24603 // CHECK12-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP1]], align 4 24604 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I3]], align 4 24605 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 24606 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4 24607 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 24608 // CHECK12: omp.body.continue: 24609 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24610 // CHECK12: omp.inner.for.inc: 24611 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24612 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP28]], 1 24613 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4 24614 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24615 // CHECK12: omp.inner.for.end: 24616 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24617 // CHECK12: omp.loop.exit: 24618 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24619 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[TMP29]], align 4 24620 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP30]]) 24621 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24622 // CHECK12: omp.precond.end: 24623 // CHECK12-NEXT: ret void 24624 // 24625 // 24626 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l75 24627 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 24628 // CHECK12-NEXT: entry: 24629 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 24630 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 24631 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 24632 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 24633 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 24634 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 24635 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 24636 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 24637 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 24638 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 24639 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..42 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 24640 // CHECK12-NEXT: ret void 24641 // 24642 // 24643 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..42 24644 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24645 // CHECK12-NEXT: entry: 24646 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24647 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24648 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 24649 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24650 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24651 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24652 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24653 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24654 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24655 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24656 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24657 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 24658 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24659 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 24660 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 24661 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24662 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24663 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 24664 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 24665 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24666 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24667 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 24668 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24669 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24670 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24671 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24672 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 24673 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24674 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24675 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24676 // CHECK12-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24677 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 24678 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 24679 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 24680 // CHECK12-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24681 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24682 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 24683 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24684 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 24685 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 24686 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24687 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24688 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 24689 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24690 // CHECK12: omp.precond.then: 24691 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 24692 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 24693 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 24694 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24695 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24696 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24697 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 24698 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24699 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24700 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 24701 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 24702 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24703 // CHECK12: cond.true: 24704 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 24705 // CHECK12-NEXT: br label [[COND_END:%.*]] 24706 // CHECK12: cond.false: 24707 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24708 // CHECK12-NEXT: br label [[COND_END]] 24709 // CHECK12: cond.end: 24710 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 24711 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 24712 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24713 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 24714 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24715 // CHECK12: omp.inner.for.cond: 24716 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24717 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24718 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 24719 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24720 // CHECK12: omp.inner.for.body: 24721 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24722 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24723 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24724 // CHECK12-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 24725 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 24726 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**, i32)* @.omp_outlined..43 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i32 [[TMP22]]) 24727 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24728 // CHECK12: omp.inner.for.inc: 24729 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24730 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24731 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 24732 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 24733 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24734 // CHECK12: omp.inner.for.end: 24735 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24736 // CHECK12: omp.loop.exit: 24737 // CHECK12-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24738 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 24739 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 24740 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24741 // CHECK12: omp.precond.end: 24742 // CHECK12-NEXT: ret void 24743 // 24744 // 24745 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..43 24746 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 24747 // CHECK12-NEXT: entry: 24748 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24749 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24750 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 24751 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 24752 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24753 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24754 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24755 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24756 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 24757 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24758 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24759 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24760 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 24761 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24762 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 24763 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 24764 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24765 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24766 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 24767 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24768 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24769 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24770 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24771 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24772 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24773 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24774 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24775 // CHECK12-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 24776 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24777 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24778 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24779 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24780 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24781 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24782 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24783 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24784 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24785 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 24786 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 24787 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24788 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24789 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24790 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24791 // CHECK12: omp.precond.then: 24792 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 24793 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 24794 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 24795 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 24796 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24797 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 24798 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 24799 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24800 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24801 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 24802 // CHECK12-NEXT: [[TMP11:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24803 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[TMP11]], align 4 24804 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB2]], i32 [[TMP12]], i32 33, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 [[TMP10]]) 24805 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 24806 // CHECK12: omp.dispatch.cond: 24807 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24808 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24809 // CHECK12-NEXT: [[CMP5:%.*]] = icmp ugt i32 [[TMP13]], [[TMP14]] 24810 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24811 // CHECK12: cond.true: 24812 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 24813 // CHECK12-NEXT: br label [[COND_END:%.*]] 24814 // CHECK12: cond.false: 24815 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24816 // CHECK12-NEXT: br label [[COND_END]] 24817 // CHECK12: cond.end: 24818 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP15]], [[COND_TRUE]] ], [ [[TMP16]], [[COND_FALSE]] ] 24819 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_UB]], align 4 24820 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 24821 // CHECK12-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 24822 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24823 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24824 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 24825 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 24826 // CHECK12: omp.dispatch.body: 24827 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24828 // CHECK12: omp.inner.for.cond: 24829 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24830 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24831 // CHECK12-NEXT: [[CMP7:%.*]] = icmp sle i32 [[TMP20]], [[TMP21]] 24832 // CHECK12-NEXT: br i1 [[CMP7]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24833 // CHECK12: omp.inner.for.body: 24834 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24835 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP22]], 1 24836 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 24837 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I4]], align 4 24838 // CHECK12-NEXT: [[TMP23:%.*]] = load i32*, i32** [[TMP2]], align 4 24839 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[I4]], align 4 24840 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP23]], i32 [[TMP24]] 24841 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 24842 // CHECK12-NEXT: [[TMP26:%.*]] = load i32*, i32** [[TMP3]], align 4 24843 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[I4]], align 4 24844 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP26]], i32 [[TMP27]] 24845 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 24846 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP25]], [[TMP28]] 24847 // CHECK12-NEXT: [[TMP29:%.*]] = load i32*, i32** [[TMP1]], align 4 24848 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[I4]], align 4 24849 // CHECK12-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP29]], i32 [[TMP30]] 24850 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX10]], align 4 24851 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 24852 // CHECK12: omp.body.continue: 24853 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24854 // CHECK12: omp.inner.for.inc: 24855 // CHECK12-NEXT: [[TMP31:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24856 // CHECK12-NEXT: [[ADD11:%.*]] = add nsw i32 [[TMP31]], 1 24857 // CHECK12-NEXT: store i32 [[ADD11]], i32* [[DOTOMP_IV]], align 4 24858 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24859 // CHECK12: omp.inner.for.end: 24860 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 24861 // CHECK12: omp.dispatch.inc: 24862 // CHECK12-NEXT: [[TMP32:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 24863 // CHECK12-NEXT: [[TMP33:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24864 // CHECK12-NEXT: [[ADD12:%.*]] = add nsw i32 [[TMP32]], [[TMP33]] 24865 // CHECK12-NEXT: store i32 [[ADD12]], i32* [[DOTOMP_LB]], align 4 24866 // CHECK12-NEXT: [[TMP34:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 24867 // CHECK12-NEXT: [[TMP35:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24868 // CHECK12-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP34]], [[TMP35]] 24869 // CHECK12-NEXT: store i32 [[ADD13]], i32* [[DOTOMP_UB]], align 4 24870 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 24871 // CHECK12: omp.dispatch.end: 24872 // CHECK12-NEXT: [[TMP36:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24873 // CHECK12-NEXT: [[TMP37:%.*]] = load i32, i32* [[TMP36]], align 4 24874 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP37]]) 24875 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24876 // CHECK12: omp.precond.end: 24877 // CHECK12-NEXT: ret void 24878 // 24879 // 24880 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l83 24881 // CHECK12-SAME: (i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 24882 // CHECK12-NEXT: entry: 24883 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 24884 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 24885 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 24886 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 24887 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 24888 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 24889 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 24890 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 24891 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 4, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..46 to void (i32*, i32*, ...)*), i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 24892 // CHECK12-NEXT: ret void 24893 // 24894 // 24895 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..46 24896 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24897 // CHECK12-NEXT: entry: 24898 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24899 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24900 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24901 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24902 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24903 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24904 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24905 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 24906 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 24907 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 24908 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 24909 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 24910 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 24911 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 24912 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 24913 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 24914 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 24915 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 24916 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 24917 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 24918 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 24919 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 24920 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 24921 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 24922 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 24923 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 24924 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 24925 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 24926 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24927 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 24928 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 24929 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 24930 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 24931 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 24932 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 24933 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 24934 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 24935 // CHECK12: omp.precond.then: 24936 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 24937 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24938 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_COMB_UB]], align 4 24939 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 24940 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 24941 // CHECK12-NEXT: [[TMP8:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24942 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[TMP8]], align 4 24943 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP9]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 24944 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24945 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24946 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sgt i32 [[TMP10]], [[TMP11]] 24947 // CHECK12-NEXT: br i1 [[CMP4]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 24948 // CHECK12: cond.true: 24949 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 24950 // CHECK12-NEXT: br label [[COND_END:%.*]] 24951 // CHECK12: cond.false: 24952 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24953 // CHECK12-NEXT: br label [[COND_END]] 24954 // CHECK12: cond.end: 24955 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP12]], [[COND_TRUE]] ], [ [[TMP13]], [[COND_FALSE]] ] 24956 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 24957 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24958 // CHECK12-NEXT: store i32 [[TMP14]], i32* [[DOTOMP_IV]], align 4 24959 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 24960 // CHECK12: omp.inner.for.cond: 24961 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24962 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24963 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP15]], [[TMP16]] 24964 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 24965 // CHECK12: omp.inner.for.body: 24966 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 24967 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 24968 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 6, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**)* @.omp_outlined..47 to void (i32*, i32*, ...)*), i32 [[TMP17]], i32 [[TMP18]], i32* [[TMP0]], i32** [[TMP1]], i32** [[TMP2]], i32** [[TMP3]]) 24969 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 24970 // CHECK12: omp.inner.for.inc: 24971 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 24972 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 24973 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP19]], [[TMP20]] 24974 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 24975 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 24976 // CHECK12: omp.inner.for.end: 24977 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 24978 // CHECK12: omp.loop.exit: 24979 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 24980 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[TMP21]], align 4 24981 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP22]]) 24982 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 24983 // CHECK12: omp.precond.end: 24984 // CHECK12-NEXT: ret void 24985 // 24986 // 24987 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..47 24988 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 24989 // CHECK12-NEXT: entry: 24990 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 24991 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 24992 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 24993 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 24994 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 24995 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 24996 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 24997 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 24998 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 24999 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 25000 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 25001 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 25002 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 25003 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 25004 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 25005 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 25006 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 25007 // CHECK12-NEXT: [[I3:%.*]] = alloca i32, align 4 25008 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 25009 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 25010 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 25011 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 25012 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 25013 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 25014 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 25015 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 25016 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 25017 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 25018 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 25019 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 25020 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 25021 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_]], align 4 25022 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 25023 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 25024 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 25025 // CHECK12-NEXT: [[SUB2:%.*]] = sub nsw i32 [[DIV]], 1 25026 // CHECK12-NEXT: store i32 [[SUB2]], i32* [[DOTCAPTURE_EXPR_1]], align 4 25027 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 25028 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 25029 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 25030 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 25031 // CHECK12: omp.precond.then: 25032 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 25033 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 25034 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 25035 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 25036 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 25037 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 25038 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 25039 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 25040 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 25041 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 25042 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 25043 // CHECK12-NEXT: [[TMP12:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25044 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[TMP12]], align 4 25045 // CHECK12-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP13]], i32 35, i32 [[TMP10]], i32 [[TMP11]], i32 1, i32 1) 25046 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 25047 // CHECK12: omp.dispatch.cond: 25048 // CHECK12-NEXT: [[TMP14:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25049 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[TMP14]], align 4 25050 // CHECK12-NEXT: [[TMP16:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP15]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 25051 // CHECK12-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP16]], 0 25052 // CHECK12-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 25053 // CHECK12: omp.dispatch.body: 25054 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 25055 // CHECK12-NEXT: store i32 [[TMP17]], i32* [[DOTOMP_IV]], align 4 25056 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 25057 // CHECK12: omp.inner.for.cond: 25058 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 25059 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !25 25060 // CHECK12-NEXT: [[CMP4:%.*]] = icmp sle i32 [[TMP18]], [[TMP19]] 25061 // CHECK12-NEXT: br i1 [[CMP4]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 25062 // CHECK12: omp.inner.for.body: 25063 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 25064 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP20]], 1 25065 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 25066 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I3]], align 4, !llvm.access.group !25 25067 // CHECK12-NEXT: [[TMP21:%.*]] = load i32*, i32** [[TMP2]], align 4, !llvm.access.group !25 25068 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 25069 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP21]], i32 [[TMP22]] 25070 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !25 25071 // CHECK12-NEXT: [[TMP24:%.*]] = load i32*, i32** [[TMP3]], align 4, !llvm.access.group !25 25072 // CHECK12-NEXT: [[TMP25:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 25073 // CHECK12-NEXT: [[ARRAYIDX5:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 25074 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4, !llvm.access.group !25 25075 // CHECK12-NEXT: [[ADD6:%.*]] = add nsw i32 [[TMP23]], [[TMP26]] 25076 // CHECK12-NEXT: [[TMP27:%.*]] = load i32*, i32** [[TMP1]], align 4, !llvm.access.group !25 25077 // CHECK12-NEXT: [[TMP28:%.*]] = load i32, i32* [[I3]], align 4, !llvm.access.group !25 25078 // CHECK12-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 25079 // CHECK12-NEXT: store i32 [[ADD6]], i32* [[ARRAYIDX7]], align 4, !llvm.access.group !25 25080 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 25081 // CHECK12: omp.body.continue: 25082 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 25083 // CHECK12: omp.inner.for.inc: 25084 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 25085 // CHECK12-NEXT: [[ADD8:%.*]] = add nsw i32 [[TMP29]], 1 25086 // CHECK12-NEXT: store i32 [[ADD8]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !25 25087 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP26:![0-9]+]] 25088 // CHECK12: omp.inner.for.end: 25089 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 25090 // CHECK12: omp.dispatch.inc: 25091 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 25092 // CHECK12: omp.dispatch.end: 25093 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 25094 // CHECK12: omp.precond.end: 25095 // CHECK12-NEXT: ret void 25096 // 25097 // 25098 // CHECK12-LABEL: define {{[^@]+}}@{{__omp_offloading_[0-9a-z]+_[0-9a-z]+}}__Z5tmainIiET_v_l91 25099 // CHECK12-SAME: (i32 [[CH:%.*]], i32 [[N:%.*]], i32* [[A:%.*]], i32* [[B:%.*]], i32* [[C:%.*]]) #[[ATTR1]] { 25100 // CHECK12-NEXT: entry: 25101 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32, align 4 25102 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32, align 4 25103 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32*, align 4 25104 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32*, align 4 25105 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32*, align 4 25106 // CHECK12-NEXT: store i32 [[CH]], i32* [[CH_ADDR]], align 4 25107 // CHECK12-NEXT: store i32 [[N]], i32* [[N_ADDR]], align 4 25108 // CHECK12-NEXT: store i32* [[A]], i32** [[A_ADDR]], align 4 25109 // CHECK12-NEXT: store i32* [[B]], i32** [[B_ADDR]], align 4 25110 // CHECK12-NEXT: store i32* [[C]], i32** [[C_ADDR]], align 4 25111 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_teams(%struct.ident_t* @[[GLOB3]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32**, i32**, i32**)* @.omp_outlined..50 to void (i32*, i32*, ...)*), i32* [[CH_ADDR]], i32* [[N_ADDR]], i32** [[A_ADDR]], i32** [[B_ADDR]], i32** [[C_ADDR]]) 25112 // CHECK12-NEXT: ret void 25113 // 25114 // 25115 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..50 25116 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32* nonnull align 4 dereferenceable(4) [[CH:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]]) #[[ATTR1]] { 25117 // CHECK12-NEXT: entry: 25118 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 25119 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 25120 // CHECK12-NEXT: [[CH_ADDR:%.*]] = alloca i32*, align 4 25121 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 25122 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 25123 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 25124 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 25125 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 25126 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 25127 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 25128 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 25129 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 25130 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 25131 // CHECK12-NEXT: [[DOTOMP_COMB_LB:%.*]] = alloca i32, align 4 25132 // CHECK12-NEXT: [[DOTOMP_COMB_UB:%.*]] = alloca i32, align 4 25133 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 25134 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 25135 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 25136 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__CASTED:%.*]] = alloca i32, align 4 25137 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 25138 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 25139 // CHECK12-NEXT: store i32* [[CH]], i32** [[CH_ADDR]], align 4 25140 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 25141 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 25142 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 25143 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 25144 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[CH_ADDR]], align 4 25145 // CHECK12-NEXT: [[TMP1:%.*]] = load i32*, i32** [[N_ADDR]], align 4 25146 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 25147 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 25148 // CHECK12-NEXT: [[TMP4:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 25149 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[TMP0]], align 4 25150 // CHECK12-NEXT: store i32 [[TMP5]], i32* [[DOTCAPTURE_EXPR_]], align 4 25151 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[TMP1]], align 4 25152 // CHECK12-NEXT: store i32 [[TMP6]], i32* [[DOTCAPTURE_EXPR_1]], align 4 25153 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 25154 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP7]], 0 25155 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 25156 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 25157 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 25158 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 25159 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 25160 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP8]] 25161 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 25162 // CHECK12: omp.precond.then: 25163 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_COMB_LB]], align 4 25164 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 25165 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_COMB_UB]], align 4 25166 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 25167 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 25168 // CHECK12-NEXT: [[TMP10:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25169 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[TMP10]], align 4 25170 // CHECK12-NEXT: call void @__kmpc_for_static_init_4(%struct.ident_t* @[[GLOB1]], i32 [[TMP11]], i32 92, i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_COMB_LB]], i32* [[DOTOMP_COMB_UB]], i32* [[DOTOMP_STRIDE]], i32 1, i32 1) 25171 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 25172 // CHECK12-NEXT: [[TMP13:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 25173 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP12]], [[TMP13]] 25174 // CHECK12-NEXT: br i1 [[CMP5]], label [[COND_TRUE:%.*]], label [[COND_FALSE:%.*]] 25175 // CHECK12: cond.true: 25176 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 25177 // CHECK12-NEXT: br label [[COND_END:%.*]] 25178 // CHECK12: cond.false: 25179 // CHECK12-NEXT: [[TMP15:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 25180 // CHECK12-NEXT: br label [[COND_END]] 25181 // CHECK12: cond.end: 25182 // CHECK12-NEXT: [[COND:%.*]] = phi i32 [ [[TMP14]], [[COND_TRUE]] ], [ [[TMP15]], [[COND_FALSE]] ] 25183 // CHECK12-NEXT: store i32 [[COND]], i32* [[DOTOMP_COMB_UB]], align 4 25184 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 25185 // CHECK12-NEXT: store i32 [[TMP16]], i32* [[DOTOMP_IV]], align 4 25186 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 25187 // CHECK12: omp.inner.for.cond: 25188 // CHECK12-NEXT: [[TMP17:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 25189 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 25190 // CHECK12-NEXT: [[CMP6:%.*]] = icmp sle i32 [[TMP17]], [[TMP18]] 25191 // CHECK12-NEXT: br i1 [[CMP6]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 25192 // CHECK12: omp.inner.for.body: 25193 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_COMB_LB]], align 4 25194 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_COMB_UB]], align 4 25195 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_]], align 4 25196 // CHECK12-NEXT: store i32 [[TMP21]], i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 25197 // CHECK12-NEXT: [[TMP22:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__CASTED]], align 4 25198 // CHECK12-NEXT: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB3]], i32 7, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32, i32, i32*, i32**, i32**, i32**, i32)* @.omp_outlined..51 to void (i32*, i32*, ...)*), i32 [[TMP19]], i32 [[TMP20]], i32* [[TMP1]], i32** [[TMP2]], i32** [[TMP3]], i32** [[TMP4]], i32 [[TMP22]]) 25199 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 25200 // CHECK12: omp.inner.for.inc: 25201 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4 25202 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[DOTOMP_STRIDE]], align 4 25203 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP23]], [[TMP24]] 25204 // CHECK12-NEXT: store i32 [[ADD]], i32* [[DOTOMP_IV]], align 4 25205 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]] 25206 // CHECK12: omp.inner.for.end: 25207 // CHECK12-NEXT: br label [[OMP_LOOP_EXIT:%.*]] 25208 // CHECK12: omp.loop.exit: 25209 // CHECK12-NEXT: [[TMP25:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25210 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[TMP25]], align 4 25211 // CHECK12-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @[[GLOB1]], i32 [[TMP26]]) 25212 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 25213 // CHECK12: omp.precond.end: 25214 // CHECK12-NEXT: ret void 25215 // 25216 // 25217 // CHECK12-LABEL: define {{[^@]+}}@.omp_outlined..51 25218 // CHECK12-SAME: (i32* noalias [[DOTGLOBAL_TID_:%.*]], i32* noalias [[DOTBOUND_TID_:%.*]], i32 [[DOTPREVIOUS_LB_:%.*]], i32 [[DOTPREVIOUS_UB_:%.*]], i32* nonnull align 4 dereferenceable(4) [[N:%.*]], i32** nonnull align 4 dereferenceable(4) [[A:%.*]], i32** nonnull align 4 dereferenceable(4) [[B:%.*]], i32** nonnull align 4 dereferenceable(4) [[C:%.*]], i32 [[DOTCAPTURE_EXPR_:%.*]]) #[[ATTR1]] { 25219 // CHECK12-NEXT: entry: 25220 // CHECK12-NEXT: [[DOTGLOBAL_TID__ADDR:%.*]] = alloca i32*, align 4 25221 // CHECK12-NEXT: [[DOTBOUND_TID__ADDR:%.*]] = alloca i32*, align 4 25222 // CHECK12-NEXT: [[DOTPREVIOUS_LB__ADDR:%.*]] = alloca i32, align 4 25223 // CHECK12-NEXT: [[DOTPREVIOUS_UB__ADDR:%.*]] = alloca i32, align 4 25224 // CHECK12-NEXT: [[N_ADDR:%.*]] = alloca i32*, align 4 25225 // CHECK12-NEXT: [[A_ADDR:%.*]] = alloca i32**, align 4 25226 // CHECK12-NEXT: [[B_ADDR:%.*]] = alloca i32**, align 4 25227 // CHECK12-NEXT: [[C_ADDR:%.*]] = alloca i32**, align 4 25228 // CHECK12-NEXT: [[DOTCAPTURE_EXPR__ADDR:%.*]] = alloca i32, align 4 25229 // CHECK12-NEXT: [[DOTOMP_IV:%.*]] = alloca i32, align 4 25230 // CHECK12-NEXT: [[TMP:%.*]] = alloca i32, align 4 25231 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_1:%.*]] = alloca i32, align 4 25232 // CHECK12-NEXT: [[DOTCAPTURE_EXPR_2:%.*]] = alloca i32, align 4 25233 // CHECK12-NEXT: [[I:%.*]] = alloca i32, align 4 25234 // CHECK12-NEXT: [[DOTOMP_LB:%.*]] = alloca i32, align 4 25235 // CHECK12-NEXT: [[DOTOMP_UB:%.*]] = alloca i32, align 4 25236 // CHECK12-NEXT: [[DOTOMP_STRIDE:%.*]] = alloca i32, align 4 25237 // CHECK12-NEXT: [[DOTOMP_IS_LAST:%.*]] = alloca i32, align 4 25238 // CHECK12-NEXT: [[I4:%.*]] = alloca i32, align 4 25239 // CHECK12-NEXT: store i32* [[DOTGLOBAL_TID_]], i32** [[DOTGLOBAL_TID__ADDR]], align 4 25240 // CHECK12-NEXT: store i32* [[DOTBOUND_TID_]], i32** [[DOTBOUND_TID__ADDR]], align 4 25241 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_LB_]], i32* [[DOTPREVIOUS_LB__ADDR]], align 4 25242 // CHECK12-NEXT: store i32 [[DOTPREVIOUS_UB_]], i32* [[DOTPREVIOUS_UB__ADDR]], align 4 25243 // CHECK12-NEXT: store i32* [[N]], i32** [[N_ADDR]], align 4 25244 // CHECK12-NEXT: store i32** [[A]], i32*** [[A_ADDR]], align 4 25245 // CHECK12-NEXT: store i32** [[B]], i32*** [[B_ADDR]], align 4 25246 // CHECK12-NEXT: store i32** [[C]], i32*** [[C_ADDR]], align 4 25247 // CHECK12-NEXT: store i32 [[DOTCAPTURE_EXPR_]], i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 25248 // CHECK12-NEXT: [[TMP0:%.*]] = load i32*, i32** [[N_ADDR]], align 4 25249 // CHECK12-NEXT: [[TMP1:%.*]] = load i32**, i32*** [[A_ADDR]], align 4 25250 // CHECK12-NEXT: [[TMP2:%.*]] = load i32**, i32*** [[B_ADDR]], align 4 25251 // CHECK12-NEXT: [[TMP3:%.*]] = load i32**, i32*** [[C_ADDR]], align 4 25252 // CHECK12-NEXT: [[TMP4:%.*]] = load i32, i32* [[TMP0]], align 4 25253 // CHECK12-NEXT: store i32 [[TMP4]], i32* [[DOTCAPTURE_EXPR_1]], align 4 25254 // CHECK12-NEXT: [[TMP5:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 25255 // CHECK12-NEXT: [[SUB:%.*]] = sub nsw i32 [[TMP5]], 0 25256 // CHECK12-NEXT: [[DIV:%.*]] = sdiv i32 [[SUB]], 1 25257 // CHECK12-NEXT: [[SUB3:%.*]] = sub nsw i32 [[DIV]], 1 25258 // CHECK12-NEXT: store i32 [[SUB3]], i32* [[DOTCAPTURE_EXPR_2]], align 4 25259 // CHECK12-NEXT: store i32 0, i32* [[I]], align 4 25260 // CHECK12-NEXT: [[TMP6:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_1]], align 4 25261 // CHECK12-NEXT: [[CMP:%.*]] = icmp slt i32 0, [[TMP6]] 25262 // CHECK12-NEXT: br i1 [[CMP]], label [[OMP_PRECOND_THEN:%.*]], label [[OMP_PRECOND_END:%.*]] 25263 // CHECK12: omp.precond.then: 25264 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_LB]], align 4 25265 // CHECK12-NEXT: [[TMP7:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR_2]], align 4 25266 // CHECK12-NEXT: store i32 [[TMP7]], i32* [[DOTOMP_UB]], align 4 25267 // CHECK12-NEXT: [[TMP8:%.*]] = load i32, i32* [[DOTPREVIOUS_LB__ADDR]], align 4 25268 // CHECK12-NEXT: [[TMP9:%.*]] = load i32, i32* [[DOTPREVIOUS_UB__ADDR]], align 4 25269 // CHECK12-NEXT: store i32 [[TMP8]], i32* [[DOTOMP_LB]], align 4 25270 // CHECK12-NEXT: store i32 [[TMP9]], i32* [[DOTOMP_UB]], align 4 25271 // CHECK12-NEXT: store i32 1, i32* [[DOTOMP_STRIDE]], align 4 25272 // CHECK12-NEXT: store i32 0, i32* [[DOTOMP_IS_LAST]], align 4 25273 // CHECK12-NEXT: [[TMP10:%.*]] = load i32, i32* [[DOTCAPTURE_EXPR__ADDR]], align 4 25274 // CHECK12-NEXT: [[TMP11:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 25275 // CHECK12-NEXT: [[TMP12:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4 25276 // CHECK12-NEXT: [[TMP13:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25277 // CHECK12-NEXT: [[TMP14:%.*]] = load i32, i32* [[TMP13]], align 4 25278 // CHECK12-NEXT: call void @__kmpc_dispatch_init_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP14]], i32 35, i32 [[TMP11]], i32 [[TMP12]], i32 1, i32 [[TMP10]]) 25279 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND:%.*]] 25280 // CHECK12: omp.dispatch.cond: 25281 // CHECK12-NEXT: [[TMP15:%.*]] = load i32*, i32** [[DOTGLOBAL_TID__ADDR]], align 4 25282 // CHECK12-NEXT: [[TMP16:%.*]] = load i32, i32* [[TMP15]], align 4 25283 // CHECK12-NEXT: [[TMP17:%.*]] = call i32 @__kmpc_dispatch_next_4(%struct.ident_t* @[[GLOB3]], i32 [[TMP16]], i32* [[DOTOMP_IS_LAST]], i32* [[DOTOMP_LB]], i32* [[DOTOMP_UB]], i32* [[DOTOMP_STRIDE]]) 25284 // CHECK12-NEXT: [[TOBOOL:%.*]] = icmp ne i32 [[TMP17]], 0 25285 // CHECK12-NEXT: br i1 [[TOBOOL]], label [[OMP_DISPATCH_BODY:%.*]], label [[OMP_DISPATCH_END:%.*]] 25286 // CHECK12: omp.dispatch.body: 25287 // CHECK12-NEXT: [[TMP18:%.*]] = load i32, i32* [[DOTOMP_LB]], align 4 25288 // CHECK12-NEXT: store i32 [[TMP18]], i32* [[DOTOMP_IV]], align 4 25289 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND:%.*]] 25290 // CHECK12: omp.inner.for.cond: 25291 // CHECK12-NEXT: [[TMP19:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 25292 // CHECK12-NEXT: [[TMP20:%.*]] = load i32, i32* [[DOTOMP_UB]], align 4, !llvm.access.group !28 25293 // CHECK12-NEXT: [[CMP5:%.*]] = icmp sle i32 [[TMP19]], [[TMP20]] 25294 // CHECK12-NEXT: br i1 [[CMP5]], label [[OMP_INNER_FOR_BODY:%.*]], label [[OMP_INNER_FOR_END:%.*]] 25295 // CHECK12: omp.inner.for.body: 25296 // CHECK12-NEXT: [[TMP21:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 25297 // CHECK12-NEXT: [[MUL:%.*]] = mul nsw i32 [[TMP21]], 1 25298 // CHECK12-NEXT: [[ADD:%.*]] = add nsw i32 0, [[MUL]] 25299 // CHECK12-NEXT: store i32 [[ADD]], i32* [[I4]], align 4, !llvm.access.group !28 25300 // CHECK12-NEXT: [[TMP22:%.*]] = load i32*, i32** [[TMP2]], align 4, !llvm.access.group !28 25301 // CHECK12-NEXT: [[TMP23:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 25302 // CHECK12-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP22]], i32 [[TMP23]] 25303 // CHECK12-NEXT: [[TMP24:%.*]] = load i32, i32* [[ARRAYIDX]], align 4, !llvm.access.group !28 25304 // CHECK12-NEXT: [[TMP25:%.*]] = load i32*, i32** [[TMP3]], align 4, !llvm.access.group !28 25305 // CHECK12-NEXT: [[TMP26:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 25306 // CHECK12-NEXT: [[ARRAYIDX6:%.*]] = getelementptr inbounds i32, i32* [[TMP25]], i32 [[TMP26]] 25307 // CHECK12-NEXT: [[TMP27:%.*]] = load i32, i32* [[ARRAYIDX6]], align 4, !llvm.access.group !28 25308 // CHECK12-NEXT: [[ADD7:%.*]] = add nsw i32 [[TMP24]], [[TMP27]] 25309 // CHECK12-NEXT: [[TMP28:%.*]] = load i32*, i32** [[TMP1]], align 4, !llvm.access.group !28 25310 // CHECK12-NEXT: [[TMP29:%.*]] = load i32, i32* [[I4]], align 4, !llvm.access.group !28 25311 // CHECK12-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP28]], i32 [[TMP29]] 25312 // CHECK12-NEXT: store i32 [[ADD7]], i32* [[ARRAYIDX8]], align 4, !llvm.access.group !28 25313 // CHECK12-NEXT: br label [[OMP_BODY_CONTINUE:%.*]] 25314 // CHECK12: omp.body.continue: 25315 // CHECK12-NEXT: br label [[OMP_INNER_FOR_INC:%.*]] 25316 // CHECK12: omp.inner.for.inc: 25317 // CHECK12-NEXT: [[TMP30:%.*]] = load i32, i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 25318 // CHECK12-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP30]], 1 25319 // CHECK12-NEXT: store i32 [[ADD9]], i32* [[DOTOMP_IV]], align 4, !llvm.access.group !28 25320 // CHECK12-NEXT: br label [[OMP_INNER_FOR_COND]], !llvm.loop [[LOOP29:![0-9]+]] 25321 // CHECK12: omp.inner.for.end: 25322 // CHECK12-NEXT: br label [[OMP_DISPATCH_INC:%.*]] 25323 // CHECK12: omp.dispatch.inc: 25324 // CHECK12-NEXT: br label [[OMP_DISPATCH_COND]] 25325 // CHECK12: omp.dispatch.end: 25326 // CHECK12-NEXT: br label [[OMP_PRECOND_END]] 25327 // CHECK12: omp.precond.end: 25328 // CHECK12-NEXT: ret void 25329 // 25330 // 25331 // CHECK12-LABEL: define {{[^@]+}}@.omp_offloading.requires_reg 25332 // CHECK12-SAME: () #[[ATTR4:[0-9]+]] { 25333 // CHECK12-NEXT: entry: 25334 // CHECK12-NEXT: call void @__tgt_register_requires(i64 1) 25335 // CHECK12-NEXT: ret void 25336 // 25337 // 25338 // CHECK13-LABEL: define {{[^@]+}}@main 25339 // CHECK13-SAME: () #[[ATTR0:[0-9]+]] { 25340 // CHECK13-NEXT: entry: 25341 // CHECK13-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 25342 // CHECK13-NEXT: [[A:%.*]] = alloca double*, align 8 25343 // CHECK13-NEXT: [[B:%.*]] = alloca double*, align 8 25344 // CHECK13-NEXT: [[C:%.*]] = alloca double*, align 8 25345 // CHECK13-NEXT: [[N:%.*]] = alloca i32, align 4 25346 // CHECK13-NEXT: [[CH:%.*]] = alloca i32, align 4 25347 // CHECK13-NEXT: [[I:%.*]] = alloca i32, align 4 25348 // CHECK13-NEXT: [[I5:%.*]] = alloca i32, align 4 25349 // CHECK13-NEXT: [[I19:%.*]] = alloca i32, align 4 25350 // CHECK13-NEXT: [[I33:%.*]] = alloca i32, align 4 25351 // CHECK13-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 25352 // CHECK13-NEXT: [[I47:%.*]] = alloca i32, align 4 25353 // CHECK13-NEXT: [[I61:%.*]] = alloca i32, align 4 25354 // CHECK13-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 25355 // CHECK13-NEXT: [[I76:%.*]] = alloca i32, align 4 25356 // CHECK13-NEXT: store i32 0, i32* [[RETVAL]], align 4 25357 // CHECK13-NEXT: store i32 10000, i32* [[N]], align 4 25358 // CHECK13-NEXT: store i32 100, i32* [[CH]], align 4 25359 // CHECK13-NEXT: store i32 0, i32* [[I]], align 4 25360 // CHECK13-NEXT: br label [[FOR_COND:%.*]] 25361 // CHECK13: for.cond: 25362 // CHECK13-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 25363 // CHECK13-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 25364 // CHECK13-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 25365 // CHECK13-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 25366 // CHECK13: for.body: 25367 // CHECK13-NEXT: [[TMP2:%.*]] = load double*, double** [[B]], align 8 25368 // CHECK13-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 25369 // CHECK13-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP3]] to i64 25370 // CHECK13-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP2]], i64 [[IDXPROM]] 25371 // CHECK13-NEXT: [[TMP4:%.*]] = load double, double* [[ARRAYIDX]], align 8 25372 // CHECK13-NEXT: [[TMP5:%.*]] = load double*, double** [[C]], align 8 25373 // CHECK13-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 25374 // CHECK13-NEXT: [[IDXPROM1:%.*]] = sext i32 [[TMP6]] to i64 25375 // CHECK13-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds double, double* [[TMP5]], i64 [[IDXPROM1]] 25376 // CHECK13-NEXT: [[TMP7:%.*]] = load double, double* [[ARRAYIDX2]], align 8 25377 // CHECK13-NEXT: [[ADD:%.*]] = fadd double [[TMP4]], [[TMP7]] 25378 // CHECK13-NEXT: [[TMP8:%.*]] = load double*, double** [[A]], align 8 25379 // CHECK13-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 25380 // CHECK13-NEXT: [[IDXPROM3:%.*]] = sext i32 [[TMP9]] to i64 25381 // CHECK13-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds double, double* [[TMP8]], i64 [[IDXPROM3]] 25382 // CHECK13-NEXT: store double [[ADD]], double* [[ARRAYIDX4]], align 8 25383 // CHECK13-NEXT: br label [[FOR_INC:%.*]] 25384 // CHECK13: for.inc: 25385 // CHECK13-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 25386 // CHECK13-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 25387 // CHECK13-NEXT: store i32 [[INC]], i32* [[I]], align 4 25388 // CHECK13-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP2:![0-9]+]] 25389 // CHECK13: for.end: 25390 // CHECK13-NEXT: store i32 0, i32* [[I5]], align 4 25391 // CHECK13-NEXT: br label [[FOR_COND6:%.*]] 25392 // CHECK13: for.cond6: 25393 // CHECK13-NEXT: [[TMP11:%.*]] = load i32, i32* [[I5]], align 4 25394 // CHECK13-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 25395 // CHECK13-NEXT: [[CMP7:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 25396 // CHECK13-NEXT: br i1 [[CMP7]], label [[FOR_BODY8:%.*]], label [[FOR_END18:%.*]] 25397 // CHECK13: for.body8: 25398 // CHECK13-NEXT: [[TMP13:%.*]] = load double*, double** [[B]], align 8 25399 // CHECK13-NEXT: [[TMP14:%.*]] = load i32, i32* [[I5]], align 4 25400 // CHECK13-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP14]] to i64 25401 // CHECK13-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP13]], i64 [[IDXPROM9]] 25402 // CHECK13-NEXT: [[TMP15:%.*]] = load double, double* [[ARRAYIDX10]], align 8 25403 // CHECK13-NEXT: [[TMP16:%.*]] = load double*, double** [[C]], align 8 25404 // CHECK13-NEXT: [[TMP17:%.*]] = load i32, i32* [[I5]], align 4 25405 // CHECK13-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP17]] to i64 25406 // CHECK13-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP16]], i64 [[IDXPROM11]] 25407 // CHECK13-NEXT: [[TMP18:%.*]] = load double, double* [[ARRAYIDX12]], align 8 25408 // CHECK13-NEXT: [[ADD13:%.*]] = fadd double [[TMP15]], [[TMP18]] 25409 // CHECK13-NEXT: [[TMP19:%.*]] = load double*, double** [[A]], align 8 25410 // CHECK13-NEXT: [[TMP20:%.*]] = load i32, i32* [[I5]], align 4 25411 // CHECK13-NEXT: [[IDXPROM14:%.*]] = sext i32 [[TMP20]] to i64 25412 // CHECK13-NEXT: [[ARRAYIDX15:%.*]] = getelementptr inbounds double, double* [[TMP19]], i64 [[IDXPROM14]] 25413 // CHECK13-NEXT: store double [[ADD13]], double* [[ARRAYIDX15]], align 8 25414 // CHECK13-NEXT: br label [[FOR_INC16:%.*]] 25415 // CHECK13: for.inc16: 25416 // CHECK13-NEXT: [[TMP21:%.*]] = load i32, i32* [[I5]], align 4 25417 // CHECK13-NEXT: [[INC17:%.*]] = add nsw i32 [[TMP21]], 1 25418 // CHECK13-NEXT: store i32 [[INC17]], i32* [[I5]], align 4 25419 // CHECK13-NEXT: br label [[FOR_COND6]], !llvm.loop [[LOOP4:![0-9]+]] 25420 // CHECK13: for.end18: 25421 // CHECK13-NEXT: store i32 0, i32* [[I19]], align 4 25422 // CHECK13-NEXT: br label [[FOR_COND20:%.*]] 25423 // CHECK13: for.cond20: 25424 // CHECK13-NEXT: [[TMP22:%.*]] = load i32, i32* [[I19]], align 4 25425 // CHECK13-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 25426 // CHECK13-NEXT: [[CMP21:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 25427 // CHECK13-NEXT: br i1 [[CMP21]], label [[FOR_BODY22:%.*]], label [[FOR_END32:%.*]] 25428 // CHECK13: for.body22: 25429 // CHECK13-NEXT: [[TMP24:%.*]] = load double*, double** [[B]], align 8 25430 // CHECK13-NEXT: [[TMP25:%.*]] = load i32, i32* [[I19]], align 4 25431 // CHECK13-NEXT: [[IDXPROM23:%.*]] = sext i32 [[TMP25]] to i64 25432 // CHECK13-NEXT: [[ARRAYIDX24:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM23]] 25433 // CHECK13-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX24]], align 8 25434 // CHECK13-NEXT: [[TMP27:%.*]] = load double*, double** [[C]], align 8 25435 // CHECK13-NEXT: [[TMP28:%.*]] = load i32, i32* [[I19]], align 4 25436 // CHECK13-NEXT: [[IDXPROM25:%.*]] = sext i32 [[TMP28]] to i64 25437 // CHECK13-NEXT: [[ARRAYIDX26:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM25]] 25438 // CHECK13-NEXT: [[TMP29:%.*]] = load double, double* [[ARRAYIDX26]], align 8 25439 // CHECK13-NEXT: [[ADD27:%.*]] = fadd double [[TMP26]], [[TMP29]] 25440 // CHECK13-NEXT: [[TMP30:%.*]] = load double*, double** [[A]], align 8 25441 // CHECK13-NEXT: [[TMP31:%.*]] = load i32, i32* [[I19]], align 4 25442 // CHECK13-NEXT: [[IDXPROM28:%.*]] = sext i32 [[TMP31]] to i64 25443 // CHECK13-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds double, double* [[TMP30]], i64 [[IDXPROM28]] 25444 // CHECK13-NEXT: store double [[ADD27]], double* [[ARRAYIDX29]], align 8 25445 // CHECK13-NEXT: br label [[FOR_INC30:%.*]] 25446 // CHECK13: for.inc30: 25447 // CHECK13-NEXT: [[TMP32:%.*]] = load i32, i32* [[I19]], align 4 25448 // CHECK13-NEXT: [[INC31:%.*]] = add nsw i32 [[TMP32]], 1 25449 // CHECK13-NEXT: store i32 [[INC31]], i32* [[I19]], align 4 25450 // CHECK13-NEXT: br label [[FOR_COND20]], !llvm.loop [[LOOP5:![0-9]+]] 25451 // CHECK13: for.end32: 25452 // CHECK13-NEXT: store i32 0, i32* [[I33]], align 4 25453 // CHECK13-NEXT: br label [[FOR_COND34:%.*]] 25454 // CHECK13: for.cond34: 25455 // CHECK13-NEXT: [[TMP33:%.*]] = load i32, i32* [[I33]], align 4 25456 // CHECK13-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 25457 // CHECK13-NEXT: [[CMP35:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 25458 // CHECK13-NEXT: br i1 [[CMP35]], label [[FOR_BODY36:%.*]], label [[FOR_END46:%.*]] 25459 // CHECK13: for.body36: 25460 // CHECK13-NEXT: [[TMP35:%.*]] = load double*, double** [[B]], align 8 25461 // CHECK13-NEXT: [[TMP36:%.*]] = load i32, i32* [[I33]], align 4 25462 // CHECK13-NEXT: [[IDXPROM37:%.*]] = sext i32 [[TMP36]] to i64 25463 // CHECK13-NEXT: [[ARRAYIDX38:%.*]] = getelementptr inbounds double, double* [[TMP35]], i64 [[IDXPROM37]] 25464 // CHECK13-NEXT: [[TMP37:%.*]] = load double, double* [[ARRAYIDX38]], align 8 25465 // CHECK13-NEXT: [[TMP38:%.*]] = load double*, double** [[C]], align 8 25466 // CHECK13-NEXT: [[TMP39:%.*]] = load i32, i32* [[I33]], align 4 25467 // CHECK13-NEXT: [[IDXPROM39:%.*]] = sext i32 [[TMP39]] to i64 25468 // CHECK13-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds double, double* [[TMP38]], i64 [[IDXPROM39]] 25469 // CHECK13-NEXT: [[TMP40:%.*]] = load double, double* [[ARRAYIDX40]], align 8 25470 // CHECK13-NEXT: [[ADD41:%.*]] = fadd double [[TMP37]], [[TMP40]] 25471 // CHECK13-NEXT: [[TMP41:%.*]] = load double*, double** [[A]], align 8 25472 // CHECK13-NEXT: [[TMP42:%.*]] = load i32, i32* [[I33]], align 4 25473 // CHECK13-NEXT: [[IDXPROM42:%.*]] = sext i32 [[TMP42]] to i64 25474 // CHECK13-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds double, double* [[TMP41]], i64 [[IDXPROM42]] 25475 // CHECK13-NEXT: store double [[ADD41]], double* [[ARRAYIDX43]], align 8 25476 // CHECK13-NEXT: br label [[FOR_INC44:%.*]] 25477 // CHECK13: for.inc44: 25478 // CHECK13-NEXT: [[TMP43:%.*]] = load i32, i32* [[I33]], align 4 25479 // CHECK13-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP43]], 1 25480 // CHECK13-NEXT: store i32 [[INC45]], i32* [[I33]], align 4 25481 // CHECK13-NEXT: br label [[FOR_COND34]], !llvm.loop [[LOOP6:![0-9]+]] 25482 // CHECK13: for.end46: 25483 // CHECK13-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 25484 // CHECK13-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 25485 // CHECK13-NEXT: store i32 0, i32* [[I47]], align 4 25486 // CHECK13-NEXT: br label [[FOR_COND48:%.*]] 25487 // CHECK13: for.cond48: 25488 // CHECK13-NEXT: [[TMP45:%.*]] = load i32, i32* [[I47]], align 4 25489 // CHECK13-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 25490 // CHECK13-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 25491 // CHECK13-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END60:%.*]] 25492 // CHECK13: for.body50: 25493 // CHECK13-NEXT: [[TMP47:%.*]] = load double*, double** [[B]], align 8 25494 // CHECK13-NEXT: [[TMP48:%.*]] = load i32, i32* [[I47]], align 4 25495 // CHECK13-NEXT: [[IDXPROM51:%.*]] = sext i32 [[TMP48]] to i64 25496 // CHECK13-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds double, double* [[TMP47]], i64 [[IDXPROM51]] 25497 // CHECK13-NEXT: [[TMP49:%.*]] = load double, double* [[ARRAYIDX52]], align 8 25498 // CHECK13-NEXT: [[TMP50:%.*]] = load double*, double** [[C]], align 8 25499 // CHECK13-NEXT: [[TMP51:%.*]] = load i32, i32* [[I47]], align 4 25500 // CHECK13-NEXT: [[IDXPROM53:%.*]] = sext i32 [[TMP51]] to i64 25501 // CHECK13-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds double, double* [[TMP50]], i64 [[IDXPROM53]] 25502 // CHECK13-NEXT: [[TMP52:%.*]] = load double, double* [[ARRAYIDX54]], align 8 25503 // CHECK13-NEXT: [[ADD55:%.*]] = fadd double [[TMP49]], [[TMP52]] 25504 // CHECK13-NEXT: [[TMP53:%.*]] = load double*, double** [[A]], align 8 25505 // CHECK13-NEXT: [[TMP54:%.*]] = load i32, i32* [[I47]], align 4 25506 // CHECK13-NEXT: [[IDXPROM56:%.*]] = sext i32 [[TMP54]] to i64 25507 // CHECK13-NEXT: [[ARRAYIDX57:%.*]] = getelementptr inbounds double, double* [[TMP53]], i64 [[IDXPROM56]] 25508 // CHECK13-NEXT: store double [[ADD55]], double* [[ARRAYIDX57]], align 8 25509 // CHECK13-NEXT: br label [[FOR_INC58:%.*]] 25510 // CHECK13: for.inc58: 25511 // CHECK13-NEXT: [[TMP55:%.*]] = load i32, i32* [[I47]], align 4 25512 // CHECK13-NEXT: [[INC59:%.*]] = add nsw i32 [[TMP55]], 1 25513 // CHECK13-NEXT: store i32 [[INC59]], i32* [[I47]], align 4 25514 // CHECK13-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP7:![0-9]+]] 25515 // CHECK13: for.end60: 25516 // CHECK13-NEXT: store i32 0, i32* [[I61]], align 4 25517 // CHECK13-NEXT: br label [[FOR_COND62:%.*]] 25518 // CHECK13: for.cond62: 25519 // CHECK13-NEXT: [[TMP56:%.*]] = load i32, i32* [[I61]], align 4 25520 // CHECK13-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 25521 // CHECK13-NEXT: [[CMP63:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 25522 // CHECK13-NEXT: br i1 [[CMP63]], label [[FOR_BODY64:%.*]], label [[FOR_END74:%.*]] 25523 // CHECK13: for.body64: 25524 // CHECK13-NEXT: [[TMP58:%.*]] = load double*, double** [[B]], align 8 25525 // CHECK13-NEXT: [[TMP59:%.*]] = load i32, i32* [[I61]], align 4 25526 // CHECK13-NEXT: [[IDXPROM65:%.*]] = sext i32 [[TMP59]] to i64 25527 // CHECK13-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds double, double* [[TMP58]], i64 [[IDXPROM65]] 25528 // CHECK13-NEXT: [[TMP60:%.*]] = load double, double* [[ARRAYIDX66]], align 8 25529 // CHECK13-NEXT: [[TMP61:%.*]] = load double*, double** [[C]], align 8 25530 // CHECK13-NEXT: [[TMP62:%.*]] = load i32, i32* [[I61]], align 4 25531 // CHECK13-NEXT: [[IDXPROM67:%.*]] = sext i32 [[TMP62]] to i64 25532 // CHECK13-NEXT: [[ARRAYIDX68:%.*]] = getelementptr inbounds double, double* [[TMP61]], i64 [[IDXPROM67]] 25533 // CHECK13-NEXT: [[TMP63:%.*]] = load double, double* [[ARRAYIDX68]], align 8 25534 // CHECK13-NEXT: [[ADD69:%.*]] = fadd double [[TMP60]], [[TMP63]] 25535 // CHECK13-NEXT: [[TMP64:%.*]] = load double*, double** [[A]], align 8 25536 // CHECK13-NEXT: [[TMP65:%.*]] = load i32, i32* [[I61]], align 4 25537 // CHECK13-NEXT: [[IDXPROM70:%.*]] = sext i32 [[TMP65]] to i64 25538 // CHECK13-NEXT: [[ARRAYIDX71:%.*]] = getelementptr inbounds double, double* [[TMP64]], i64 [[IDXPROM70]] 25539 // CHECK13-NEXT: store double [[ADD69]], double* [[ARRAYIDX71]], align 8 25540 // CHECK13-NEXT: br label [[FOR_INC72:%.*]] 25541 // CHECK13: for.inc72: 25542 // CHECK13-NEXT: [[TMP66:%.*]] = load i32, i32* [[I61]], align 4 25543 // CHECK13-NEXT: [[INC73:%.*]] = add nsw i32 [[TMP66]], 1 25544 // CHECK13-NEXT: store i32 [[INC73]], i32* [[I61]], align 4 25545 // CHECK13-NEXT: br label [[FOR_COND62]], !llvm.loop [[LOOP8:![0-9]+]] 25546 // CHECK13: for.end74: 25547 // CHECK13-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 25548 // CHECK13-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_75]], align 4 25549 // CHECK13-NEXT: store i32 0, i32* [[I76]], align 4 25550 // CHECK13-NEXT: br label [[FOR_COND77:%.*]] 25551 // CHECK13: for.cond77: 25552 // CHECK13-NEXT: [[TMP68:%.*]] = load i32, i32* [[I76]], align 4 25553 // CHECK13-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 25554 // CHECK13-NEXT: [[CMP78:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 25555 // CHECK13-NEXT: br i1 [[CMP78]], label [[FOR_BODY79:%.*]], label [[FOR_END89:%.*]] 25556 // CHECK13: for.body79: 25557 // CHECK13-NEXT: [[TMP70:%.*]] = load double*, double** [[B]], align 8 25558 // CHECK13-NEXT: [[TMP71:%.*]] = load i32, i32* [[I76]], align 4 25559 // CHECK13-NEXT: [[IDXPROM80:%.*]] = sext i32 [[TMP71]] to i64 25560 // CHECK13-NEXT: [[ARRAYIDX81:%.*]] = getelementptr inbounds double, double* [[TMP70]], i64 [[IDXPROM80]] 25561 // CHECK13-NEXT: [[TMP72:%.*]] = load double, double* [[ARRAYIDX81]], align 8 25562 // CHECK13-NEXT: [[TMP73:%.*]] = load double*, double** [[C]], align 8 25563 // CHECK13-NEXT: [[TMP74:%.*]] = load i32, i32* [[I76]], align 4 25564 // CHECK13-NEXT: [[IDXPROM82:%.*]] = sext i32 [[TMP74]] to i64 25565 // CHECK13-NEXT: [[ARRAYIDX83:%.*]] = getelementptr inbounds double, double* [[TMP73]], i64 [[IDXPROM82]] 25566 // CHECK13-NEXT: [[TMP75:%.*]] = load double, double* [[ARRAYIDX83]], align 8 25567 // CHECK13-NEXT: [[ADD84:%.*]] = fadd double [[TMP72]], [[TMP75]] 25568 // CHECK13-NEXT: [[TMP76:%.*]] = load double*, double** [[A]], align 8 25569 // CHECK13-NEXT: [[TMP77:%.*]] = load i32, i32* [[I76]], align 4 25570 // CHECK13-NEXT: [[IDXPROM85:%.*]] = sext i32 [[TMP77]] to i64 25571 // CHECK13-NEXT: [[ARRAYIDX86:%.*]] = getelementptr inbounds double, double* [[TMP76]], i64 [[IDXPROM85]] 25572 // CHECK13-NEXT: store double [[ADD84]], double* [[ARRAYIDX86]], align 8 25573 // CHECK13-NEXT: br label [[FOR_INC87:%.*]] 25574 // CHECK13: for.inc87: 25575 // CHECK13-NEXT: [[TMP78:%.*]] = load i32, i32* [[I76]], align 4 25576 // CHECK13-NEXT: [[INC88:%.*]] = add nsw i32 [[TMP78]], 1 25577 // CHECK13-NEXT: store i32 [[INC88]], i32* [[I76]], align 4 25578 // CHECK13-NEXT: br label [[FOR_COND77]], !llvm.loop [[LOOP9:![0-9]+]] 25579 // CHECK13: for.end89: 25580 // CHECK13-NEXT: [[CALL:%.*]] = call signext i32 @_Z5tmainIiET_v() 25581 // CHECK13-NEXT: ret i32 [[CALL]] 25582 // 25583 // 25584 // CHECK13-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 25585 // CHECK13-SAME: () #[[ATTR1:[0-9]+]] comdat { 25586 // CHECK13-NEXT: entry: 25587 // CHECK13-NEXT: [[A:%.*]] = alloca i32*, align 8 25588 // CHECK13-NEXT: [[B:%.*]] = alloca i32*, align 8 25589 // CHECK13-NEXT: [[C:%.*]] = alloca i32*, align 8 25590 // CHECK13-NEXT: [[N:%.*]] = alloca i32, align 4 25591 // CHECK13-NEXT: [[CH:%.*]] = alloca i32, align 4 25592 // CHECK13-NEXT: [[I:%.*]] = alloca i32, align 4 25593 // CHECK13-NEXT: [[I5:%.*]] = alloca i32, align 4 25594 // CHECK13-NEXT: [[I19:%.*]] = alloca i32, align 4 25595 // CHECK13-NEXT: [[I33:%.*]] = alloca i32, align 4 25596 // CHECK13-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 25597 // CHECK13-NEXT: [[I47:%.*]] = alloca i32, align 4 25598 // CHECK13-NEXT: [[I61:%.*]] = alloca i32, align 4 25599 // CHECK13-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 25600 // CHECK13-NEXT: [[I76:%.*]] = alloca i32, align 4 25601 // CHECK13-NEXT: store i32 10000, i32* [[N]], align 4 25602 // CHECK13-NEXT: store i32 100, i32* [[CH]], align 4 25603 // CHECK13-NEXT: store i32 0, i32* [[I]], align 4 25604 // CHECK13-NEXT: br label [[FOR_COND:%.*]] 25605 // CHECK13: for.cond: 25606 // CHECK13-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 25607 // CHECK13-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 25608 // CHECK13-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 25609 // CHECK13-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 25610 // CHECK13: for.body: 25611 // CHECK13-NEXT: [[TMP2:%.*]] = load i32*, i32** [[B]], align 8 25612 // CHECK13-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 25613 // CHECK13-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP3]] to i64 25614 // CHECK13-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP2]], i64 [[IDXPROM]] 25615 // CHECK13-NEXT: [[TMP4:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 25616 // CHECK13-NEXT: [[TMP5:%.*]] = load i32*, i32** [[C]], align 8 25617 // CHECK13-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 25618 // CHECK13-NEXT: [[IDXPROM1:%.*]] = sext i32 [[TMP6]] to i64 25619 // CHECK13-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, i32* [[TMP5]], i64 [[IDXPROM1]] 25620 // CHECK13-NEXT: [[TMP7:%.*]] = load i32, i32* [[ARRAYIDX2]], align 4 25621 // CHECK13-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP4]], [[TMP7]] 25622 // CHECK13-NEXT: [[TMP8:%.*]] = load i32*, i32** [[A]], align 8 25623 // CHECK13-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 25624 // CHECK13-NEXT: [[IDXPROM3:%.*]] = sext i32 [[TMP9]] to i64 25625 // CHECK13-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds i32, i32* [[TMP8]], i64 [[IDXPROM3]] 25626 // CHECK13-NEXT: store i32 [[ADD]], i32* [[ARRAYIDX4]], align 4 25627 // CHECK13-NEXT: br label [[FOR_INC:%.*]] 25628 // CHECK13: for.inc: 25629 // CHECK13-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 25630 // CHECK13-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 25631 // CHECK13-NEXT: store i32 [[INC]], i32* [[I]], align 4 25632 // CHECK13-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP10:![0-9]+]] 25633 // CHECK13: for.end: 25634 // CHECK13-NEXT: store i32 0, i32* [[I5]], align 4 25635 // CHECK13-NEXT: br label [[FOR_COND6:%.*]] 25636 // CHECK13: for.cond6: 25637 // CHECK13-NEXT: [[TMP11:%.*]] = load i32, i32* [[I5]], align 4 25638 // CHECK13-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 25639 // CHECK13-NEXT: [[CMP7:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 25640 // CHECK13-NEXT: br i1 [[CMP7]], label [[FOR_BODY8:%.*]], label [[FOR_END18:%.*]] 25641 // CHECK13: for.body8: 25642 // CHECK13-NEXT: [[TMP13:%.*]] = load i32*, i32** [[B]], align 8 25643 // CHECK13-NEXT: [[TMP14:%.*]] = load i32, i32* [[I5]], align 4 25644 // CHECK13-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP14]] to i64 25645 // CHECK13-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP13]], i64 [[IDXPROM9]] 25646 // CHECK13-NEXT: [[TMP15:%.*]] = load i32, i32* [[ARRAYIDX10]], align 4 25647 // CHECK13-NEXT: [[TMP16:%.*]] = load i32*, i32** [[C]], align 8 25648 // CHECK13-NEXT: [[TMP17:%.*]] = load i32, i32* [[I5]], align 4 25649 // CHECK13-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP17]] to i64 25650 // CHECK13-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds i32, i32* [[TMP16]], i64 [[IDXPROM11]] 25651 // CHECK13-NEXT: [[TMP18:%.*]] = load i32, i32* [[ARRAYIDX12]], align 4 25652 // CHECK13-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP15]], [[TMP18]] 25653 // CHECK13-NEXT: [[TMP19:%.*]] = load i32*, i32** [[A]], align 8 25654 // CHECK13-NEXT: [[TMP20:%.*]] = load i32, i32* [[I5]], align 4 25655 // CHECK13-NEXT: [[IDXPROM14:%.*]] = sext i32 [[TMP20]] to i64 25656 // CHECK13-NEXT: [[ARRAYIDX15:%.*]] = getelementptr inbounds i32, i32* [[TMP19]], i64 [[IDXPROM14]] 25657 // CHECK13-NEXT: store i32 [[ADD13]], i32* [[ARRAYIDX15]], align 4 25658 // CHECK13-NEXT: br label [[FOR_INC16:%.*]] 25659 // CHECK13: for.inc16: 25660 // CHECK13-NEXT: [[TMP21:%.*]] = load i32, i32* [[I5]], align 4 25661 // CHECK13-NEXT: [[INC17:%.*]] = add nsw i32 [[TMP21]], 1 25662 // CHECK13-NEXT: store i32 [[INC17]], i32* [[I5]], align 4 25663 // CHECK13-NEXT: br label [[FOR_COND6]], !llvm.loop [[LOOP11:![0-9]+]] 25664 // CHECK13: for.end18: 25665 // CHECK13-NEXT: store i32 0, i32* [[I19]], align 4 25666 // CHECK13-NEXT: br label [[FOR_COND20:%.*]] 25667 // CHECK13: for.cond20: 25668 // CHECK13-NEXT: [[TMP22:%.*]] = load i32, i32* [[I19]], align 4 25669 // CHECK13-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 25670 // CHECK13-NEXT: [[CMP21:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 25671 // CHECK13-NEXT: br i1 [[CMP21]], label [[FOR_BODY22:%.*]], label [[FOR_END32:%.*]] 25672 // CHECK13: for.body22: 25673 // CHECK13-NEXT: [[TMP24:%.*]] = load i32*, i32** [[B]], align 8 25674 // CHECK13-NEXT: [[TMP25:%.*]] = load i32, i32* [[I19]], align 4 25675 // CHECK13-NEXT: [[IDXPROM23:%.*]] = sext i32 [[TMP25]] to i64 25676 // CHECK13-NEXT: [[ARRAYIDX24:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM23]] 25677 // CHECK13-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX24]], align 4 25678 // CHECK13-NEXT: [[TMP27:%.*]] = load i32*, i32** [[C]], align 8 25679 // CHECK13-NEXT: [[TMP28:%.*]] = load i32, i32* [[I19]], align 4 25680 // CHECK13-NEXT: [[IDXPROM25:%.*]] = sext i32 [[TMP28]] to i64 25681 // CHECK13-NEXT: [[ARRAYIDX26:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM25]] 25682 // CHECK13-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX26]], align 4 25683 // CHECK13-NEXT: [[ADD27:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 25684 // CHECK13-NEXT: [[TMP30:%.*]] = load i32*, i32** [[A]], align 8 25685 // CHECK13-NEXT: [[TMP31:%.*]] = load i32, i32* [[I19]], align 4 25686 // CHECK13-NEXT: [[IDXPROM28:%.*]] = sext i32 [[TMP31]] to i64 25687 // CHECK13-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i64 [[IDXPROM28]] 25688 // CHECK13-NEXT: store i32 [[ADD27]], i32* [[ARRAYIDX29]], align 4 25689 // CHECK13-NEXT: br label [[FOR_INC30:%.*]] 25690 // CHECK13: for.inc30: 25691 // CHECK13-NEXT: [[TMP32:%.*]] = load i32, i32* [[I19]], align 4 25692 // CHECK13-NEXT: [[INC31:%.*]] = add nsw i32 [[TMP32]], 1 25693 // CHECK13-NEXT: store i32 [[INC31]], i32* [[I19]], align 4 25694 // CHECK13-NEXT: br label [[FOR_COND20]], !llvm.loop [[LOOP12:![0-9]+]] 25695 // CHECK13: for.end32: 25696 // CHECK13-NEXT: store i32 0, i32* [[I33]], align 4 25697 // CHECK13-NEXT: br label [[FOR_COND34:%.*]] 25698 // CHECK13: for.cond34: 25699 // CHECK13-NEXT: [[TMP33:%.*]] = load i32, i32* [[I33]], align 4 25700 // CHECK13-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 25701 // CHECK13-NEXT: [[CMP35:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 25702 // CHECK13-NEXT: br i1 [[CMP35]], label [[FOR_BODY36:%.*]], label [[FOR_END46:%.*]] 25703 // CHECK13: for.body36: 25704 // CHECK13-NEXT: [[TMP35:%.*]] = load i32*, i32** [[B]], align 8 25705 // CHECK13-NEXT: [[TMP36:%.*]] = load i32, i32* [[I33]], align 4 25706 // CHECK13-NEXT: [[IDXPROM37:%.*]] = sext i32 [[TMP36]] to i64 25707 // CHECK13-NEXT: [[ARRAYIDX38:%.*]] = getelementptr inbounds i32, i32* [[TMP35]], i64 [[IDXPROM37]] 25708 // CHECK13-NEXT: [[TMP37:%.*]] = load i32, i32* [[ARRAYIDX38]], align 4 25709 // CHECK13-NEXT: [[TMP38:%.*]] = load i32*, i32** [[C]], align 8 25710 // CHECK13-NEXT: [[TMP39:%.*]] = load i32, i32* [[I33]], align 4 25711 // CHECK13-NEXT: [[IDXPROM39:%.*]] = sext i32 [[TMP39]] to i64 25712 // CHECK13-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds i32, i32* [[TMP38]], i64 [[IDXPROM39]] 25713 // CHECK13-NEXT: [[TMP40:%.*]] = load i32, i32* [[ARRAYIDX40]], align 4 25714 // CHECK13-NEXT: [[ADD41:%.*]] = add nsw i32 [[TMP37]], [[TMP40]] 25715 // CHECK13-NEXT: [[TMP41:%.*]] = load i32*, i32** [[A]], align 8 25716 // CHECK13-NEXT: [[TMP42:%.*]] = load i32, i32* [[I33]], align 4 25717 // CHECK13-NEXT: [[IDXPROM42:%.*]] = sext i32 [[TMP42]] to i64 25718 // CHECK13-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds i32, i32* [[TMP41]], i64 [[IDXPROM42]] 25719 // CHECK13-NEXT: store i32 [[ADD41]], i32* [[ARRAYIDX43]], align 4 25720 // CHECK13-NEXT: br label [[FOR_INC44:%.*]] 25721 // CHECK13: for.inc44: 25722 // CHECK13-NEXT: [[TMP43:%.*]] = load i32, i32* [[I33]], align 4 25723 // CHECK13-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP43]], 1 25724 // CHECK13-NEXT: store i32 [[INC45]], i32* [[I33]], align 4 25725 // CHECK13-NEXT: br label [[FOR_COND34]], !llvm.loop [[LOOP13:![0-9]+]] 25726 // CHECK13: for.end46: 25727 // CHECK13-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 25728 // CHECK13-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 25729 // CHECK13-NEXT: store i32 0, i32* [[I47]], align 4 25730 // CHECK13-NEXT: br label [[FOR_COND48:%.*]] 25731 // CHECK13: for.cond48: 25732 // CHECK13-NEXT: [[TMP45:%.*]] = load i32, i32* [[I47]], align 4 25733 // CHECK13-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 25734 // CHECK13-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 25735 // CHECK13-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END60:%.*]] 25736 // CHECK13: for.body50: 25737 // CHECK13-NEXT: [[TMP47:%.*]] = load i32*, i32** [[B]], align 8 25738 // CHECK13-NEXT: [[TMP48:%.*]] = load i32, i32* [[I47]], align 4 25739 // CHECK13-NEXT: [[IDXPROM51:%.*]] = sext i32 [[TMP48]] to i64 25740 // CHECK13-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds i32, i32* [[TMP47]], i64 [[IDXPROM51]] 25741 // CHECK13-NEXT: [[TMP49:%.*]] = load i32, i32* [[ARRAYIDX52]], align 4 25742 // CHECK13-NEXT: [[TMP50:%.*]] = load i32*, i32** [[C]], align 8 25743 // CHECK13-NEXT: [[TMP51:%.*]] = load i32, i32* [[I47]], align 4 25744 // CHECK13-NEXT: [[IDXPROM53:%.*]] = sext i32 [[TMP51]] to i64 25745 // CHECK13-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds i32, i32* [[TMP50]], i64 [[IDXPROM53]] 25746 // CHECK13-NEXT: [[TMP52:%.*]] = load i32, i32* [[ARRAYIDX54]], align 4 25747 // CHECK13-NEXT: [[ADD55:%.*]] = add nsw i32 [[TMP49]], [[TMP52]] 25748 // CHECK13-NEXT: [[TMP53:%.*]] = load i32*, i32** [[A]], align 8 25749 // CHECK13-NEXT: [[TMP54:%.*]] = load i32, i32* [[I47]], align 4 25750 // CHECK13-NEXT: [[IDXPROM56:%.*]] = sext i32 [[TMP54]] to i64 25751 // CHECK13-NEXT: [[ARRAYIDX57:%.*]] = getelementptr inbounds i32, i32* [[TMP53]], i64 [[IDXPROM56]] 25752 // CHECK13-NEXT: store i32 [[ADD55]], i32* [[ARRAYIDX57]], align 4 25753 // CHECK13-NEXT: br label [[FOR_INC58:%.*]] 25754 // CHECK13: for.inc58: 25755 // CHECK13-NEXT: [[TMP55:%.*]] = load i32, i32* [[I47]], align 4 25756 // CHECK13-NEXT: [[INC59:%.*]] = add nsw i32 [[TMP55]], 1 25757 // CHECK13-NEXT: store i32 [[INC59]], i32* [[I47]], align 4 25758 // CHECK13-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP14:![0-9]+]] 25759 // CHECK13: for.end60: 25760 // CHECK13-NEXT: store i32 0, i32* [[I61]], align 4 25761 // CHECK13-NEXT: br label [[FOR_COND62:%.*]] 25762 // CHECK13: for.cond62: 25763 // CHECK13-NEXT: [[TMP56:%.*]] = load i32, i32* [[I61]], align 4 25764 // CHECK13-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 25765 // CHECK13-NEXT: [[CMP63:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 25766 // CHECK13-NEXT: br i1 [[CMP63]], label [[FOR_BODY64:%.*]], label [[FOR_END74:%.*]] 25767 // CHECK13: for.body64: 25768 // CHECK13-NEXT: [[TMP58:%.*]] = load i32*, i32** [[B]], align 8 25769 // CHECK13-NEXT: [[TMP59:%.*]] = load i32, i32* [[I61]], align 4 25770 // CHECK13-NEXT: [[IDXPROM65:%.*]] = sext i32 [[TMP59]] to i64 25771 // CHECK13-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds i32, i32* [[TMP58]], i64 [[IDXPROM65]] 25772 // CHECK13-NEXT: [[TMP60:%.*]] = load i32, i32* [[ARRAYIDX66]], align 4 25773 // CHECK13-NEXT: [[TMP61:%.*]] = load i32*, i32** [[C]], align 8 25774 // CHECK13-NEXT: [[TMP62:%.*]] = load i32, i32* [[I61]], align 4 25775 // CHECK13-NEXT: [[IDXPROM67:%.*]] = sext i32 [[TMP62]] to i64 25776 // CHECK13-NEXT: [[ARRAYIDX68:%.*]] = getelementptr inbounds i32, i32* [[TMP61]], i64 [[IDXPROM67]] 25777 // CHECK13-NEXT: [[TMP63:%.*]] = load i32, i32* [[ARRAYIDX68]], align 4 25778 // CHECK13-NEXT: [[ADD69:%.*]] = add nsw i32 [[TMP60]], [[TMP63]] 25779 // CHECK13-NEXT: [[TMP64:%.*]] = load i32*, i32** [[A]], align 8 25780 // CHECK13-NEXT: [[TMP65:%.*]] = load i32, i32* [[I61]], align 4 25781 // CHECK13-NEXT: [[IDXPROM70:%.*]] = sext i32 [[TMP65]] to i64 25782 // CHECK13-NEXT: [[ARRAYIDX71:%.*]] = getelementptr inbounds i32, i32* [[TMP64]], i64 [[IDXPROM70]] 25783 // CHECK13-NEXT: store i32 [[ADD69]], i32* [[ARRAYIDX71]], align 4 25784 // CHECK13-NEXT: br label [[FOR_INC72:%.*]] 25785 // CHECK13: for.inc72: 25786 // CHECK13-NEXT: [[TMP66:%.*]] = load i32, i32* [[I61]], align 4 25787 // CHECK13-NEXT: [[INC73:%.*]] = add nsw i32 [[TMP66]], 1 25788 // CHECK13-NEXT: store i32 [[INC73]], i32* [[I61]], align 4 25789 // CHECK13-NEXT: br label [[FOR_COND62]], !llvm.loop [[LOOP15:![0-9]+]] 25790 // CHECK13: for.end74: 25791 // CHECK13-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 25792 // CHECK13-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_75]], align 4 25793 // CHECK13-NEXT: store i32 0, i32* [[I76]], align 4 25794 // CHECK13-NEXT: br label [[FOR_COND77:%.*]] 25795 // CHECK13: for.cond77: 25796 // CHECK13-NEXT: [[TMP68:%.*]] = load i32, i32* [[I76]], align 4 25797 // CHECK13-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 25798 // CHECK13-NEXT: [[CMP78:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 25799 // CHECK13-NEXT: br i1 [[CMP78]], label [[FOR_BODY79:%.*]], label [[FOR_END89:%.*]] 25800 // CHECK13: for.body79: 25801 // CHECK13-NEXT: [[TMP70:%.*]] = load i32*, i32** [[B]], align 8 25802 // CHECK13-NEXT: [[TMP71:%.*]] = load i32, i32* [[I76]], align 4 25803 // CHECK13-NEXT: [[IDXPROM80:%.*]] = sext i32 [[TMP71]] to i64 25804 // CHECK13-NEXT: [[ARRAYIDX81:%.*]] = getelementptr inbounds i32, i32* [[TMP70]], i64 [[IDXPROM80]] 25805 // CHECK13-NEXT: [[TMP72:%.*]] = load i32, i32* [[ARRAYIDX81]], align 4 25806 // CHECK13-NEXT: [[TMP73:%.*]] = load i32*, i32** [[C]], align 8 25807 // CHECK13-NEXT: [[TMP74:%.*]] = load i32, i32* [[I76]], align 4 25808 // CHECK13-NEXT: [[IDXPROM82:%.*]] = sext i32 [[TMP74]] to i64 25809 // CHECK13-NEXT: [[ARRAYIDX83:%.*]] = getelementptr inbounds i32, i32* [[TMP73]], i64 [[IDXPROM82]] 25810 // CHECK13-NEXT: [[TMP75:%.*]] = load i32, i32* [[ARRAYIDX83]], align 4 25811 // CHECK13-NEXT: [[ADD84:%.*]] = add nsw i32 [[TMP72]], [[TMP75]] 25812 // CHECK13-NEXT: [[TMP76:%.*]] = load i32*, i32** [[A]], align 8 25813 // CHECK13-NEXT: [[TMP77:%.*]] = load i32, i32* [[I76]], align 4 25814 // CHECK13-NEXT: [[IDXPROM85:%.*]] = sext i32 [[TMP77]] to i64 25815 // CHECK13-NEXT: [[ARRAYIDX86:%.*]] = getelementptr inbounds i32, i32* [[TMP76]], i64 [[IDXPROM85]] 25816 // CHECK13-NEXT: store i32 [[ADD84]], i32* [[ARRAYIDX86]], align 4 25817 // CHECK13-NEXT: br label [[FOR_INC87:%.*]] 25818 // CHECK13: for.inc87: 25819 // CHECK13-NEXT: [[TMP78:%.*]] = load i32, i32* [[I76]], align 4 25820 // CHECK13-NEXT: [[INC88:%.*]] = add nsw i32 [[TMP78]], 1 25821 // CHECK13-NEXT: store i32 [[INC88]], i32* [[I76]], align 4 25822 // CHECK13-NEXT: br label [[FOR_COND77]], !llvm.loop [[LOOP16:![0-9]+]] 25823 // CHECK13: for.end89: 25824 // CHECK13-NEXT: ret i32 0 25825 // 25826 // 25827 // CHECK14-LABEL: define {{[^@]+}}@main 25828 // CHECK14-SAME: () #[[ATTR0:[0-9]+]] { 25829 // CHECK14-NEXT: entry: 25830 // CHECK14-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 25831 // CHECK14-NEXT: [[A:%.*]] = alloca double*, align 8 25832 // CHECK14-NEXT: [[B:%.*]] = alloca double*, align 8 25833 // CHECK14-NEXT: [[C:%.*]] = alloca double*, align 8 25834 // CHECK14-NEXT: [[N:%.*]] = alloca i32, align 4 25835 // CHECK14-NEXT: [[CH:%.*]] = alloca i32, align 4 25836 // CHECK14-NEXT: [[I:%.*]] = alloca i32, align 4 25837 // CHECK14-NEXT: [[I5:%.*]] = alloca i32, align 4 25838 // CHECK14-NEXT: [[I19:%.*]] = alloca i32, align 4 25839 // CHECK14-NEXT: [[I33:%.*]] = alloca i32, align 4 25840 // CHECK14-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 25841 // CHECK14-NEXT: [[I47:%.*]] = alloca i32, align 4 25842 // CHECK14-NEXT: [[I61:%.*]] = alloca i32, align 4 25843 // CHECK14-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 25844 // CHECK14-NEXT: [[I76:%.*]] = alloca i32, align 4 25845 // CHECK14-NEXT: store i32 0, i32* [[RETVAL]], align 4 25846 // CHECK14-NEXT: store i32 10000, i32* [[N]], align 4 25847 // CHECK14-NEXT: store i32 100, i32* [[CH]], align 4 25848 // CHECK14-NEXT: store i32 0, i32* [[I]], align 4 25849 // CHECK14-NEXT: br label [[FOR_COND:%.*]] 25850 // CHECK14: for.cond: 25851 // CHECK14-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 25852 // CHECK14-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 25853 // CHECK14-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 25854 // CHECK14-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 25855 // CHECK14: for.body: 25856 // CHECK14-NEXT: [[TMP2:%.*]] = load double*, double** [[B]], align 8 25857 // CHECK14-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 25858 // CHECK14-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP3]] to i64 25859 // CHECK14-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP2]], i64 [[IDXPROM]] 25860 // CHECK14-NEXT: [[TMP4:%.*]] = load double, double* [[ARRAYIDX]], align 8 25861 // CHECK14-NEXT: [[TMP5:%.*]] = load double*, double** [[C]], align 8 25862 // CHECK14-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 25863 // CHECK14-NEXT: [[IDXPROM1:%.*]] = sext i32 [[TMP6]] to i64 25864 // CHECK14-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds double, double* [[TMP5]], i64 [[IDXPROM1]] 25865 // CHECK14-NEXT: [[TMP7:%.*]] = load double, double* [[ARRAYIDX2]], align 8 25866 // CHECK14-NEXT: [[ADD:%.*]] = fadd double [[TMP4]], [[TMP7]] 25867 // CHECK14-NEXT: [[TMP8:%.*]] = load double*, double** [[A]], align 8 25868 // CHECK14-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 25869 // CHECK14-NEXT: [[IDXPROM3:%.*]] = sext i32 [[TMP9]] to i64 25870 // CHECK14-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds double, double* [[TMP8]], i64 [[IDXPROM3]] 25871 // CHECK14-NEXT: store double [[ADD]], double* [[ARRAYIDX4]], align 8 25872 // CHECK14-NEXT: br label [[FOR_INC:%.*]] 25873 // CHECK14: for.inc: 25874 // CHECK14-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 25875 // CHECK14-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 25876 // CHECK14-NEXT: store i32 [[INC]], i32* [[I]], align 4 25877 // CHECK14-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP2:![0-9]+]] 25878 // CHECK14: for.end: 25879 // CHECK14-NEXT: store i32 0, i32* [[I5]], align 4 25880 // CHECK14-NEXT: br label [[FOR_COND6:%.*]] 25881 // CHECK14: for.cond6: 25882 // CHECK14-NEXT: [[TMP11:%.*]] = load i32, i32* [[I5]], align 4 25883 // CHECK14-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 25884 // CHECK14-NEXT: [[CMP7:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 25885 // CHECK14-NEXT: br i1 [[CMP7]], label [[FOR_BODY8:%.*]], label [[FOR_END18:%.*]] 25886 // CHECK14: for.body8: 25887 // CHECK14-NEXT: [[TMP13:%.*]] = load double*, double** [[B]], align 8 25888 // CHECK14-NEXT: [[TMP14:%.*]] = load i32, i32* [[I5]], align 4 25889 // CHECK14-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP14]] to i64 25890 // CHECK14-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP13]], i64 [[IDXPROM9]] 25891 // CHECK14-NEXT: [[TMP15:%.*]] = load double, double* [[ARRAYIDX10]], align 8 25892 // CHECK14-NEXT: [[TMP16:%.*]] = load double*, double** [[C]], align 8 25893 // CHECK14-NEXT: [[TMP17:%.*]] = load i32, i32* [[I5]], align 4 25894 // CHECK14-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP17]] to i64 25895 // CHECK14-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds double, double* [[TMP16]], i64 [[IDXPROM11]] 25896 // CHECK14-NEXT: [[TMP18:%.*]] = load double, double* [[ARRAYIDX12]], align 8 25897 // CHECK14-NEXT: [[ADD13:%.*]] = fadd double [[TMP15]], [[TMP18]] 25898 // CHECK14-NEXT: [[TMP19:%.*]] = load double*, double** [[A]], align 8 25899 // CHECK14-NEXT: [[TMP20:%.*]] = load i32, i32* [[I5]], align 4 25900 // CHECK14-NEXT: [[IDXPROM14:%.*]] = sext i32 [[TMP20]] to i64 25901 // CHECK14-NEXT: [[ARRAYIDX15:%.*]] = getelementptr inbounds double, double* [[TMP19]], i64 [[IDXPROM14]] 25902 // CHECK14-NEXT: store double [[ADD13]], double* [[ARRAYIDX15]], align 8 25903 // CHECK14-NEXT: br label [[FOR_INC16:%.*]] 25904 // CHECK14: for.inc16: 25905 // CHECK14-NEXT: [[TMP21:%.*]] = load i32, i32* [[I5]], align 4 25906 // CHECK14-NEXT: [[INC17:%.*]] = add nsw i32 [[TMP21]], 1 25907 // CHECK14-NEXT: store i32 [[INC17]], i32* [[I5]], align 4 25908 // CHECK14-NEXT: br label [[FOR_COND6]], !llvm.loop [[LOOP4:![0-9]+]] 25909 // CHECK14: for.end18: 25910 // CHECK14-NEXT: store i32 0, i32* [[I19]], align 4 25911 // CHECK14-NEXT: br label [[FOR_COND20:%.*]] 25912 // CHECK14: for.cond20: 25913 // CHECK14-NEXT: [[TMP22:%.*]] = load i32, i32* [[I19]], align 4 25914 // CHECK14-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 25915 // CHECK14-NEXT: [[CMP21:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 25916 // CHECK14-NEXT: br i1 [[CMP21]], label [[FOR_BODY22:%.*]], label [[FOR_END32:%.*]] 25917 // CHECK14: for.body22: 25918 // CHECK14-NEXT: [[TMP24:%.*]] = load double*, double** [[B]], align 8 25919 // CHECK14-NEXT: [[TMP25:%.*]] = load i32, i32* [[I19]], align 4 25920 // CHECK14-NEXT: [[IDXPROM23:%.*]] = sext i32 [[TMP25]] to i64 25921 // CHECK14-NEXT: [[ARRAYIDX24:%.*]] = getelementptr inbounds double, double* [[TMP24]], i64 [[IDXPROM23]] 25922 // CHECK14-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX24]], align 8 25923 // CHECK14-NEXT: [[TMP27:%.*]] = load double*, double** [[C]], align 8 25924 // CHECK14-NEXT: [[TMP28:%.*]] = load i32, i32* [[I19]], align 4 25925 // CHECK14-NEXT: [[IDXPROM25:%.*]] = sext i32 [[TMP28]] to i64 25926 // CHECK14-NEXT: [[ARRAYIDX26:%.*]] = getelementptr inbounds double, double* [[TMP27]], i64 [[IDXPROM25]] 25927 // CHECK14-NEXT: [[TMP29:%.*]] = load double, double* [[ARRAYIDX26]], align 8 25928 // CHECK14-NEXT: [[ADD27:%.*]] = fadd double [[TMP26]], [[TMP29]] 25929 // CHECK14-NEXT: [[TMP30:%.*]] = load double*, double** [[A]], align 8 25930 // CHECK14-NEXT: [[TMP31:%.*]] = load i32, i32* [[I19]], align 4 25931 // CHECK14-NEXT: [[IDXPROM28:%.*]] = sext i32 [[TMP31]] to i64 25932 // CHECK14-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds double, double* [[TMP30]], i64 [[IDXPROM28]] 25933 // CHECK14-NEXT: store double [[ADD27]], double* [[ARRAYIDX29]], align 8 25934 // CHECK14-NEXT: br label [[FOR_INC30:%.*]] 25935 // CHECK14: for.inc30: 25936 // CHECK14-NEXT: [[TMP32:%.*]] = load i32, i32* [[I19]], align 4 25937 // CHECK14-NEXT: [[INC31:%.*]] = add nsw i32 [[TMP32]], 1 25938 // CHECK14-NEXT: store i32 [[INC31]], i32* [[I19]], align 4 25939 // CHECK14-NEXT: br label [[FOR_COND20]], !llvm.loop [[LOOP5:![0-9]+]] 25940 // CHECK14: for.end32: 25941 // CHECK14-NEXT: store i32 0, i32* [[I33]], align 4 25942 // CHECK14-NEXT: br label [[FOR_COND34:%.*]] 25943 // CHECK14: for.cond34: 25944 // CHECK14-NEXT: [[TMP33:%.*]] = load i32, i32* [[I33]], align 4 25945 // CHECK14-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 25946 // CHECK14-NEXT: [[CMP35:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 25947 // CHECK14-NEXT: br i1 [[CMP35]], label [[FOR_BODY36:%.*]], label [[FOR_END46:%.*]] 25948 // CHECK14: for.body36: 25949 // CHECK14-NEXT: [[TMP35:%.*]] = load double*, double** [[B]], align 8 25950 // CHECK14-NEXT: [[TMP36:%.*]] = load i32, i32* [[I33]], align 4 25951 // CHECK14-NEXT: [[IDXPROM37:%.*]] = sext i32 [[TMP36]] to i64 25952 // CHECK14-NEXT: [[ARRAYIDX38:%.*]] = getelementptr inbounds double, double* [[TMP35]], i64 [[IDXPROM37]] 25953 // CHECK14-NEXT: [[TMP37:%.*]] = load double, double* [[ARRAYIDX38]], align 8 25954 // CHECK14-NEXT: [[TMP38:%.*]] = load double*, double** [[C]], align 8 25955 // CHECK14-NEXT: [[TMP39:%.*]] = load i32, i32* [[I33]], align 4 25956 // CHECK14-NEXT: [[IDXPROM39:%.*]] = sext i32 [[TMP39]] to i64 25957 // CHECK14-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds double, double* [[TMP38]], i64 [[IDXPROM39]] 25958 // CHECK14-NEXT: [[TMP40:%.*]] = load double, double* [[ARRAYIDX40]], align 8 25959 // CHECK14-NEXT: [[ADD41:%.*]] = fadd double [[TMP37]], [[TMP40]] 25960 // CHECK14-NEXT: [[TMP41:%.*]] = load double*, double** [[A]], align 8 25961 // CHECK14-NEXT: [[TMP42:%.*]] = load i32, i32* [[I33]], align 4 25962 // CHECK14-NEXT: [[IDXPROM42:%.*]] = sext i32 [[TMP42]] to i64 25963 // CHECK14-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds double, double* [[TMP41]], i64 [[IDXPROM42]] 25964 // CHECK14-NEXT: store double [[ADD41]], double* [[ARRAYIDX43]], align 8 25965 // CHECK14-NEXT: br label [[FOR_INC44:%.*]] 25966 // CHECK14: for.inc44: 25967 // CHECK14-NEXT: [[TMP43:%.*]] = load i32, i32* [[I33]], align 4 25968 // CHECK14-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP43]], 1 25969 // CHECK14-NEXT: store i32 [[INC45]], i32* [[I33]], align 4 25970 // CHECK14-NEXT: br label [[FOR_COND34]], !llvm.loop [[LOOP6:![0-9]+]] 25971 // CHECK14: for.end46: 25972 // CHECK14-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 25973 // CHECK14-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 25974 // CHECK14-NEXT: store i32 0, i32* [[I47]], align 4 25975 // CHECK14-NEXT: br label [[FOR_COND48:%.*]] 25976 // CHECK14: for.cond48: 25977 // CHECK14-NEXT: [[TMP45:%.*]] = load i32, i32* [[I47]], align 4 25978 // CHECK14-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 25979 // CHECK14-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 25980 // CHECK14-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END60:%.*]] 25981 // CHECK14: for.body50: 25982 // CHECK14-NEXT: [[TMP47:%.*]] = load double*, double** [[B]], align 8 25983 // CHECK14-NEXT: [[TMP48:%.*]] = load i32, i32* [[I47]], align 4 25984 // CHECK14-NEXT: [[IDXPROM51:%.*]] = sext i32 [[TMP48]] to i64 25985 // CHECK14-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds double, double* [[TMP47]], i64 [[IDXPROM51]] 25986 // CHECK14-NEXT: [[TMP49:%.*]] = load double, double* [[ARRAYIDX52]], align 8 25987 // CHECK14-NEXT: [[TMP50:%.*]] = load double*, double** [[C]], align 8 25988 // CHECK14-NEXT: [[TMP51:%.*]] = load i32, i32* [[I47]], align 4 25989 // CHECK14-NEXT: [[IDXPROM53:%.*]] = sext i32 [[TMP51]] to i64 25990 // CHECK14-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds double, double* [[TMP50]], i64 [[IDXPROM53]] 25991 // CHECK14-NEXT: [[TMP52:%.*]] = load double, double* [[ARRAYIDX54]], align 8 25992 // CHECK14-NEXT: [[ADD55:%.*]] = fadd double [[TMP49]], [[TMP52]] 25993 // CHECK14-NEXT: [[TMP53:%.*]] = load double*, double** [[A]], align 8 25994 // CHECK14-NEXT: [[TMP54:%.*]] = load i32, i32* [[I47]], align 4 25995 // CHECK14-NEXT: [[IDXPROM56:%.*]] = sext i32 [[TMP54]] to i64 25996 // CHECK14-NEXT: [[ARRAYIDX57:%.*]] = getelementptr inbounds double, double* [[TMP53]], i64 [[IDXPROM56]] 25997 // CHECK14-NEXT: store double [[ADD55]], double* [[ARRAYIDX57]], align 8 25998 // CHECK14-NEXT: br label [[FOR_INC58:%.*]] 25999 // CHECK14: for.inc58: 26000 // CHECK14-NEXT: [[TMP55:%.*]] = load i32, i32* [[I47]], align 4 26001 // CHECK14-NEXT: [[INC59:%.*]] = add nsw i32 [[TMP55]], 1 26002 // CHECK14-NEXT: store i32 [[INC59]], i32* [[I47]], align 4 26003 // CHECK14-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP7:![0-9]+]] 26004 // CHECK14: for.end60: 26005 // CHECK14-NEXT: store i32 0, i32* [[I61]], align 4 26006 // CHECK14-NEXT: br label [[FOR_COND62:%.*]] 26007 // CHECK14: for.cond62: 26008 // CHECK14-NEXT: [[TMP56:%.*]] = load i32, i32* [[I61]], align 4 26009 // CHECK14-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 26010 // CHECK14-NEXT: [[CMP63:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 26011 // CHECK14-NEXT: br i1 [[CMP63]], label [[FOR_BODY64:%.*]], label [[FOR_END74:%.*]] 26012 // CHECK14: for.body64: 26013 // CHECK14-NEXT: [[TMP58:%.*]] = load double*, double** [[B]], align 8 26014 // CHECK14-NEXT: [[TMP59:%.*]] = load i32, i32* [[I61]], align 4 26015 // CHECK14-NEXT: [[IDXPROM65:%.*]] = sext i32 [[TMP59]] to i64 26016 // CHECK14-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds double, double* [[TMP58]], i64 [[IDXPROM65]] 26017 // CHECK14-NEXT: [[TMP60:%.*]] = load double, double* [[ARRAYIDX66]], align 8 26018 // CHECK14-NEXT: [[TMP61:%.*]] = load double*, double** [[C]], align 8 26019 // CHECK14-NEXT: [[TMP62:%.*]] = load i32, i32* [[I61]], align 4 26020 // CHECK14-NEXT: [[IDXPROM67:%.*]] = sext i32 [[TMP62]] to i64 26021 // CHECK14-NEXT: [[ARRAYIDX68:%.*]] = getelementptr inbounds double, double* [[TMP61]], i64 [[IDXPROM67]] 26022 // CHECK14-NEXT: [[TMP63:%.*]] = load double, double* [[ARRAYIDX68]], align 8 26023 // CHECK14-NEXT: [[ADD69:%.*]] = fadd double [[TMP60]], [[TMP63]] 26024 // CHECK14-NEXT: [[TMP64:%.*]] = load double*, double** [[A]], align 8 26025 // CHECK14-NEXT: [[TMP65:%.*]] = load i32, i32* [[I61]], align 4 26026 // CHECK14-NEXT: [[IDXPROM70:%.*]] = sext i32 [[TMP65]] to i64 26027 // CHECK14-NEXT: [[ARRAYIDX71:%.*]] = getelementptr inbounds double, double* [[TMP64]], i64 [[IDXPROM70]] 26028 // CHECK14-NEXT: store double [[ADD69]], double* [[ARRAYIDX71]], align 8 26029 // CHECK14-NEXT: br label [[FOR_INC72:%.*]] 26030 // CHECK14: for.inc72: 26031 // CHECK14-NEXT: [[TMP66:%.*]] = load i32, i32* [[I61]], align 4 26032 // CHECK14-NEXT: [[INC73:%.*]] = add nsw i32 [[TMP66]], 1 26033 // CHECK14-NEXT: store i32 [[INC73]], i32* [[I61]], align 4 26034 // CHECK14-NEXT: br label [[FOR_COND62]], !llvm.loop [[LOOP8:![0-9]+]] 26035 // CHECK14: for.end74: 26036 // CHECK14-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 26037 // CHECK14-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_75]], align 4 26038 // CHECK14-NEXT: store i32 0, i32* [[I76]], align 4 26039 // CHECK14-NEXT: br label [[FOR_COND77:%.*]] 26040 // CHECK14: for.cond77: 26041 // CHECK14-NEXT: [[TMP68:%.*]] = load i32, i32* [[I76]], align 4 26042 // CHECK14-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 26043 // CHECK14-NEXT: [[CMP78:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 26044 // CHECK14-NEXT: br i1 [[CMP78]], label [[FOR_BODY79:%.*]], label [[FOR_END89:%.*]] 26045 // CHECK14: for.body79: 26046 // CHECK14-NEXT: [[TMP70:%.*]] = load double*, double** [[B]], align 8 26047 // CHECK14-NEXT: [[TMP71:%.*]] = load i32, i32* [[I76]], align 4 26048 // CHECK14-NEXT: [[IDXPROM80:%.*]] = sext i32 [[TMP71]] to i64 26049 // CHECK14-NEXT: [[ARRAYIDX81:%.*]] = getelementptr inbounds double, double* [[TMP70]], i64 [[IDXPROM80]] 26050 // CHECK14-NEXT: [[TMP72:%.*]] = load double, double* [[ARRAYIDX81]], align 8 26051 // CHECK14-NEXT: [[TMP73:%.*]] = load double*, double** [[C]], align 8 26052 // CHECK14-NEXT: [[TMP74:%.*]] = load i32, i32* [[I76]], align 4 26053 // CHECK14-NEXT: [[IDXPROM82:%.*]] = sext i32 [[TMP74]] to i64 26054 // CHECK14-NEXT: [[ARRAYIDX83:%.*]] = getelementptr inbounds double, double* [[TMP73]], i64 [[IDXPROM82]] 26055 // CHECK14-NEXT: [[TMP75:%.*]] = load double, double* [[ARRAYIDX83]], align 8 26056 // CHECK14-NEXT: [[ADD84:%.*]] = fadd double [[TMP72]], [[TMP75]] 26057 // CHECK14-NEXT: [[TMP76:%.*]] = load double*, double** [[A]], align 8 26058 // CHECK14-NEXT: [[TMP77:%.*]] = load i32, i32* [[I76]], align 4 26059 // CHECK14-NEXT: [[IDXPROM85:%.*]] = sext i32 [[TMP77]] to i64 26060 // CHECK14-NEXT: [[ARRAYIDX86:%.*]] = getelementptr inbounds double, double* [[TMP76]], i64 [[IDXPROM85]] 26061 // CHECK14-NEXT: store double [[ADD84]], double* [[ARRAYIDX86]], align 8 26062 // CHECK14-NEXT: br label [[FOR_INC87:%.*]] 26063 // CHECK14: for.inc87: 26064 // CHECK14-NEXT: [[TMP78:%.*]] = load i32, i32* [[I76]], align 4 26065 // CHECK14-NEXT: [[INC88:%.*]] = add nsw i32 [[TMP78]], 1 26066 // CHECK14-NEXT: store i32 [[INC88]], i32* [[I76]], align 4 26067 // CHECK14-NEXT: br label [[FOR_COND77]], !llvm.loop [[LOOP9:![0-9]+]] 26068 // CHECK14: for.end89: 26069 // CHECK14-NEXT: [[CALL:%.*]] = call signext i32 @_Z5tmainIiET_v() 26070 // CHECK14-NEXT: ret i32 [[CALL]] 26071 // 26072 // 26073 // CHECK14-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 26074 // CHECK14-SAME: () #[[ATTR1:[0-9]+]] comdat { 26075 // CHECK14-NEXT: entry: 26076 // CHECK14-NEXT: [[A:%.*]] = alloca i32*, align 8 26077 // CHECK14-NEXT: [[B:%.*]] = alloca i32*, align 8 26078 // CHECK14-NEXT: [[C:%.*]] = alloca i32*, align 8 26079 // CHECK14-NEXT: [[N:%.*]] = alloca i32, align 4 26080 // CHECK14-NEXT: [[CH:%.*]] = alloca i32, align 4 26081 // CHECK14-NEXT: [[I:%.*]] = alloca i32, align 4 26082 // CHECK14-NEXT: [[I5:%.*]] = alloca i32, align 4 26083 // CHECK14-NEXT: [[I19:%.*]] = alloca i32, align 4 26084 // CHECK14-NEXT: [[I33:%.*]] = alloca i32, align 4 26085 // CHECK14-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 26086 // CHECK14-NEXT: [[I47:%.*]] = alloca i32, align 4 26087 // CHECK14-NEXT: [[I61:%.*]] = alloca i32, align 4 26088 // CHECK14-NEXT: [[DOTCAPTURE_EXPR_75:%.*]] = alloca i32, align 4 26089 // CHECK14-NEXT: [[I76:%.*]] = alloca i32, align 4 26090 // CHECK14-NEXT: store i32 10000, i32* [[N]], align 4 26091 // CHECK14-NEXT: store i32 100, i32* [[CH]], align 4 26092 // CHECK14-NEXT: store i32 0, i32* [[I]], align 4 26093 // CHECK14-NEXT: br label [[FOR_COND:%.*]] 26094 // CHECK14: for.cond: 26095 // CHECK14-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 26096 // CHECK14-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 26097 // CHECK14-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 26098 // CHECK14-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 26099 // CHECK14: for.body: 26100 // CHECK14-NEXT: [[TMP2:%.*]] = load i32*, i32** [[B]], align 8 26101 // CHECK14-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 26102 // CHECK14-NEXT: [[IDXPROM:%.*]] = sext i32 [[TMP3]] to i64 26103 // CHECK14-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP2]], i64 [[IDXPROM]] 26104 // CHECK14-NEXT: [[TMP4:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 26105 // CHECK14-NEXT: [[TMP5:%.*]] = load i32*, i32** [[C]], align 8 26106 // CHECK14-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 26107 // CHECK14-NEXT: [[IDXPROM1:%.*]] = sext i32 [[TMP6]] to i64 26108 // CHECK14-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, i32* [[TMP5]], i64 [[IDXPROM1]] 26109 // CHECK14-NEXT: [[TMP7:%.*]] = load i32, i32* [[ARRAYIDX2]], align 4 26110 // CHECK14-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP4]], [[TMP7]] 26111 // CHECK14-NEXT: [[TMP8:%.*]] = load i32*, i32** [[A]], align 8 26112 // CHECK14-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 26113 // CHECK14-NEXT: [[IDXPROM3:%.*]] = sext i32 [[TMP9]] to i64 26114 // CHECK14-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds i32, i32* [[TMP8]], i64 [[IDXPROM3]] 26115 // CHECK14-NEXT: store i32 [[ADD]], i32* [[ARRAYIDX4]], align 4 26116 // CHECK14-NEXT: br label [[FOR_INC:%.*]] 26117 // CHECK14: for.inc: 26118 // CHECK14-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 26119 // CHECK14-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 26120 // CHECK14-NEXT: store i32 [[INC]], i32* [[I]], align 4 26121 // CHECK14-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP10:![0-9]+]] 26122 // CHECK14: for.end: 26123 // CHECK14-NEXT: store i32 0, i32* [[I5]], align 4 26124 // CHECK14-NEXT: br label [[FOR_COND6:%.*]] 26125 // CHECK14: for.cond6: 26126 // CHECK14-NEXT: [[TMP11:%.*]] = load i32, i32* [[I5]], align 4 26127 // CHECK14-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 26128 // CHECK14-NEXT: [[CMP7:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 26129 // CHECK14-NEXT: br i1 [[CMP7]], label [[FOR_BODY8:%.*]], label [[FOR_END18:%.*]] 26130 // CHECK14: for.body8: 26131 // CHECK14-NEXT: [[TMP13:%.*]] = load i32*, i32** [[B]], align 8 26132 // CHECK14-NEXT: [[TMP14:%.*]] = load i32, i32* [[I5]], align 4 26133 // CHECK14-NEXT: [[IDXPROM9:%.*]] = sext i32 [[TMP14]] to i64 26134 // CHECK14-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP13]], i64 [[IDXPROM9]] 26135 // CHECK14-NEXT: [[TMP15:%.*]] = load i32, i32* [[ARRAYIDX10]], align 4 26136 // CHECK14-NEXT: [[TMP16:%.*]] = load i32*, i32** [[C]], align 8 26137 // CHECK14-NEXT: [[TMP17:%.*]] = load i32, i32* [[I5]], align 4 26138 // CHECK14-NEXT: [[IDXPROM11:%.*]] = sext i32 [[TMP17]] to i64 26139 // CHECK14-NEXT: [[ARRAYIDX12:%.*]] = getelementptr inbounds i32, i32* [[TMP16]], i64 [[IDXPROM11]] 26140 // CHECK14-NEXT: [[TMP18:%.*]] = load i32, i32* [[ARRAYIDX12]], align 4 26141 // CHECK14-NEXT: [[ADD13:%.*]] = add nsw i32 [[TMP15]], [[TMP18]] 26142 // CHECK14-NEXT: [[TMP19:%.*]] = load i32*, i32** [[A]], align 8 26143 // CHECK14-NEXT: [[TMP20:%.*]] = load i32, i32* [[I5]], align 4 26144 // CHECK14-NEXT: [[IDXPROM14:%.*]] = sext i32 [[TMP20]] to i64 26145 // CHECK14-NEXT: [[ARRAYIDX15:%.*]] = getelementptr inbounds i32, i32* [[TMP19]], i64 [[IDXPROM14]] 26146 // CHECK14-NEXT: store i32 [[ADD13]], i32* [[ARRAYIDX15]], align 4 26147 // CHECK14-NEXT: br label [[FOR_INC16:%.*]] 26148 // CHECK14: for.inc16: 26149 // CHECK14-NEXT: [[TMP21:%.*]] = load i32, i32* [[I5]], align 4 26150 // CHECK14-NEXT: [[INC17:%.*]] = add nsw i32 [[TMP21]], 1 26151 // CHECK14-NEXT: store i32 [[INC17]], i32* [[I5]], align 4 26152 // CHECK14-NEXT: br label [[FOR_COND6]], !llvm.loop [[LOOP11:![0-9]+]] 26153 // CHECK14: for.end18: 26154 // CHECK14-NEXT: store i32 0, i32* [[I19]], align 4 26155 // CHECK14-NEXT: br label [[FOR_COND20:%.*]] 26156 // CHECK14: for.cond20: 26157 // CHECK14-NEXT: [[TMP22:%.*]] = load i32, i32* [[I19]], align 4 26158 // CHECK14-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 26159 // CHECK14-NEXT: [[CMP21:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 26160 // CHECK14-NEXT: br i1 [[CMP21]], label [[FOR_BODY22:%.*]], label [[FOR_END32:%.*]] 26161 // CHECK14: for.body22: 26162 // CHECK14-NEXT: [[TMP24:%.*]] = load i32*, i32** [[B]], align 8 26163 // CHECK14-NEXT: [[TMP25:%.*]] = load i32, i32* [[I19]], align 4 26164 // CHECK14-NEXT: [[IDXPROM23:%.*]] = sext i32 [[TMP25]] to i64 26165 // CHECK14-NEXT: [[ARRAYIDX24:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i64 [[IDXPROM23]] 26166 // CHECK14-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX24]], align 4 26167 // CHECK14-NEXT: [[TMP27:%.*]] = load i32*, i32** [[C]], align 8 26168 // CHECK14-NEXT: [[TMP28:%.*]] = load i32, i32* [[I19]], align 4 26169 // CHECK14-NEXT: [[IDXPROM25:%.*]] = sext i32 [[TMP28]] to i64 26170 // CHECK14-NEXT: [[ARRAYIDX26:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i64 [[IDXPROM25]] 26171 // CHECK14-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX26]], align 4 26172 // CHECK14-NEXT: [[ADD27:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 26173 // CHECK14-NEXT: [[TMP30:%.*]] = load i32*, i32** [[A]], align 8 26174 // CHECK14-NEXT: [[TMP31:%.*]] = load i32, i32* [[I19]], align 4 26175 // CHECK14-NEXT: [[IDXPROM28:%.*]] = sext i32 [[TMP31]] to i64 26176 // CHECK14-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i64 [[IDXPROM28]] 26177 // CHECK14-NEXT: store i32 [[ADD27]], i32* [[ARRAYIDX29]], align 4 26178 // CHECK14-NEXT: br label [[FOR_INC30:%.*]] 26179 // CHECK14: for.inc30: 26180 // CHECK14-NEXT: [[TMP32:%.*]] = load i32, i32* [[I19]], align 4 26181 // CHECK14-NEXT: [[INC31:%.*]] = add nsw i32 [[TMP32]], 1 26182 // CHECK14-NEXT: store i32 [[INC31]], i32* [[I19]], align 4 26183 // CHECK14-NEXT: br label [[FOR_COND20]], !llvm.loop [[LOOP12:![0-9]+]] 26184 // CHECK14: for.end32: 26185 // CHECK14-NEXT: store i32 0, i32* [[I33]], align 4 26186 // CHECK14-NEXT: br label [[FOR_COND34:%.*]] 26187 // CHECK14: for.cond34: 26188 // CHECK14-NEXT: [[TMP33:%.*]] = load i32, i32* [[I33]], align 4 26189 // CHECK14-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 26190 // CHECK14-NEXT: [[CMP35:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 26191 // CHECK14-NEXT: br i1 [[CMP35]], label [[FOR_BODY36:%.*]], label [[FOR_END46:%.*]] 26192 // CHECK14: for.body36: 26193 // CHECK14-NEXT: [[TMP35:%.*]] = load i32*, i32** [[B]], align 8 26194 // CHECK14-NEXT: [[TMP36:%.*]] = load i32, i32* [[I33]], align 4 26195 // CHECK14-NEXT: [[IDXPROM37:%.*]] = sext i32 [[TMP36]] to i64 26196 // CHECK14-NEXT: [[ARRAYIDX38:%.*]] = getelementptr inbounds i32, i32* [[TMP35]], i64 [[IDXPROM37]] 26197 // CHECK14-NEXT: [[TMP37:%.*]] = load i32, i32* [[ARRAYIDX38]], align 4 26198 // CHECK14-NEXT: [[TMP38:%.*]] = load i32*, i32** [[C]], align 8 26199 // CHECK14-NEXT: [[TMP39:%.*]] = load i32, i32* [[I33]], align 4 26200 // CHECK14-NEXT: [[IDXPROM39:%.*]] = sext i32 [[TMP39]] to i64 26201 // CHECK14-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds i32, i32* [[TMP38]], i64 [[IDXPROM39]] 26202 // CHECK14-NEXT: [[TMP40:%.*]] = load i32, i32* [[ARRAYIDX40]], align 4 26203 // CHECK14-NEXT: [[ADD41:%.*]] = add nsw i32 [[TMP37]], [[TMP40]] 26204 // CHECK14-NEXT: [[TMP41:%.*]] = load i32*, i32** [[A]], align 8 26205 // CHECK14-NEXT: [[TMP42:%.*]] = load i32, i32* [[I33]], align 4 26206 // CHECK14-NEXT: [[IDXPROM42:%.*]] = sext i32 [[TMP42]] to i64 26207 // CHECK14-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds i32, i32* [[TMP41]], i64 [[IDXPROM42]] 26208 // CHECK14-NEXT: store i32 [[ADD41]], i32* [[ARRAYIDX43]], align 4 26209 // CHECK14-NEXT: br label [[FOR_INC44:%.*]] 26210 // CHECK14: for.inc44: 26211 // CHECK14-NEXT: [[TMP43:%.*]] = load i32, i32* [[I33]], align 4 26212 // CHECK14-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP43]], 1 26213 // CHECK14-NEXT: store i32 [[INC45]], i32* [[I33]], align 4 26214 // CHECK14-NEXT: br label [[FOR_COND34]], !llvm.loop [[LOOP13:![0-9]+]] 26215 // CHECK14: for.end46: 26216 // CHECK14-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 26217 // CHECK14-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 26218 // CHECK14-NEXT: store i32 0, i32* [[I47]], align 4 26219 // CHECK14-NEXT: br label [[FOR_COND48:%.*]] 26220 // CHECK14: for.cond48: 26221 // CHECK14-NEXT: [[TMP45:%.*]] = load i32, i32* [[I47]], align 4 26222 // CHECK14-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 26223 // CHECK14-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 26224 // CHECK14-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END60:%.*]] 26225 // CHECK14: for.body50: 26226 // CHECK14-NEXT: [[TMP47:%.*]] = load i32*, i32** [[B]], align 8 26227 // CHECK14-NEXT: [[TMP48:%.*]] = load i32, i32* [[I47]], align 4 26228 // CHECK14-NEXT: [[IDXPROM51:%.*]] = sext i32 [[TMP48]] to i64 26229 // CHECK14-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds i32, i32* [[TMP47]], i64 [[IDXPROM51]] 26230 // CHECK14-NEXT: [[TMP49:%.*]] = load i32, i32* [[ARRAYIDX52]], align 4 26231 // CHECK14-NEXT: [[TMP50:%.*]] = load i32*, i32** [[C]], align 8 26232 // CHECK14-NEXT: [[TMP51:%.*]] = load i32, i32* [[I47]], align 4 26233 // CHECK14-NEXT: [[IDXPROM53:%.*]] = sext i32 [[TMP51]] to i64 26234 // CHECK14-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds i32, i32* [[TMP50]], i64 [[IDXPROM53]] 26235 // CHECK14-NEXT: [[TMP52:%.*]] = load i32, i32* [[ARRAYIDX54]], align 4 26236 // CHECK14-NEXT: [[ADD55:%.*]] = add nsw i32 [[TMP49]], [[TMP52]] 26237 // CHECK14-NEXT: [[TMP53:%.*]] = load i32*, i32** [[A]], align 8 26238 // CHECK14-NEXT: [[TMP54:%.*]] = load i32, i32* [[I47]], align 4 26239 // CHECK14-NEXT: [[IDXPROM56:%.*]] = sext i32 [[TMP54]] to i64 26240 // CHECK14-NEXT: [[ARRAYIDX57:%.*]] = getelementptr inbounds i32, i32* [[TMP53]], i64 [[IDXPROM56]] 26241 // CHECK14-NEXT: store i32 [[ADD55]], i32* [[ARRAYIDX57]], align 4 26242 // CHECK14-NEXT: br label [[FOR_INC58:%.*]] 26243 // CHECK14: for.inc58: 26244 // CHECK14-NEXT: [[TMP55:%.*]] = load i32, i32* [[I47]], align 4 26245 // CHECK14-NEXT: [[INC59:%.*]] = add nsw i32 [[TMP55]], 1 26246 // CHECK14-NEXT: store i32 [[INC59]], i32* [[I47]], align 4 26247 // CHECK14-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP14:![0-9]+]] 26248 // CHECK14: for.end60: 26249 // CHECK14-NEXT: store i32 0, i32* [[I61]], align 4 26250 // CHECK14-NEXT: br label [[FOR_COND62:%.*]] 26251 // CHECK14: for.cond62: 26252 // CHECK14-NEXT: [[TMP56:%.*]] = load i32, i32* [[I61]], align 4 26253 // CHECK14-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 26254 // CHECK14-NEXT: [[CMP63:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 26255 // CHECK14-NEXT: br i1 [[CMP63]], label [[FOR_BODY64:%.*]], label [[FOR_END74:%.*]] 26256 // CHECK14: for.body64: 26257 // CHECK14-NEXT: [[TMP58:%.*]] = load i32*, i32** [[B]], align 8 26258 // CHECK14-NEXT: [[TMP59:%.*]] = load i32, i32* [[I61]], align 4 26259 // CHECK14-NEXT: [[IDXPROM65:%.*]] = sext i32 [[TMP59]] to i64 26260 // CHECK14-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds i32, i32* [[TMP58]], i64 [[IDXPROM65]] 26261 // CHECK14-NEXT: [[TMP60:%.*]] = load i32, i32* [[ARRAYIDX66]], align 4 26262 // CHECK14-NEXT: [[TMP61:%.*]] = load i32*, i32** [[C]], align 8 26263 // CHECK14-NEXT: [[TMP62:%.*]] = load i32, i32* [[I61]], align 4 26264 // CHECK14-NEXT: [[IDXPROM67:%.*]] = sext i32 [[TMP62]] to i64 26265 // CHECK14-NEXT: [[ARRAYIDX68:%.*]] = getelementptr inbounds i32, i32* [[TMP61]], i64 [[IDXPROM67]] 26266 // CHECK14-NEXT: [[TMP63:%.*]] = load i32, i32* [[ARRAYIDX68]], align 4 26267 // CHECK14-NEXT: [[ADD69:%.*]] = add nsw i32 [[TMP60]], [[TMP63]] 26268 // CHECK14-NEXT: [[TMP64:%.*]] = load i32*, i32** [[A]], align 8 26269 // CHECK14-NEXT: [[TMP65:%.*]] = load i32, i32* [[I61]], align 4 26270 // CHECK14-NEXT: [[IDXPROM70:%.*]] = sext i32 [[TMP65]] to i64 26271 // CHECK14-NEXT: [[ARRAYIDX71:%.*]] = getelementptr inbounds i32, i32* [[TMP64]], i64 [[IDXPROM70]] 26272 // CHECK14-NEXT: store i32 [[ADD69]], i32* [[ARRAYIDX71]], align 4 26273 // CHECK14-NEXT: br label [[FOR_INC72:%.*]] 26274 // CHECK14: for.inc72: 26275 // CHECK14-NEXT: [[TMP66:%.*]] = load i32, i32* [[I61]], align 4 26276 // CHECK14-NEXT: [[INC73:%.*]] = add nsw i32 [[TMP66]], 1 26277 // CHECK14-NEXT: store i32 [[INC73]], i32* [[I61]], align 4 26278 // CHECK14-NEXT: br label [[FOR_COND62]], !llvm.loop [[LOOP15:![0-9]+]] 26279 // CHECK14: for.end74: 26280 // CHECK14-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 26281 // CHECK14-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_75]], align 4 26282 // CHECK14-NEXT: store i32 0, i32* [[I76]], align 4 26283 // CHECK14-NEXT: br label [[FOR_COND77:%.*]] 26284 // CHECK14: for.cond77: 26285 // CHECK14-NEXT: [[TMP68:%.*]] = load i32, i32* [[I76]], align 4 26286 // CHECK14-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 26287 // CHECK14-NEXT: [[CMP78:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 26288 // CHECK14-NEXT: br i1 [[CMP78]], label [[FOR_BODY79:%.*]], label [[FOR_END89:%.*]] 26289 // CHECK14: for.body79: 26290 // CHECK14-NEXT: [[TMP70:%.*]] = load i32*, i32** [[B]], align 8 26291 // CHECK14-NEXT: [[TMP71:%.*]] = load i32, i32* [[I76]], align 4 26292 // CHECK14-NEXT: [[IDXPROM80:%.*]] = sext i32 [[TMP71]] to i64 26293 // CHECK14-NEXT: [[ARRAYIDX81:%.*]] = getelementptr inbounds i32, i32* [[TMP70]], i64 [[IDXPROM80]] 26294 // CHECK14-NEXT: [[TMP72:%.*]] = load i32, i32* [[ARRAYIDX81]], align 4 26295 // CHECK14-NEXT: [[TMP73:%.*]] = load i32*, i32** [[C]], align 8 26296 // CHECK14-NEXT: [[TMP74:%.*]] = load i32, i32* [[I76]], align 4 26297 // CHECK14-NEXT: [[IDXPROM82:%.*]] = sext i32 [[TMP74]] to i64 26298 // CHECK14-NEXT: [[ARRAYIDX83:%.*]] = getelementptr inbounds i32, i32* [[TMP73]], i64 [[IDXPROM82]] 26299 // CHECK14-NEXT: [[TMP75:%.*]] = load i32, i32* [[ARRAYIDX83]], align 4 26300 // CHECK14-NEXT: [[ADD84:%.*]] = add nsw i32 [[TMP72]], [[TMP75]] 26301 // CHECK14-NEXT: [[TMP76:%.*]] = load i32*, i32** [[A]], align 8 26302 // CHECK14-NEXT: [[TMP77:%.*]] = load i32, i32* [[I76]], align 4 26303 // CHECK14-NEXT: [[IDXPROM85:%.*]] = sext i32 [[TMP77]] to i64 26304 // CHECK14-NEXT: [[ARRAYIDX86:%.*]] = getelementptr inbounds i32, i32* [[TMP76]], i64 [[IDXPROM85]] 26305 // CHECK14-NEXT: store i32 [[ADD84]], i32* [[ARRAYIDX86]], align 4 26306 // CHECK14-NEXT: br label [[FOR_INC87:%.*]] 26307 // CHECK14: for.inc87: 26308 // CHECK14-NEXT: [[TMP78:%.*]] = load i32, i32* [[I76]], align 4 26309 // CHECK14-NEXT: [[INC88:%.*]] = add nsw i32 [[TMP78]], 1 26310 // CHECK14-NEXT: store i32 [[INC88]], i32* [[I76]], align 4 26311 // CHECK14-NEXT: br label [[FOR_COND77]], !llvm.loop [[LOOP16:![0-9]+]] 26312 // CHECK14: for.end89: 26313 // CHECK14-NEXT: ret i32 0 26314 // 26315 // 26316 // CHECK15-LABEL: define {{[^@]+}}@main 26317 // CHECK15-SAME: () #[[ATTR0:[0-9]+]] { 26318 // CHECK15-NEXT: entry: 26319 // CHECK15-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 26320 // CHECK15-NEXT: [[A:%.*]] = alloca double*, align 4 26321 // CHECK15-NEXT: [[B:%.*]] = alloca double*, align 4 26322 // CHECK15-NEXT: [[C:%.*]] = alloca double*, align 4 26323 // CHECK15-NEXT: [[N:%.*]] = alloca i32, align 4 26324 // CHECK15-NEXT: [[CH:%.*]] = alloca i32, align 4 26325 // CHECK15-NEXT: [[I:%.*]] = alloca i32, align 4 26326 // CHECK15-NEXT: [[I3:%.*]] = alloca i32, align 4 26327 // CHECK15-NEXT: [[I14:%.*]] = alloca i32, align 4 26328 // CHECK15-NEXT: [[I25:%.*]] = alloca i32, align 4 26329 // CHECK15-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 26330 // CHECK15-NEXT: [[I36:%.*]] = alloca i32, align 4 26331 // CHECK15-NEXT: [[I47:%.*]] = alloca i32, align 4 26332 // CHECK15-NEXT: [[DOTCAPTURE_EXPR_58:%.*]] = alloca i32, align 4 26333 // CHECK15-NEXT: [[I59:%.*]] = alloca i32, align 4 26334 // CHECK15-NEXT: store i32 0, i32* [[RETVAL]], align 4 26335 // CHECK15-NEXT: store i32 10000, i32* [[N]], align 4 26336 // CHECK15-NEXT: store i32 100, i32* [[CH]], align 4 26337 // CHECK15-NEXT: store i32 0, i32* [[I]], align 4 26338 // CHECK15-NEXT: br label [[FOR_COND:%.*]] 26339 // CHECK15: for.cond: 26340 // CHECK15-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 26341 // CHECK15-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 26342 // CHECK15-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 26343 // CHECK15-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 26344 // CHECK15: for.body: 26345 // CHECK15-NEXT: [[TMP2:%.*]] = load double*, double** [[B]], align 4 26346 // CHECK15-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 26347 // CHECK15-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP2]], i32 [[TMP3]] 26348 // CHECK15-NEXT: [[TMP4:%.*]] = load double, double* [[ARRAYIDX]], align 4 26349 // CHECK15-NEXT: [[TMP5:%.*]] = load double*, double** [[C]], align 4 26350 // CHECK15-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 26351 // CHECK15-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds double, double* [[TMP5]], i32 [[TMP6]] 26352 // CHECK15-NEXT: [[TMP7:%.*]] = load double, double* [[ARRAYIDX1]], align 4 26353 // CHECK15-NEXT: [[ADD:%.*]] = fadd double [[TMP4]], [[TMP7]] 26354 // CHECK15-NEXT: [[TMP8:%.*]] = load double*, double** [[A]], align 4 26355 // CHECK15-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 26356 // CHECK15-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds double, double* [[TMP8]], i32 [[TMP9]] 26357 // CHECK15-NEXT: store double [[ADD]], double* [[ARRAYIDX2]], align 4 26358 // CHECK15-NEXT: br label [[FOR_INC:%.*]] 26359 // CHECK15: for.inc: 26360 // CHECK15-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 26361 // CHECK15-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 26362 // CHECK15-NEXT: store i32 [[INC]], i32* [[I]], align 4 26363 // CHECK15-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP3:![0-9]+]] 26364 // CHECK15: for.end: 26365 // CHECK15-NEXT: store i32 0, i32* [[I3]], align 4 26366 // CHECK15-NEXT: br label [[FOR_COND4:%.*]] 26367 // CHECK15: for.cond4: 26368 // CHECK15-NEXT: [[TMP11:%.*]] = load i32, i32* [[I3]], align 4 26369 // CHECK15-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 26370 // CHECK15-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 26371 // CHECK15-NEXT: br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END13:%.*]] 26372 // CHECK15: for.body6: 26373 // CHECK15-NEXT: [[TMP13:%.*]] = load double*, double** [[B]], align 4 26374 // CHECK15-NEXT: [[TMP14:%.*]] = load i32, i32* [[I3]], align 4 26375 // CHECK15-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP13]], i32 [[TMP14]] 26376 // CHECK15-NEXT: [[TMP15:%.*]] = load double, double* [[ARRAYIDX7]], align 4 26377 // CHECK15-NEXT: [[TMP16:%.*]] = load double*, double** [[C]], align 4 26378 // CHECK15-NEXT: [[TMP17:%.*]] = load i32, i32* [[I3]], align 4 26379 // CHECK15-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP16]], i32 [[TMP17]] 26380 // CHECK15-NEXT: [[TMP18:%.*]] = load double, double* [[ARRAYIDX8]], align 4 26381 // CHECK15-NEXT: [[ADD9:%.*]] = fadd double [[TMP15]], [[TMP18]] 26382 // CHECK15-NEXT: [[TMP19:%.*]] = load double*, double** [[A]], align 4 26383 // CHECK15-NEXT: [[TMP20:%.*]] = load i32, i32* [[I3]], align 4 26384 // CHECK15-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP19]], i32 [[TMP20]] 26385 // CHECK15-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 26386 // CHECK15-NEXT: br label [[FOR_INC11:%.*]] 26387 // CHECK15: for.inc11: 26388 // CHECK15-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 26389 // CHECK15-NEXT: [[INC12:%.*]] = add nsw i32 [[TMP21]], 1 26390 // CHECK15-NEXT: store i32 [[INC12]], i32* [[I3]], align 4 26391 // CHECK15-NEXT: br label [[FOR_COND4]], !llvm.loop [[LOOP5:![0-9]+]] 26392 // CHECK15: for.end13: 26393 // CHECK15-NEXT: store i32 0, i32* [[I14]], align 4 26394 // CHECK15-NEXT: br label [[FOR_COND15:%.*]] 26395 // CHECK15: for.cond15: 26396 // CHECK15-NEXT: [[TMP22:%.*]] = load i32, i32* [[I14]], align 4 26397 // CHECK15-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 26398 // CHECK15-NEXT: [[CMP16:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 26399 // CHECK15-NEXT: br i1 [[CMP16]], label [[FOR_BODY17:%.*]], label [[FOR_END24:%.*]] 26400 // CHECK15: for.body17: 26401 // CHECK15-NEXT: [[TMP24:%.*]] = load double*, double** [[B]], align 4 26402 // CHECK15-NEXT: [[TMP25:%.*]] = load i32, i32* [[I14]], align 4 26403 // CHECK15-NEXT: [[ARRAYIDX18:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 26404 // CHECK15-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX18]], align 4 26405 // CHECK15-NEXT: [[TMP27:%.*]] = load double*, double** [[C]], align 4 26406 // CHECK15-NEXT: [[TMP28:%.*]] = load i32, i32* [[I14]], align 4 26407 // CHECK15-NEXT: [[ARRAYIDX19:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 26408 // CHECK15-NEXT: [[TMP29:%.*]] = load double, double* [[ARRAYIDX19]], align 4 26409 // CHECK15-NEXT: [[ADD20:%.*]] = fadd double [[TMP26]], [[TMP29]] 26410 // CHECK15-NEXT: [[TMP30:%.*]] = load double*, double** [[A]], align 4 26411 // CHECK15-NEXT: [[TMP31:%.*]] = load i32, i32* [[I14]], align 4 26412 // CHECK15-NEXT: [[ARRAYIDX21:%.*]] = getelementptr inbounds double, double* [[TMP30]], i32 [[TMP31]] 26413 // CHECK15-NEXT: store double [[ADD20]], double* [[ARRAYIDX21]], align 4 26414 // CHECK15-NEXT: br label [[FOR_INC22:%.*]] 26415 // CHECK15: for.inc22: 26416 // CHECK15-NEXT: [[TMP32:%.*]] = load i32, i32* [[I14]], align 4 26417 // CHECK15-NEXT: [[INC23:%.*]] = add nsw i32 [[TMP32]], 1 26418 // CHECK15-NEXT: store i32 [[INC23]], i32* [[I14]], align 4 26419 // CHECK15-NEXT: br label [[FOR_COND15]], !llvm.loop [[LOOP6:![0-9]+]] 26420 // CHECK15: for.end24: 26421 // CHECK15-NEXT: store i32 0, i32* [[I25]], align 4 26422 // CHECK15-NEXT: br label [[FOR_COND26:%.*]] 26423 // CHECK15: for.cond26: 26424 // CHECK15-NEXT: [[TMP33:%.*]] = load i32, i32* [[I25]], align 4 26425 // CHECK15-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 26426 // CHECK15-NEXT: [[CMP27:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 26427 // CHECK15-NEXT: br i1 [[CMP27]], label [[FOR_BODY28:%.*]], label [[FOR_END35:%.*]] 26428 // CHECK15: for.body28: 26429 // CHECK15-NEXT: [[TMP35:%.*]] = load double*, double** [[B]], align 4 26430 // CHECK15-NEXT: [[TMP36:%.*]] = load i32, i32* [[I25]], align 4 26431 // CHECK15-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds double, double* [[TMP35]], i32 [[TMP36]] 26432 // CHECK15-NEXT: [[TMP37:%.*]] = load double, double* [[ARRAYIDX29]], align 4 26433 // CHECK15-NEXT: [[TMP38:%.*]] = load double*, double** [[C]], align 4 26434 // CHECK15-NEXT: [[TMP39:%.*]] = load i32, i32* [[I25]], align 4 26435 // CHECK15-NEXT: [[ARRAYIDX30:%.*]] = getelementptr inbounds double, double* [[TMP38]], i32 [[TMP39]] 26436 // CHECK15-NEXT: [[TMP40:%.*]] = load double, double* [[ARRAYIDX30]], align 4 26437 // CHECK15-NEXT: [[ADD31:%.*]] = fadd double [[TMP37]], [[TMP40]] 26438 // CHECK15-NEXT: [[TMP41:%.*]] = load double*, double** [[A]], align 4 26439 // CHECK15-NEXT: [[TMP42:%.*]] = load i32, i32* [[I25]], align 4 26440 // CHECK15-NEXT: [[ARRAYIDX32:%.*]] = getelementptr inbounds double, double* [[TMP41]], i32 [[TMP42]] 26441 // CHECK15-NEXT: store double [[ADD31]], double* [[ARRAYIDX32]], align 4 26442 // CHECK15-NEXT: br label [[FOR_INC33:%.*]] 26443 // CHECK15: for.inc33: 26444 // CHECK15-NEXT: [[TMP43:%.*]] = load i32, i32* [[I25]], align 4 26445 // CHECK15-NEXT: [[INC34:%.*]] = add nsw i32 [[TMP43]], 1 26446 // CHECK15-NEXT: store i32 [[INC34]], i32* [[I25]], align 4 26447 // CHECK15-NEXT: br label [[FOR_COND26]], !llvm.loop [[LOOP7:![0-9]+]] 26448 // CHECK15: for.end35: 26449 // CHECK15-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 26450 // CHECK15-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 26451 // CHECK15-NEXT: store i32 0, i32* [[I36]], align 4 26452 // CHECK15-NEXT: br label [[FOR_COND37:%.*]] 26453 // CHECK15: for.cond37: 26454 // CHECK15-NEXT: [[TMP45:%.*]] = load i32, i32* [[I36]], align 4 26455 // CHECK15-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 26456 // CHECK15-NEXT: [[CMP38:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 26457 // CHECK15-NEXT: br i1 [[CMP38]], label [[FOR_BODY39:%.*]], label [[FOR_END46:%.*]] 26458 // CHECK15: for.body39: 26459 // CHECK15-NEXT: [[TMP47:%.*]] = load double*, double** [[B]], align 4 26460 // CHECK15-NEXT: [[TMP48:%.*]] = load i32, i32* [[I36]], align 4 26461 // CHECK15-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds double, double* [[TMP47]], i32 [[TMP48]] 26462 // CHECK15-NEXT: [[TMP49:%.*]] = load double, double* [[ARRAYIDX40]], align 4 26463 // CHECK15-NEXT: [[TMP50:%.*]] = load double*, double** [[C]], align 4 26464 // CHECK15-NEXT: [[TMP51:%.*]] = load i32, i32* [[I36]], align 4 26465 // CHECK15-NEXT: [[ARRAYIDX41:%.*]] = getelementptr inbounds double, double* [[TMP50]], i32 [[TMP51]] 26466 // CHECK15-NEXT: [[TMP52:%.*]] = load double, double* [[ARRAYIDX41]], align 4 26467 // CHECK15-NEXT: [[ADD42:%.*]] = fadd double [[TMP49]], [[TMP52]] 26468 // CHECK15-NEXT: [[TMP53:%.*]] = load double*, double** [[A]], align 4 26469 // CHECK15-NEXT: [[TMP54:%.*]] = load i32, i32* [[I36]], align 4 26470 // CHECK15-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds double, double* [[TMP53]], i32 [[TMP54]] 26471 // CHECK15-NEXT: store double [[ADD42]], double* [[ARRAYIDX43]], align 4 26472 // CHECK15-NEXT: br label [[FOR_INC44:%.*]] 26473 // CHECK15: for.inc44: 26474 // CHECK15-NEXT: [[TMP55:%.*]] = load i32, i32* [[I36]], align 4 26475 // CHECK15-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP55]], 1 26476 // CHECK15-NEXT: store i32 [[INC45]], i32* [[I36]], align 4 26477 // CHECK15-NEXT: br label [[FOR_COND37]], !llvm.loop [[LOOP8:![0-9]+]] 26478 // CHECK15: for.end46: 26479 // CHECK15-NEXT: store i32 0, i32* [[I47]], align 4 26480 // CHECK15-NEXT: br label [[FOR_COND48:%.*]] 26481 // CHECK15: for.cond48: 26482 // CHECK15-NEXT: [[TMP56:%.*]] = load i32, i32* [[I47]], align 4 26483 // CHECK15-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 26484 // CHECK15-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 26485 // CHECK15-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END57:%.*]] 26486 // CHECK15: for.body50: 26487 // CHECK15-NEXT: [[TMP58:%.*]] = load double*, double** [[B]], align 4 26488 // CHECK15-NEXT: [[TMP59:%.*]] = load i32, i32* [[I47]], align 4 26489 // CHECK15-NEXT: [[ARRAYIDX51:%.*]] = getelementptr inbounds double, double* [[TMP58]], i32 [[TMP59]] 26490 // CHECK15-NEXT: [[TMP60:%.*]] = load double, double* [[ARRAYIDX51]], align 4 26491 // CHECK15-NEXT: [[TMP61:%.*]] = load double*, double** [[C]], align 4 26492 // CHECK15-NEXT: [[TMP62:%.*]] = load i32, i32* [[I47]], align 4 26493 // CHECK15-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds double, double* [[TMP61]], i32 [[TMP62]] 26494 // CHECK15-NEXT: [[TMP63:%.*]] = load double, double* [[ARRAYIDX52]], align 4 26495 // CHECK15-NEXT: [[ADD53:%.*]] = fadd double [[TMP60]], [[TMP63]] 26496 // CHECK15-NEXT: [[TMP64:%.*]] = load double*, double** [[A]], align 4 26497 // CHECK15-NEXT: [[TMP65:%.*]] = load i32, i32* [[I47]], align 4 26498 // CHECK15-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds double, double* [[TMP64]], i32 [[TMP65]] 26499 // CHECK15-NEXT: store double [[ADD53]], double* [[ARRAYIDX54]], align 4 26500 // CHECK15-NEXT: br label [[FOR_INC55:%.*]] 26501 // CHECK15: for.inc55: 26502 // CHECK15-NEXT: [[TMP66:%.*]] = load i32, i32* [[I47]], align 4 26503 // CHECK15-NEXT: [[INC56:%.*]] = add nsw i32 [[TMP66]], 1 26504 // CHECK15-NEXT: store i32 [[INC56]], i32* [[I47]], align 4 26505 // CHECK15-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP9:![0-9]+]] 26506 // CHECK15: for.end57: 26507 // CHECK15-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 26508 // CHECK15-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_58]], align 4 26509 // CHECK15-NEXT: store i32 0, i32* [[I59]], align 4 26510 // CHECK15-NEXT: br label [[FOR_COND60:%.*]] 26511 // CHECK15: for.cond60: 26512 // CHECK15-NEXT: [[TMP68:%.*]] = load i32, i32* [[I59]], align 4 26513 // CHECK15-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 26514 // CHECK15-NEXT: [[CMP61:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 26515 // CHECK15-NEXT: br i1 [[CMP61]], label [[FOR_BODY62:%.*]], label [[FOR_END69:%.*]] 26516 // CHECK15: for.body62: 26517 // CHECK15-NEXT: [[TMP70:%.*]] = load double*, double** [[B]], align 4 26518 // CHECK15-NEXT: [[TMP71:%.*]] = load i32, i32* [[I59]], align 4 26519 // CHECK15-NEXT: [[ARRAYIDX63:%.*]] = getelementptr inbounds double, double* [[TMP70]], i32 [[TMP71]] 26520 // CHECK15-NEXT: [[TMP72:%.*]] = load double, double* [[ARRAYIDX63]], align 4 26521 // CHECK15-NEXT: [[TMP73:%.*]] = load double*, double** [[C]], align 4 26522 // CHECK15-NEXT: [[TMP74:%.*]] = load i32, i32* [[I59]], align 4 26523 // CHECK15-NEXT: [[ARRAYIDX64:%.*]] = getelementptr inbounds double, double* [[TMP73]], i32 [[TMP74]] 26524 // CHECK15-NEXT: [[TMP75:%.*]] = load double, double* [[ARRAYIDX64]], align 4 26525 // CHECK15-NEXT: [[ADD65:%.*]] = fadd double [[TMP72]], [[TMP75]] 26526 // CHECK15-NEXT: [[TMP76:%.*]] = load double*, double** [[A]], align 4 26527 // CHECK15-NEXT: [[TMP77:%.*]] = load i32, i32* [[I59]], align 4 26528 // CHECK15-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds double, double* [[TMP76]], i32 [[TMP77]] 26529 // CHECK15-NEXT: store double [[ADD65]], double* [[ARRAYIDX66]], align 4 26530 // CHECK15-NEXT: br label [[FOR_INC67:%.*]] 26531 // CHECK15: for.inc67: 26532 // CHECK15-NEXT: [[TMP78:%.*]] = load i32, i32* [[I59]], align 4 26533 // CHECK15-NEXT: [[INC68:%.*]] = add nsw i32 [[TMP78]], 1 26534 // CHECK15-NEXT: store i32 [[INC68]], i32* [[I59]], align 4 26535 // CHECK15-NEXT: br label [[FOR_COND60]], !llvm.loop [[LOOP10:![0-9]+]] 26536 // CHECK15: for.end69: 26537 // CHECK15-NEXT: [[CALL:%.*]] = call i32 @_Z5tmainIiET_v() 26538 // CHECK15-NEXT: ret i32 [[CALL]] 26539 // 26540 // 26541 // CHECK15-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 26542 // CHECK15-SAME: () #[[ATTR1:[0-9]+]] comdat { 26543 // CHECK15-NEXT: entry: 26544 // CHECK15-NEXT: [[A:%.*]] = alloca i32*, align 4 26545 // CHECK15-NEXT: [[B:%.*]] = alloca i32*, align 4 26546 // CHECK15-NEXT: [[C:%.*]] = alloca i32*, align 4 26547 // CHECK15-NEXT: [[N:%.*]] = alloca i32, align 4 26548 // CHECK15-NEXT: [[CH:%.*]] = alloca i32, align 4 26549 // CHECK15-NEXT: [[I:%.*]] = alloca i32, align 4 26550 // CHECK15-NEXT: [[I3:%.*]] = alloca i32, align 4 26551 // CHECK15-NEXT: [[I14:%.*]] = alloca i32, align 4 26552 // CHECK15-NEXT: [[I25:%.*]] = alloca i32, align 4 26553 // CHECK15-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 26554 // CHECK15-NEXT: [[I36:%.*]] = alloca i32, align 4 26555 // CHECK15-NEXT: [[I47:%.*]] = alloca i32, align 4 26556 // CHECK15-NEXT: [[DOTCAPTURE_EXPR_58:%.*]] = alloca i32, align 4 26557 // CHECK15-NEXT: [[I59:%.*]] = alloca i32, align 4 26558 // CHECK15-NEXT: store i32 10000, i32* [[N]], align 4 26559 // CHECK15-NEXT: store i32 100, i32* [[CH]], align 4 26560 // CHECK15-NEXT: store i32 0, i32* [[I]], align 4 26561 // CHECK15-NEXT: br label [[FOR_COND:%.*]] 26562 // CHECK15: for.cond: 26563 // CHECK15-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 26564 // CHECK15-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 26565 // CHECK15-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 26566 // CHECK15-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 26567 // CHECK15: for.body: 26568 // CHECK15-NEXT: [[TMP2:%.*]] = load i32*, i32** [[B]], align 4 26569 // CHECK15-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 26570 // CHECK15-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP2]], i32 [[TMP3]] 26571 // CHECK15-NEXT: [[TMP4:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 26572 // CHECK15-NEXT: [[TMP5:%.*]] = load i32*, i32** [[C]], align 4 26573 // CHECK15-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 26574 // CHECK15-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[TMP5]], i32 [[TMP6]] 26575 // CHECK15-NEXT: [[TMP7:%.*]] = load i32, i32* [[ARRAYIDX1]], align 4 26576 // CHECK15-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP4]], [[TMP7]] 26577 // CHECK15-NEXT: [[TMP8:%.*]] = load i32*, i32** [[A]], align 4 26578 // CHECK15-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 26579 // CHECK15-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, i32* [[TMP8]], i32 [[TMP9]] 26580 // CHECK15-NEXT: store i32 [[ADD]], i32* [[ARRAYIDX2]], align 4 26581 // CHECK15-NEXT: br label [[FOR_INC:%.*]] 26582 // CHECK15: for.inc: 26583 // CHECK15-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 26584 // CHECK15-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 26585 // CHECK15-NEXT: store i32 [[INC]], i32* [[I]], align 4 26586 // CHECK15-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP11:![0-9]+]] 26587 // CHECK15: for.end: 26588 // CHECK15-NEXT: store i32 0, i32* [[I3]], align 4 26589 // CHECK15-NEXT: br label [[FOR_COND4:%.*]] 26590 // CHECK15: for.cond4: 26591 // CHECK15-NEXT: [[TMP11:%.*]] = load i32, i32* [[I3]], align 4 26592 // CHECK15-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 26593 // CHECK15-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 26594 // CHECK15-NEXT: br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END13:%.*]] 26595 // CHECK15: for.body6: 26596 // CHECK15-NEXT: [[TMP13:%.*]] = load i32*, i32** [[B]], align 4 26597 // CHECK15-NEXT: [[TMP14:%.*]] = load i32, i32* [[I3]], align 4 26598 // CHECK15-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP13]], i32 [[TMP14]] 26599 // CHECK15-NEXT: [[TMP15:%.*]] = load i32, i32* [[ARRAYIDX7]], align 4 26600 // CHECK15-NEXT: [[TMP16:%.*]] = load i32*, i32** [[C]], align 4 26601 // CHECK15-NEXT: [[TMP17:%.*]] = load i32, i32* [[I3]], align 4 26602 // CHECK15-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP16]], i32 [[TMP17]] 26603 // CHECK15-NEXT: [[TMP18:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 26604 // CHECK15-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP15]], [[TMP18]] 26605 // CHECK15-NEXT: [[TMP19:%.*]] = load i32*, i32** [[A]], align 4 26606 // CHECK15-NEXT: [[TMP20:%.*]] = load i32, i32* [[I3]], align 4 26607 // CHECK15-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP19]], i32 [[TMP20]] 26608 // CHECK15-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX10]], align 4 26609 // CHECK15-NEXT: br label [[FOR_INC11:%.*]] 26610 // CHECK15: for.inc11: 26611 // CHECK15-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 26612 // CHECK15-NEXT: [[INC12:%.*]] = add nsw i32 [[TMP21]], 1 26613 // CHECK15-NEXT: store i32 [[INC12]], i32* [[I3]], align 4 26614 // CHECK15-NEXT: br label [[FOR_COND4]], !llvm.loop [[LOOP12:![0-9]+]] 26615 // CHECK15: for.end13: 26616 // CHECK15-NEXT: store i32 0, i32* [[I14]], align 4 26617 // CHECK15-NEXT: br label [[FOR_COND15:%.*]] 26618 // CHECK15: for.cond15: 26619 // CHECK15-NEXT: [[TMP22:%.*]] = load i32, i32* [[I14]], align 4 26620 // CHECK15-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 26621 // CHECK15-NEXT: [[CMP16:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 26622 // CHECK15-NEXT: br i1 [[CMP16]], label [[FOR_BODY17:%.*]], label [[FOR_END24:%.*]] 26623 // CHECK15: for.body17: 26624 // CHECK15-NEXT: [[TMP24:%.*]] = load i32*, i32** [[B]], align 4 26625 // CHECK15-NEXT: [[TMP25:%.*]] = load i32, i32* [[I14]], align 4 26626 // CHECK15-NEXT: [[ARRAYIDX18:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 26627 // CHECK15-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX18]], align 4 26628 // CHECK15-NEXT: [[TMP27:%.*]] = load i32*, i32** [[C]], align 4 26629 // CHECK15-NEXT: [[TMP28:%.*]] = load i32, i32* [[I14]], align 4 26630 // CHECK15-NEXT: [[ARRAYIDX19:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 26631 // CHECK15-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX19]], align 4 26632 // CHECK15-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 26633 // CHECK15-NEXT: [[TMP30:%.*]] = load i32*, i32** [[A]], align 4 26634 // CHECK15-NEXT: [[TMP31:%.*]] = load i32, i32* [[I14]], align 4 26635 // CHECK15-NEXT: [[ARRAYIDX21:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i32 [[TMP31]] 26636 // CHECK15-NEXT: store i32 [[ADD20]], i32* [[ARRAYIDX21]], align 4 26637 // CHECK15-NEXT: br label [[FOR_INC22:%.*]] 26638 // CHECK15: for.inc22: 26639 // CHECK15-NEXT: [[TMP32:%.*]] = load i32, i32* [[I14]], align 4 26640 // CHECK15-NEXT: [[INC23:%.*]] = add nsw i32 [[TMP32]], 1 26641 // CHECK15-NEXT: store i32 [[INC23]], i32* [[I14]], align 4 26642 // CHECK15-NEXT: br label [[FOR_COND15]], !llvm.loop [[LOOP13:![0-9]+]] 26643 // CHECK15: for.end24: 26644 // CHECK15-NEXT: store i32 0, i32* [[I25]], align 4 26645 // CHECK15-NEXT: br label [[FOR_COND26:%.*]] 26646 // CHECK15: for.cond26: 26647 // CHECK15-NEXT: [[TMP33:%.*]] = load i32, i32* [[I25]], align 4 26648 // CHECK15-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 26649 // CHECK15-NEXT: [[CMP27:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 26650 // CHECK15-NEXT: br i1 [[CMP27]], label [[FOR_BODY28:%.*]], label [[FOR_END35:%.*]] 26651 // CHECK15: for.body28: 26652 // CHECK15-NEXT: [[TMP35:%.*]] = load i32*, i32** [[B]], align 4 26653 // CHECK15-NEXT: [[TMP36:%.*]] = load i32, i32* [[I25]], align 4 26654 // CHECK15-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds i32, i32* [[TMP35]], i32 [[TMP36]] 26655 // CHECK15-NEXT: [[TMP37:%.*]] = load i32, i32* [[ARRAYIDX29]], align 4 26656 // CHECK15-NEXT: [[TMP38:%.*]] = load i32*, i32** [[C]], align 4 26657 // CHECK15-NEXT: [[TMP39:%.*]] = load i32, i32* [[I25]], align 4 26658 // CHECK15-NEXT: [[ARRAYIDX30:%.*]] = getelementptr inbounds i32, i32* [[TMP38]], i32 [[TMP39]] 26659 // CHECK15-NEXT: [[TMP40:%.*]] = load i32, i32* [[ARRAYIDX30]], align 4 26660 // CHECK15-NEXT: [[ADD31:%.*]] = add nsw i32 [[TMP37]], [[TMP40]] 26661 // CHECK15-NEXT: [[TMP41:%.*]] = load i32*, i32** [[A]], align 4 26662 // CHECK15-NEXT: [[TMP42:%.*]] = load i32, i32* [[I25]], align 4 26663 // CHECK15-NEXT: [[ARRAYIDX32:%.*]] = getelementptr inbounds i32, i32* [[TMP41]], i32 [[TMP42]] 26664 // CHECK15-NEXT: store i32 [[ADD31]], i32* [[ARRAYIDX32]], align 4 26665 // CHECK15-NEXT: br label [[FOR_INC33:%.*]] 26666 // CHECK15: for.inc33: 26667 // CHECK15-NEXT: [[TMP43:%.*]] = load i32, i32* [[I25]], align 4 26668 // CHECK15-NEXT: [[INC34:%.*]] = add nsw i32 [[TMP43]], 1 26669 // CHECK15-NEXT: store i32 [[INC34]], i32* [[I25]], align 4 26670 // CHECK15-NEXT: br label [[FOR_COND26]], !llvm.loop [[LOOP14:![0-9]+]] 26671 // CHECK15: for.end35: 26672 // CHECK15-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 26673 // CHECK15-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 26674 // CHECK15-NEXT: store i32 0, i32* [[I36]], align 4 26675 // CHECK15-NEXT: br label [[FOR_COND37:%.*]] 26676 // CHECK15: for.cond37: 26677 // CHECK15-NEXT: [[TMP45:%.*]] = load i32, i32* [[I36]], align 4 26678 // CHECK15-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 26679 // CHECK15-NEXT: [[CMP38:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 26680 // CHECK15-NEXT: br i1 [[CMP38]], label [[FOR_BODY39:%.*]], label [[FOR_END46:%.*]] 26681 // CHECK15: for.body39: 26682 // CHECK15-NEXT: [[TMP47:%.*]] = load i32*, i32** [[B]], align 4 26683 // CHECK15-NEXT: [[TMP48:%.*]] = load i32, i32* [[I36]], align 4 26684 // CHECK15-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds i32, i32* [[TMP47]], i32 [[TMP48]] 26685 // CHECK15-NEXT: [[TMP49:%.*]] = load i32, i32* [[ARRAYIDX40]], align 4 26686 // CHECK15-NEXT: [[TMP50:%.*]] = load i32*, i32** [[C]], align 4 26687 // CHECK15-NEXT: [[TMP51:%.*]] = load i32, i32* [[I36]], align 4 26688 // CHECK15-NEXT: [[ARRAYIDX41:%.*]] = getelementptr inbounds i32, i32* [[TMP50]], i32 [[TMP51]] 26689 // CHECK15-NEXT: [[TMP52:%.*]] = load i32, i32* [[ARRAYIDX41]], align 4 26690 // CHECK15-NEXT: [[ADD42:%.*]] = add nsw i32 [[TMP49]], [[TMP52]] 26691 // CHECK15-NEXT: [[TMP53:%.*]] = load i32*, i32** [[A]], align 4 26692 // CHECK15-NEXT: [[TMP54:%.*]] = load i32, i32* [[I36]], align 4 26693 // CHECK15-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds i32, i32* [[TMP53]], i32 [[TMP54]] 26694 // CHECK15-NEXT: store i32 [[ADD42]], i32* [[ARRAYIDX43]], align 4 26695 // CHECK15-NEXT: br label [[FOR_INC44:%.*]] 26696 // CHECK15: for.inc44: 26697 // CHECK15-NEXT: [[TMP55:%.*]] = load i32, i32* [[I36]], align 4 26698 // CHECK15-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP55]], 1 26699 // CHECK15-NEXT: store i32 [[INC45]], i32* [[I36]], align 4 26700 // CHECK15-NEXT: br label [[FOR_COND37]], !llvm.loop [[LOOP15:![0-9]+]] 26701 // CHECK15: for.end46: 26702 // CHECK15-NEXT: store i32 0, i32* [[I47]], align 4 26703 // CHECK15-NEXT: br label [[FOR_COND48:%.*]] 26704 // CHECK15: for.cond48: 26705 // CHECK15-NEXT: [[TMP56:%.*]] = load i32, i32* [[I47]], align 4 26706 // CHECK15-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 26707 // CHECK15-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 26708 // CHECK15-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END57:%.*]] 26709 // CHECK15: for.body50: 26710 // CHECK15-NEXT: [[TMP58:%.*]] = load i32*, i32** [[B]], align 4 26711 // CHECK15-NEXT: [[TMP59:%.*]] = load i32, i32* [[I47]], align 4 26712 // CHECK15-NEXT: [[ARRAYIDX51:%.*]] = getelementptr inbounds i32, i32* [[TMP58]], i32 [[TMP59]] 26713 // CHECK15-NEXT: [[TMP60:%.*]] = load i32, i32* [[ARRAYIDX51]], align 4 26714 // CHECK15-NEXT: [[TMP61:%.*]] = load i32*, i32** [[C]], align 4 26715 // CHECK15-NEXT: [[TMP62:%.*]] = load i32, i32* [[I47]], align 4 26716 // CHECK15-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds i32, i32* [[TMP61]], i32 [[TMP62]] 26717 // CHECK15-NEXT: [[TMP63:%.*]] = load i32, i32* [[ARRAYIDX52]], align 4 26718 // CHECK15-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP60]], [[TMP63]] 26719 // CHECK15-NEXT: [[TMP64:%.*]] = load i32*, i32** [[A]], align 4 26720 // CHECK15-NEXT: [[TMP65:%.*]] = load i32, i32* [[I47]], align 4 26721 // CHECK15-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds i32, i32* [[TMP64]], i32 [[TMP65]] 26722 // CHECK15-NEXT: store i32 [[ADD53]], i32* [[ARRAYIDX54]], align 4 26723 // CHECK15-NEXT: br label [[FOR_INC55:%.*]] 26724 // CHECK15: for.inc55: 26725 // CHECK15-NEXT: [[TMP66:%.*]] = load i32, i32* [[I47]], align 4 26726 // CHECK15-NEXT: [[INC56:%.*]] = add nsw i32 [[TMP66]], 1 26727 // CHECK15-NEXT: store i32 [[INC56]], i32* [[I47]], align 4 26728 // CHECK15-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP16:![0-9]+]] 26729 // CHECK15: for.end57: 26730 // CHECK15-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 26731 // CHECK15-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_58]], align 4 26732 // CHECK15-NEXT: store i32 0, i32* [[I59]], align 4 26733 // CHECK15-NEXT: br label [[FOR_COND60:%.*]] 26734 // CHECK15: for.cond60: 26735 // CHECK15-NEXT: [[TMP68:%.*]] = load i32, i32* [[I59]], align 4 26736 // CHECK15-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 26737 // CHECK15-NEXT: [[CMP61:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 26738 // CHECK15-NEXT: br i1 [[CMP61]], label [[FOR_BODY62:%.*]], label [[FOR_END69:%.*]] 26739 // CHECK15: for.body62: 26740 // CHECK15-NEXT: [[TMP70:%.*]] = load i32*, i32** [[B]], align 4 26741 // CHECK15-NEXT: [[TMP71:%.*]] = load i32, i32* [[I59]], align 4 26742 // CHECK15-NEXT: [[ARRAYIDX63:%.*]] = getelementptr inbounds i32, i32* [[TMP70]], i32 [[TMP71]] 26743 // CHECK15-NEXT: [[TMP72:%.*]] = load i32, i32* [[ARRAYIDX63]], align 4 26744 // CHECK15-NEXT: [[TMP73:%.*]] = load i32*, i32** [[C]], align 4 26745 // CHECK15-NEXT: [[TMP74:%.*]] = load i32, i32* [[I59]], align 4 26746 // CHECK15-NEXT: [[ARRAYIDX64:%.*]] = getelementptr inbounds i32, i32* [[TMP73]], i32 [[TMP74]] 26747 // CHECK15-NEXT: [[TMP75:%.*]] = load i32, i32* [[ARRAYIDX64]], align 4 26748 // CHECK15-NEXT: [[ADD65:%.*]] = add nsw i32 [[TMP72]], [[TMP75]] 26749 // CHECK15-NEXT: [[TMP76:%.*]] = load i32*, i32** [[A]], align 4 26750 // CHECK15-NEXT: [[TMP77:%.*]] = load i32, i32* [[I59]], align 4 26751 // CHECK15-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds i32, i32* [[TMP76]], i32 [[TMP77]] 26752 // CHECK15-NEXT: store i32 [[ADD65]], i32* [[ARRAYIDX66]], align 4 26753 // CHECK15-NEXT: br label [[FOR_INC67:%.*]] 26754 // CHECK15: for.inc67: 26755 // CHECK15-NEXT: [[TMP78:%.*]] = load i32, i32* [[I59]], align 4 26756 // CHECK15-NEXT: [[INC68:%.*]] = add nsw i32 [[TMP78]], 1 26757 // CHECK15-NEXT: store i32 [[INC68]], i32* [[I59]], align 4 26758 // CHECK15-NEXT: br label [[FOR_COND60]], !llvm.loop [[LOOP17:![0-9]+]] 26759 // CHECK15: for.end69: 26760 // CHECK15-NEXT: ret i32 0 26761 // 26762 // 26763 // CHECK16-LABEL: define {{[^@]+}}@main 26764 // CHECK16-SAME: () #[[ATTR0:[0-9]+]] { 26765 // CHECK16-NEXT: entry: 26766 // CHECK16-NEXT: [[RETVAL:%.*]] = alloca i32, align 4 26767 // CHECK16-NEXT: [[A:%.*]] = alloca double*, align 4 26768 // CHECK16-NEXT: [[B:%.*]] = alloca double*, align 4 26769 // CHECK16-NEXT: [[C:%.*]] = alloca double*, align 4 26770 // CHECK16-NEXT: [[N:%.*]] = alloca i32, align 4 26771 // CHECK16-NEXT: [[CH:%.*]] = alloca i32, align 4 26772 // CHECK16-NEXT: [[I:%.*]] = alloca i32, align 4 26773 // CHECK16-NEXT: [[I3:%.*]] = alloca i32, align 4 26774 // CHECK16-NEXT: [[I14:%.*]] = alloca i32, align 4 26775 // CHECK16-NEXT: [[I25:%.*]] = alloca i32, align 4 26776 // CHECK16-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 26777 // CHECK16-NEXT: [[I36:%.*]] = alloca i32, align 4 26778 // CHECK16-NEXT: [[I47:%.*]] = alloca i32, align 4 26779 // CHECK16-NEXT: [[DOTCAPTURE_EXPR_58:%.*]] = alloca i32, align 4 26780 // CHECK16-NEXT: [[I59:%.*]] = alloca i32, align 4 26781 // CHECK16-NEXT: store i32 0, i32* [[RETVAL]], align 4 26782 // CHECK16-NEXT: store i32 10000, i32* [[N]], align 4 26783 // CHECK16-NEXT: store i32 100, i32* [[CH]], align 4 26784 // CHECK16-NEXT: store i32 0, i32* [[I]], align 4 26785 // CHECK16-NEXT: br label [[FOR_COND:%.*]] 26786 // CHECK16: for.cond: 26787 // CHECK16-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 26788 // CHECK16-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 26789 // CHECK16-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 26790 // CHECK16-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 26791 // CHECK16: for.body: 26792 // CHECK16-NEXT: [[TMP2:%.*]] = load double*, double** [[B]], align 4 26793 // CHECK16-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 26794 // CHECK16-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, double* [[TMP2]], i32 [[TMP3]] 26795 // CHECK16-NEXT: [[TMP4:%.*]] = load double, double* [[ARRAYIDX]], align 4 26796 // CHECK16-NEXT: [[TMP5:%.*]] = load double*, double** [[C]], align 4 26797 // CHECK16-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 26798 // CHECK16-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds double, double* [[TMP5]], i32 [[TMP6]] 26799 // CHECK16-NEXT: [[TMP7:%.*]] = load double, double* [[ARRAYIDX1]], align 4 26800 // CHECK16-NEXT: [[ADD:%.*]] = fadd double [[TMP4]], [[TMP7]] 26801 // CHECK16-NEXT: [[TMP8:%.*]] = load double*, double** [[A]], align 4 26802 // CHECK16-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 26803 // CHECK16-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds double, double* [[TMP8]], i32 [[TMP9]] 26804 // CHECK16-NEXT: store double [[ADD]], double* [[ARRAYIDX2]], align 4 26805 // CHECK16-NEXT: br label [[FOR_INC:%.*]] 26806 // CHECK16: for.inc: 26807 // CHECK16-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 26808 // CHECK16-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 26809 // CHECK16-NEXT: store i32 [[INC]], i32* [[I]], align 4 26810 // CHECK16-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP3:![0-9]+]] 26811 // CHECK16: for.end: 26812 // CHECK16-NEXT: store i32 0, i32* [[I3]], align 4 26813 // CHECK16-NEXT: br label [[FOR_COND4:%.*]] 26814 // CHECK16: for.cond4: 26815 // CHECK16-NEXT: [[TMP11:%.*]] = load i32, i32* [[I3]], align 4 26816 // CHECK16-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 26817 // CHECK16-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 26818 // CHECK16-NEXT: br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END13:%.*]] 26819 // CHECK16: for.body6: 26820 // CHECK16-NEXT: [[TMP13:%.*]] = load double*, double** [[B]], align 4 26821 // CHECK16-NEXT: [[TMP14:%.*]] = load i32, i32* [[I3]], align 4 26822 // CHECK16-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds double, double* [[TMP13]], i32 [[TMP14]] 26823 // CHECK16-NEXT: [[TMP15:%.*]] = load double, double* [[ARRAYIDX7]], align 4 26824 // CHECK16-NEXT: [[TMP16:%.*]] = load double*, double** [[C]], align 4 26825 // CHECK16-NEXT: [[TMP17:%.*]] = load i32, i32* [[I3]], align 4 26826 // CHECK16-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds double, double* [[TMP16]], i32 [[TMP17]] 26827 // CHECK16-NEXT: [[TMP18:%.*]] = load double, double* [[ARRAYIDX8]], align 4 26828 // CHECK16-NEXT: [[ADD9:%.*]] = fadd double [[TMP15]], [[TMP18]] 26829 // CHECK16-NEXT: [[TMP19:%.*]] = load double*, double** [[A]], align 4 26830 // CHECK16-NEXT: [[TMP20:%.*]] = load i32, i32* [[I3]], align 4 26831 // CHECK16-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds double, double* [[TMP19]], i32 [[TMP20]] 26832 // CHECK16-NEXT: store double [[ADD9]], double* [[ARRAYIDX10]], align 4 26833 // CHECK16-NEXT: br label [[FOR_INC11:%.*]] 26834 // CHECK16: for.inc11: 26835 // CHECK16-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 26836 // CHECK16-NEXT: [[INC12:%.*]] = add nsw i32 [[TMP21]], 1 26837 // CHECK16-NEXT: store i32 [[INC12]], i32* [[I3]], align 4 26838 // CHECK16-NEXT: br label [[FOR_COND4]], !llvm.loop [[LOOP5:![0-9]+]] 26839 // CHECK16: for.end13: 26840 // CHECK16-NEXT: store i32 0, i32* [[I14]], align 4 26841 // CHECK16-NEXT: br label [[FOR_COND15:%.*]] 26842 // CHECK16: for.cond15: 26843 // CHECK16-NEXT: [[TMP22:%.*]] = load i32, i32* [[I14]], align 4 26844 // CHECK16-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 26845 // CHECK16-NEXT: [[CMP16:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 26846 // CHECK16-NEXT: br i1 [[CMP16]], label [[FOR_BODY17:%.*]], label [[FOR_END24:%.*]] 26847 // CHECK16: for.body17: 26848 // CHECK16-NEXT: [[TMP24:%.*]] = load double*, double** [[B]], align 4 26849 // CHECK16-NEXT: [[TMP25:%.*]] = load i32, i32* [[I14]], align 4 26850 // CHECK16-NEXT: [[ARRAYIDX18:%.*]] = getelementptr inbounds double, double* [[TMP24]], i32 [[TMP25]] 26851 // CHECK16-NEXT: [[TMP26:%.*]] = load double, double* [[ARRAYIDX18]], align 4 26852 // CHECK16-NEXT: [[TMP27:%.*]] = load double*, double** [[C]], align 4 26853 // CHECK16-NEXT: [[TMP28:%.*]] = load i32, i32* [[I14]], align 4 26854 // CHECK16-NEXT: [[ARRAYIDX19:%.*]] = getelementptr inbounds double, double* [[TMP27]], i32 [[TMP28]] 26855 // CHECK16-NEXT: [[TMP29:%.*]] = load double, double* [[ARRAYIDX19]], align 4 26856 // CHECK16-NEXT: [[ADD20:%.*]] = fadd double [[TMP26]], [[TMP29]] 26857 // CHECK16-NEXT: [[TMP30:%.*]] = load double*, double** [[A]], align 4 26858 // CHECK16-NEXT: [[TMP31:%.*]] = load i32, i32* [[I14]], align 4 26859 // CHECK16-NEXT: [[ARRAYIDX21:%.*]] = getelementptr inbounds double, double* [[TMP30]], i32 [[TMP31]] 26860 // CHECK16-NEXT: store double [[ADD20]], double* [[ARRAYIDX21]], align 4 26861 // CHECK16-NEXT: br label [[FOR_INC22:%.*]] 26862 // CHECK16: for.inc22: 26863 // CHECK16-NEXT: [[TMP32:%.*]] = load i32, i32* [[I14]], align 4 26864 // CHECK16-NEXT: [[INC23:%.*]] = add nsw i32 [[TMP32]], 1 26865 // CHECK16-NEXT: store i32 [[INC23]], i32* [[I14]], align 4 26866 // CHECK16-NEXT: br label [[FOR_COND15]], !llvm.loop [[LOOP6:![0-9]+]] 26867 // CHECK16: for.end24: 26868 // CHECK16-NEXT: store i32 0, i32* [[I25]], align 4 26869 // CHECK16-NEXT: br label [[FOR_COND26:%.*]] 26870 // CHECK16: for.cond26: 26871 // CHECK16-NEXT: [[TMP33:%.*]] = load i32, i32* [[I25]], align 4 26872 // CHECK16-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 26873 // CHECK16-NEXT: [[CMP27:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 26874 // CHECK16-NEXT: br i1 [[CMP27]], label [[FOR_BODY28:%.*]], label [[FOR_END35:%.*]] 26875 // CHECK16: for.body28: 26876 // CHECK16-NEXT: [[TMP35:%.*]] = load double*, double** [[B]], align 4 26877 // CHECK16-NEXT: [[TMP36:%.*]] = load i32, i32* [[I25]], align 4 26878 // CHECK16-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds double, double* [[TMP35]], i32 [[TMP36]] 26879 // CHECK16-NEXT: [[TMP37:%.*]] = load double, double* [[ARRAYIDX29]], align 4 26880 // CHECK16-NEXT: [[TMP38:%.*]] = load double*, double** [[C]], align 4 26881 // CHECK16-NEXT: [[TMP39:%.*]] = load i32, i32* [[I25]], align 4 26882 // CHECK16-NEXT: [[ARRAYIDX30:%.*]] = getelementptr inbounds double, double* [[TMP38]], i32 [[TMP39]] 26883 // CHECK16-NEXT: [[TMP40:%.*]] = load double, double* [[ARRAYIDX30]], align 4 26884 // CHECK16-NEXT: [[ADD31:%.*]] = fadd double [[TMP37]], [[TMP40]] 26885 // CHECK16-NEXT: [[TMP41:%.*]] = load double*, double** [[A]], align 4 26886 // CHECK16-NEXT: [[TMP42:%.*]] = load i32, i32* [[I25]], align 4 26887 // CHECK16-NEXT: [[ARRAYIDX32:%.*]] = getelementptr inbounds double, double* [[TMP41]], i32 [[TMP42]] 26888 // CHECK16-NEXT: store double [[ADD31]], double* [[ARRAYIDX32]], align 4 26889 // CHECK16-NEXT: br label [[FOR_INC33:%.*]] 26890 // CHECK16: for.inc33: 26891 // CHECK16-NEXT: [[TMP43:%.*]] = load i32, i32* [[I25]], align 4 26892 // CHECK16-NEXT: [[INC34:%.*]] = add nsw i32 [[TMP43]], 1 26893 // CHECK16-NEXT: store i32 [[INC34]], i32* [[I25]], align 4 26894 // CHECK16-NEXT: br label [[FOR_COND26]], !llvm.loop [[LOOP7:![0-9]+]] 26895 // CHECK16: for.end35: 26896 // CHECK16-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 26897 // CHECK16-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 26898 // CHECK16-NEXT: store i32 0, i32* [[I36]], align 4 26899 // CHECK16-NEXT: br label [[FOR_COND37:%.*]] 26900 // CHECK16: for.cond37: 26901 // CHECK16-NEXT: [[TMP45:%.*]] = load i32, i32* [[I36]], align 4 26902 // CHECK16-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 26903 // CHECK16-NEXT: [[CMP38:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 26904 // CHECK16-NEXT: br i1 [[CMP38]], label [[FOR_BODY39:%.*]], label [[FOR_END46:%.*]] 26905 // CHECK16: for.body39: 26906 // CHECK16-NEXT: [[TMP47:%.*]] = load double*, double** [[B]], align 4 26907 // CHECK16-NEXT: [[TMP48:%.*]] = load i32, i32* [[I36]], align 4 26908 // CHECK16-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds double, double* [[TMP47]], i32 [[TMP48]] 26909 // CHECK16-NEXT: [[TMP49:%.*]] = load double, double* [[ARRAYIDX40]], align 4 26910 // CHECK16-NEXT: [[TMP50:%.*]] = load double*, double** [[C]], align 4 26911 // CHECK16-NEXT: [[TMP51:%.*]] = load i32, i32* [[I36]], align 4 26912 // CHECK16-NEXT: [[ARRAYIDX41:%.*]] = getelementptr inbounds double, double* [[TMP50]], i32 [[TMP51]] 26913 // CHECK16-NEXT: [[TMP52:%.*]] = load double, double* [[ARRAYIDX41]], align 4 26914 // CHECK16-NEXT: [[ADD42:%.*]] = fadd double [[TMP49]], [[TMP52]] 26915 // CHECK16-NEXT: [[TMP53:%.*]] = load double*, double** [[A]], align 4 26916 // CHECK16-NEXT: [[TMP54:%.*]] = load i32, i32* [[I36]], align 4 26917 // CHECK16-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds double, double* [[TMP53]], i32 [[TMP54]] 26918 // CHECK16-NEXT: store double [[ADD42]], double* [[ARRAYIDX43]], align 4 26919 // CHECK16-NEXT: br label [[FOR_INC44:%.*]] 26920 // CHECK16: for.inc44: 26921 // CHECK16-NEXT: [[TMP55:%.*]] = load i32, i32* [[I36]], align 4 26922 // CHECK16-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP55]], 1 26923 // CHECK16-NEXT: store i32 [[INC45]], i32* [[I36]], align 4 26924 // CHECK16-NEXT: br label [[FOR_COND37]], !llvm.loop [[LOOP8:![0-9]+]] 26925 // CHECK16: for.end46: 26926 // CHECK16-NEXT: store i32 0, i32* [[I47]], align 4 26927 // CHECK16-NEXT: br label [[FOR_COND48:%.*]] 26928 // CHECK16: for.cond48: 26929 // CHECK16-NEXT: [[TMP56:%.*]] = load i32, i32* [[I47]], align 4 26930 // CHECK16-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 26931 // CHECK16-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 26932 // CHECK16-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END57:%.*]] 26933 // CHECK16: for.body50: 26934 // CHECK16-NEXT: [[TMP58:%.*]] = load double*, double** [[B]], align 4 26935 // CHECK16-NEXT: [[TMP59:%.*]] = load i32, i32* [[I47]], align 4 26936 // CHECK16-NEXT: [[ARRAYIDX51:%.*]] = getelementptr inbounds double, double* [[TMP58]], i32 [[TMP59]] 26937 // CHECK16-NEXT: [[TMP60:%.*]] = load double, double* [[ARRAYIDX51]], align 4 26938 // CHECK16-NEXT: [[TMP61:%.*]] = load double*, double** [[C]], align 4 26939 // CHECK16-NEXT: [[TMP62:%.*]] = load i32, i32* [[I47]], align 4 26940 // CHECK16-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds double, double* [[TMP61]], i32 [[TMP62]] 26941 // CHECK16-NEXT: [[TMP63:%.*]] = load double, double* [[ARRAYIDX52]], align 4 26942 // CHECK16-NEXT: [[ADD53:%.*]] = fadd double [[TMP60]], [[TMP63]] 26943 // CHECK16-NEXT: [[TMP64:%.*]] = load double*, double** [[A]], align 4 26944 // CHECK16-NEXT: [[TMP65:%.*]] = load i32, i32* [[I47]], align 4 26945 // CHECK16-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds double, double* [[TMP64]], i32 [[TMP65]] 26946 // CHECK16-NEXT: store double [[ADD53]], double* [[ARRAYIDX54]], align 4 26947 // CHECK16-NEXT: br label [[FOR_INC55:%.*]] 26948 // CHECK16: for.inc55: 26949 // CHECK16-NEXT: [[TMP66:%.*]] = load i32, i32* [[I47]], align 4 26950 // CHECK16-NEXT: [[INC56:%.*]] = add nsw i32 [[TMP66]], 1 26951 // CHECK16-NEXT: store i32 [[INC56]], i32* [[I47]], align 4 26952 // CHECK16-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP9:![0-9]+]] 26953 // CHECK16: for.end57: 26954 // CHECK16-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 26955 // CHECK16-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_58]], align 4 26956 // CHECK16-NEXT: store i32 0, i32* [[I59]], align 4 26957 // CHECK16-NEXT: br label [[FOR_COND60:%.*]] 26958 // CHECK16: for.cond60: 26959 // CHECK16-NEXT: [[TMP68:%.*]] = load i32, i32* [[I59]], align 4 26960 // CHECK16-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 26961 // CHECK16-NEXT: [[CMP61:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 26962 // CHECK16-NEXT: br i1 [[CMP61]], label [[FOR_BODY62:%.*]], label [[FOR_END69:%.*]] 26963 // CHECK16: for.body62: 26964 // CHECK16-NEXT: [[TMP70:%.*]] = load double*, double** [[B]], align 4 26965 // CHECK16-NEXT: [[TMP71:%.*]] = load i32, i32* [[I59]], align 4 26966 // CHECK16-NEXT: [[ARRAYIDX63:%.*]] = getelementptr inbounds double, double* [[TMP70]], i32 [[TMP71]] 26967 // CHECK16-NEXT: [[TMP72:%.*]] = load double, double* [[ARRAYIDX63]], align 4 26968 // CHECK16-NEXT: [[TMP73:%.*]] = load double*, double** [[C]], align 4 26969 // CHECK16-NEXT: [[TMP74:%.*]] = load i32, i32* [[I59]], align 4 26970 // CHECK16-NEXT: [[ARRAYIDX64:%.*]] = getelementptr inbounds double, double* [[TMP73]], i32 [[TMP74]] 26971 // CHECK16-NEXT: [[TMP75:%.*]] = load double, double* [[ARRAYIDX64]], align 4 26972 // CHECK16-NEXT: [[ADD65:%.*]] = fadd double [[TMP72]], [[TMP75]] 26973 // CHECK16-NEXT: [[TMP76:%.*]] = load double*, double** [[A]], align 4 26974 // CHECK16-NEXT: [[TMP77:%.*]] = load i32, i32* [[I59]], align 4 26975 // CHECK16-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds double, double* [[TMP76]], i32 [[TMP77]] 26976 // CHECK16-NEXT: store double [[ADD65]], double* [[ARRAYIDX66]], align 4 26977 // CHECK16-NEXT: br label [[FOR_INC67:%.*]] 26978 // CHECK16: for.inc67: 26979 // CHECK16-NEXT: [[TMP78:%.*]] = load i32, i32* [[I59]], align 4 26980 // CHECK16-NEXT: [[INC68:%.*]] = add nsw i32 [[TMP78]], 1 26981 // CHECK16-NEXT: store i32 [[INC68]], i32* [[I59]], align 4 26982 // CHECK16-NEXT: br label [[FOR_COND60]], !llvm.loop [[LOOP10:![0-9]+]] 26983 // CHECK16: for.end69: 26984 // CHECK16-NEXT: [[CALL:%.*]] = call i32 @_Z5tmainIiET_v() 26985 // CHECK16-NEXT: ret i32 [[CALL]] 26986 // 26987 // 26988 // CHECK16-LABEL: define {{[^@]+}}@_Z5tmainIiET_v 26989 // CHECK16-SAME: () #[[ATTR1:[0-9]+]] comdat { 26990 // CHECK16-NEXT: entry: 26991 // CHECK16-NEXT: [[A:%.*]] = alloca i32*, align 4 26992 // CHECK16-NEXT: [[B:%.*]] = alloca i32*, align 4 26993 // CHECK16-NEXT: [[C:%.*]] = alloca i32*, align 4 26994 // CHECK16-NEXT: [[N:%.*]] = alloca i32, align 4 26995 // CHECK16-NEXT: [[CH:%.*]] = alloca i32, align 4 26996 // CHECK16-NEXT: [[I:%.*]] = alloca i32, align 4 26997 // CHECK16-NEXT: [[I3:%.*]] = alloca i32, align 4 26998 // CHECK16-NEXT: [[I14:%.*]] = alloca i32, align 4 26999 // CHECK16-NEXT: [[I25:%.*]] = alloca i32, align 4 27000 // CHECK16-NEXT: [[DOTCAPTURE_EXPR_:%.*]] = alloca i32, align 4 27001 // CHECK16-NEXT: [[I36:%.*]] = alloca i32, align 4 27002 // CHECK16-NEXT: [[I47:%.*]] = alloca i32, align 4 27003 // CHECK16-NEXT: [[DOTCAPTURE_EXPR_58:%.*]] = alloca i32, align 4 27004 // CHECK16-NEXT: [[I59:%.*]] = alloca i32, align 4 27005 // CHECK16-NEXT: store i32 10000, i32* [[N]], align 4 27006 // CHECK16-NEXT: store i32 100, i32* [[CH]], align 4 27007 // CHECK16-NEXT: store i32 0, i32* [[I]], align 4 27008 // CHECK16-NEXT: br label [[FOR_COND:%.*]] 27009 // CHECK16: for.cond: 27010 // CHECK16-NEXT: [[TMP0:%.*]] = load i32, i32* [[I]], align 4 27011 // CHECK16-NEXT: [[TMP1:%.*]] = load i32, i32* [[N]], align 4 27012 // CHECK16-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] 27013 // CHECK16-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] 27014 // CHECK16: for.body: 27015 // CHECK16-NEXT: [[TMP2:%.*]] = load i32*, i32** [[B]], align 4 27016 // CHECK16-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 27017 // CHECK16-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[TMP2]], i32 [[TMP3]] 27018 // CHECK16-NEXT: [[TMP4:%.*]] = load i32, i32* [[ARRAYIDX]], align 4 27019 // CHECK16-NEXT: [[TMP5:%.*]] = load i32*, i32** [[C]], align 4 27020 // CHECK16-NEXT: [[TMP6:%.*]] = load i32, i32* [[I]], align 4 27021 // CHECK16-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i32, i32* [[TMP5]], i32 [[TMP6]] 27022 // CHECK16-NEXT: [[TMP7:%.*]] = load i32, i32* [[ARRAYIDX1]], align 4 27023 // CHECK16-NEXT: [[ADD:%.*]] = add nsw i32 [[TMP4]], [[TMP7]] 27024 // CHECK16-NEXT: [[TMP8:%.*]] = load i32*, i32** [[A]], align 4 27025 // CHECK16-NEXT: [[TMP9:%.*]] = load i32, i32* [[I]], align 4 27026 // CHECK16-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, i32* [[TMP8]], i32 [[TMP9]] 27027 // CHECK16-NEXT: store i32 [[ADD]], i32* [[ARRAYIDX2]], align 4 27028 // CHECK16-NEXT: br label [[FOR_INC:%.*]] 27029 // CHECK16: for.inc: 27030 // CHECK16-NEXT: [[TMP10:%.*]] = load i32, i32* [[I]], align 4 27031 // CHECK16-NEXT: [[INC:%.*]] = add nsw i32 [[TMP10]], 1 27032 // CHECK16-NEXT: store i32 [[INC]], i32* [[I]], align 4 27033 // CHECK16-NEXT: br label [[FOR_COND]], !llvm.loop [[LOOP11:![0-9]+]] 27034 // CHECK16: for.end: 27035 // CHECK16-NEXT: store i32 0, i32* [[I3]], align 4 27036 // CHECK16-NEXT: br label [[FOR_COND4:%.*]] 27037 // CHECK16: for.cond4: 27038 // CHECK16-NEXT: [[TMP11:%.*]] = load i32, i32* [[I3]], align 4 27039 // CHECK16-NEXT: [[TMP12:%.*]] = load i32, i32* [[N]], align 4 27040 // CHECK16-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] 27041 // CHECK16-NEXT: br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END13:%.*]] 27042 // CHECK16: for.body6: 27043 // CHECK16-NEXT: [[TMP13:%.*]] = load i32*, i32** [[B]], align 4 27044 // CHECK16-NEXT: [[TMP14:%.*]] = load i32, i32* [[I3]], align 4 27045 // CHECK16-NEXT: [[ARRAYIDX7:%.*]] = getelementptr inbounds i32, i32* [[TMP13]], i32 [[TMP14]] 27046 // CHECK16-NEXT: [[TMP15:%.*]] = load i32, i32* [[ARRAYIDX7]], align 4 27047 // CHECK16-NEXT: [[TMP16:%.*]] = load i32*, i32** [[C]], align 4 27048 // CHECK16-NEXT: [[TMP17:%.*]] = load i32, i32* [[I3]], align 4 27049 // CHECK16-NEXT: [[ARRAYIDX8:%.*]] = getelementptr inbounds i32, i32* [[TMP16]], i32 [[TMP17]] 27050 // CHECK16-NEXT: [[TMP18:%.*]] = load i32, i32* [[ARRAYIDX8]], align 4 27051 // CHECK16-NEXT: [[ADD9:%.*]] = add nsw i32 [[TMP15]], [[TMP18]] 27052 // CHECK16-NEXT: [[TMP19:%.*]] = load i32*, i32** [[A]], align 4 27053 // CHECK16-NEXT: [[TMP20:%.*]] = load i32, i32* [[I3]], align 4 27054 // CHECK16-NEXT: [[ARRAYIDX10:%.*]] = getelementptr inbounds i32, i32* [[TMP19]], i32 [[TMP20]] 27055 // CHECK16-NEXT: store i32 [[ADD9]], i32* [[ARRAYIDX10]], align 4 27056 // CHECK16-NEXT: br label [[FOR_INC11:%.*]] 27057 // CHECK16: for.inc11: 27058 // CHECK16-NEXT: [[TMP21:%.*]] = load i32, i32* [[I3]], align 4 27059 // CHECK16-NEXT: [[INC12:%.*]] = add nsw i32 [[TMP21]], 1 27060 // CHECK16-NEXT: store i32 [[INC12]], i32* [[I3]], align 4 27061 // CHECK16-NEXT: br label [[FOR_COND4]], !llvm.loop [[LOOP12:![0-9]+]] 27062 // CHECK16: for.end13: 27063 // CHECK16-NEXT: store i32 0, i32* [[I14]], align 4 27064 // CHECK16-NEXT: br label [[FOR_COND15:%.*]] 27065 // CHECK16: for.cond15: 27066 // CHECK16-NEXT: [[TMP22:%.*]] = load i32, i32* [[I14]], align 4 27067 // CHECK16-NEXT: [[TMP23:%.*]] = load i32, i32* [[N]], align 4 27068 // CHECK16-NEXT: [[CMP16:%.*]] = icmp slt i32 [[TMP22]], [[TMP23]] 27069 // CHECK16-NEXT: br i1 [[CMP16]], label [[FOR_BODY17:%.*]], label [[FOR_END24:%.*]] 27070 // CHECK16: for.body17: 27071 // CHECK16-NEXT: [[TMP24:%.*]] = load i32*, i32** [[B]], align 4 27072 // CHECK16-NEXT: [[TMP25:%.*]] = load i32, i32* [[I14]], align 4 27073 // CHECK16-NEXT: [[ARRAYIDX18:%.*]] = getelementptr inbounds i32, i32* [[TMP24]], i32 [[TMP25]] 27074 // CHECK16-NEXT: [[TMP26:%.*]] = load i32, i32* [[ARRAYIDX18]], align 4 27075 // CHECK16-NEXT: [[TMP27:%.*]] = load i32*, i32** [[C]], align 4 27076 // CHECK16-NEXT: [[TMP28:%.*]] = load i32, i32* [[I14]], align 4 27077 // CHECK16-NEXT: [[ARRAYIDX19:%.*]] = getelementptr inbounds i32, i32* [[TMP27]], i32 [[TMP28]] 27078 // CHECK16-NEXT: [[TMP29:%.*]] = load i32, i32* [[ARRAYIDX19]], align 4 27079 // CHECK16-NEXT: [[ADD20:%.*]] = add nsw i32 [[TMP26]], [[TMP29]] 27080 // CHECK16-NEXT: [[TMP30:%.*]] = load i32*, i32** [[A]], align 4 27081 // CHECK16-NEXT: [[TMP31:%.*]] = load i32, i32* [[I14]], align 4 27082 // CHECK16-NEXT: [[ARRAYIDX21:%.*]] = getelementptr inbounds i32, i32* [[TMP30]], i32 [[TMP31]] 27083 // CHECK16-NEXT: store i32 [[ADD20]], i32* [[ARRAYIDX21]], align 4 27084 // CHECK16-NEXT: br label [[FOR_INC22:%.*]] 27085 // CHECK16: for.inc22: 27086 // CHECK16-NEXT: [[TMP32:%.*]] = load i32, i32* [[I14]], align 4 27087 // CHECK16-NEXT: [[INC23:%.*]] = add nsw i32 [[TMP32]], 1 27088 // CHECK16-NEXT: store i32 [[INC23]], i32* [[I14]], align 4 27089 // CHECK16-NEXT: br label [[FOR_COND15]], !llvm.loop [[LOOP13:![0-9]+]] 27090 // CHECK16: for.end24: 27091 // CHECK16-NEXT: store i32 0, i32* [[I25]], align 4 27092 // CHECK16-NEXT: br label [[FOR_COND26:%.*]] 27093 // CHECK16: for.cond26: 27094 // CHECK16-NEXT: [[TMP33:%.*]] = load i32, i32* [[I25]], align 4 27095 // CHECK16-NEXT: [[TMP34:%.*]] = load i32, i32* [[N]], align 4 27096 // CHECK16-NEXT: [[CMP27:%.*]] = icmp slt i32 [[TMP33]], [[TMP34]] 27097 // CHECK16-NEXT: br i1 [[CMP27]], label [[FOR_BODY28:%.*]], label [[FOR_END35:%.*]] 27098 // CHECK16: for.body28: 27099 // CHECK16-NEXT: [[TMP35:%.*]] = load i32*, i32** [[B]], align 4 27100 // CHECK16-NEXT: [[TMP36:%.*]] = load i32, i32* [[I25]], align 4 27101 // CHECK16-NEXT: [[ARRAYIDX29:%.*]] = getelementptr inbounds i32, i32* [[TMP35]], i32 [[TMP36]] 27102 // CHECK16-NEXT: [[TMP37:%.*]] = load i32, i32* [[ARRAYIDX29]], align 4 27103 // CHECK16-NEXT: [[TMP38:%.*]] = load i32*, i32** [[C]], align 4 27104 // CHECK16-NEXT: [[TMP39:%.*]] = load i32, i32* [[I25]], align 4 27105 // CHECK16-NEXT: [[ARRAYIDX30:%.*]] = getelementptr inbounds i32, i32* [[TMP38]], i32 [[TMP39]] 27106 // CHECK16-NEXT: [[TMP40:%.*]] = load i32, i32* [[ARRAYIDX30]], align 4 27107 // CHECK16-NEXT: [[ADD31:%.*]] = add nsw i32 [[TMP37]], [[TMP40]] 27108 // CHECK16-NEXT: [[TMP41:%.*]] = load i32*, i32** [[A]], align 4 27109 // CHECK16-NEXT: [[TMP42:%.*]] = load i32, i32* [[I25]], align 4 27110 // CHECK16-NEXT: [[ARRAYIDX32:%.*]] = getelementptr inbounds i32, i32* [[TMP41]], i32 [[TMP42]] 27111 // CHECK16-NEXT: store i32 [[ADD31]], i32* [[ARRAYIDX32]], align 4 27112 // CHECK16-NEXT: br label [[FOR_INC33:%.*]] 27113 // CHECK16: for.inc33: 27114 // CHECK16-NEXT: [[TMP43:%.*]] = load i32, i32* [[I25]], align 4 27115 // CHECK16-NEXT: [[INC34:%.*]] = add nsw i32 [[TMP43]], 1 27116 // CHECK16-NEXT: store i32 [[INC34]], i32* [[I25]], align 4 27117 // CHECK16-NEXT: br label [[FOR_COND26]], !llvm.loop [[LOOP14:![0-9]+]] 27118 // CHECK16: for.end35: 27119 // CHECK16-NEXT: [[TMP44:%.*]] = load i32, i32* [[CH]], align 4 27120 // CHECK16-NEXT: store i32 [[TMP44]], i32* [[DOTCAPTURE_EXPR_]], align 4 27121 // CHECK16-NEXT: store i32 0, i32* [[I36]], align 4 27122 // CHECK16-NEXT: br label [[FOR_COND37:%.*]] 27123 // CHECK16: for.cond37: 27124 // CHECK16-NEXT: [[TMP45:%.*]] = load i32, i32* [[I36]], align 4 27125 // CHECK16-NEXT: [[TMP46:%.*]] = load i32, i32* [[N]], align 4 27126 // CHECK16-NEXT: [[CMP38:%.*]] = icmp slt i32 [[TMP45]], [[TMP46]] 27127 // CHECK16-NEXT: br i1 [[CMP38]], label [[FOR_BODY39:%.*]], label [[FOR_END46:%.*]] 27128 // CHECK16: for.body39: 27129 // CHECK16-NEXT: [[TMP47:%.*]] = load i32*, i32** [[B]], align 4 27130 // CHECK16-NEXT: [[TMP48:%.*]] = load i32, i32* [[I36]], align 4 27131 // CHECK16-NEXT: [[ARRAYIDX40:%.*]] = getelementptr inbounds i32, i32* [[TMP47]], i32 [[TMP48]] 27132 // CHECK16-NEXT: [[TMP49:%.*]] = load i32, i32* [[ARRAYIDX40]], align 4 27133 // CHECK16-NEXT: [[TMP50:%.*]] = load i32*, i32** [[C]], align 4 27134 // CHECK16-NEXT: [[TMP51:%.*]] = load i32, i32* [[I36]], align 4 27135 // CHECK16-NEXT: [[ARRAYIDX41:%.*]] = getelementptr inbounds i32, i32* [[TMP50]], i32 [[TMP51]] 27136 // CHECK16-NEXT: [[TMP52:%.*]] = load i32, i32* [[ARRAYIDX41]], align 4 27137 // CHECK16-NEXT: [[ADD42:%.*]] = add nsw i32 [[TMP49]], [[TMP52]] 27138 // CHECK16-NEXT: [[TMP53:%.*]] = load i32*, i32** [[A]], align 4 27139 // CHECK16-NEXT: [[TMP54:%.*]] = load i32, i32* [[I36]], align 4 27140 // CHECK16-NEXT: [[ARRAYIDX43:%.*]] = getelementptr inbounds i32, i32* [[TMP53]], i32 [[TMP54]] 27141 // CHECK16-NEXT: store i32 [[ADD42]], i32* [[ARRAYIDX43]], align 4 27142 // CHECK16-NEXT: br label [[FOR_INC44:%.*]] 27143 // CHECK16: for.inc44: 27144 // CHECK16-NEXT: [[TMP55:%.*]] = load i32, i32* [[I36]], align 4 27145 // CHECK16-NEXT: [[INC45:%.*]] = add nsw i32 [[TMP55]], 1 27146 // CHECK16-NEXT: store i32 [[INC45]], i32* [[I36]], align 4 27147 // CHECK16-NEXT: br label [[FOR_COND37]], !llvm.loop [[LOOP15:![0-9]+]] 27148 // CHECK16: for.end46: 27149 // CHECK16-NEXT: store i32 0, i32* [[I47]], align 4 27150 // CHECK16-NEXT: br label [[FOR_COND48:%.*]] 27151 // CHECK16: for.cond48: 27152 // CHECK16-NEXT: [[TMP56:%.*]] = load i32, i32* [[I47]], align 4 27153 // CHECK16-NEXT: [[TMP57:%.*]] = load i32, i32* [[N]], align 4 27154 // CHECK16-NEXT: [[CMP49:%.*]] = icmp slt i32 [[TMP56]], [[TMP57]] 27155 // CHECK16-NEXT: br i1 [[CMP49]], label [[FOR_BODY50:%.*]], label [[FOR_END57:%.*]] 27156 // CHECK16: for.body50: 27157 // CHECK16-NEXT: [[TMP58:%.*]] = load i32*, i32** [[B]], align 4 27158 // CHECK16-NEXT: [[TMP59:%.*]] = load i32, i32* [[I47]], align 4 27159 // CHECK16-NEXT: [[ARRAYIDX51:%.*]] = getelementptr inbounds i32, i32* [[TMP58]], i32 [[TMP59]] 27160 // CHECK16-NEXT: [[TMP60:%.*]] = load i32, i32* [[ARRAYIDX51]], align 4 27161 // CHECK16-NEXT: [[TMP61:%.*]] = load i32*, i32** [[C]], align 4 27162 // CHECK16-NEXT: [[TMP62:%.*]] = load i32, i32* [[I47]], align 4 27163 // CHECK16-NEXT: [[ARRAYIDX52:%.*]] = getelementptr inbounds i32, i32* [[TMP61]], i32 [[TMP62]] 27164 // CHECK16-NEXT: [[TMP63:%.*]] = load i32, i32* [[ARRAYIDX52]], align 4 27165 // CHECK16-NEXT: [[ADD53:%.*]] = add nsw i32 [[TMP60]], [[TMP63]] 27166 // CHECK16-NEXT: [[TMP64:%.*]] = load i32*, i32** [[A]], align 4 27167 // CHECK16-NEXT: [[TMP65:%.*]] = load i32, i32* [[I47]], align 4 27168 // CHECK16-NEXT: [[ARRAYIDX54:%.*]] = getelementptr inbounds i32, i32* [[TMP64]], i32 [[TMP65]] 27169 // CHECK16-NEXT: store i32 [[ADD53]], i32* [[ARRAYIDX54]], align 4 27170 // CHECK16-NEXT: br label [[FOR_INC55:%.*]] 27171 // CHECK16: for.inc55: 27172 // CHECK16-NEXT: [[TMP66:%.*]] = load i32, i32* [[I47]], align 4 27173 // CHECK16-NEXT: [[INC56:%.*]] = add nsw i32 [[TMP66]], 1 27174 // CHECK16-NEXT: store i32 [[INC56]], i32* [[I47]], align 4 27175 // CHECK16-NEXT: br label [[FOR_COND48]], !llvm.loop [[LOOP16:![0-9]+]] 27176 // CHECK16: for.end57: 27177 // CHECK16-NEXT: [[TMP67:%.*]] = load i32, i32* [[CH]], align 4 27178 // CHECK16-NEXT: store i32 [[TMP67]], i32* [[DOTCAPTURE_EXPR_58]], align 4 27179 // CHECK16-NEXT: store i32 0, i32* [[I59]], align 4 27180 // CHECK16-NEXT: br label [[FOR_COND60:%.*]] 27181 // CHECK16: for.cond60: 27182 // CHECK16-NEXT: [[TMP68:%.*]] = load i32, i32* [[I59]], align 4 27183 // CHECK16-NEXT: [[TMP69:%.*]] = load i32, i32* [[N]], align 4 27184 // CHECK16-NEXT: [[CMP61:%.*]] = icmp slt i32 [[TMP68]], [[TMP69]] 27185 // CHECK16-NEXT: br i1 [[CMP61]], label [[FOR_BODY62:%.*]], label [[FOR_END69:%.*]] 27186 // CHECK16: for.body62: 27187 // CHECK16-NEXT: [[TMP70:%.*]] = load i32*, i32** [[B]], align 4 27188 // CHECK16-NEXT: [[TMP71:%.*]] = load i32, i32* [[I59]], align 4 27189 // CHECK16-NEXT: [[ARRAYIDX63:%.*]] = getelementptr inbounds i32, i32* [[TMP70]], i32 [[TMP71]] 27190 // CHECK16-NEXT: [[TMP72:%.*]] = load i32, i32* [[ARRAYIDX63]], align 4 27191 // CHECK16-NEXT: [[TMP73:%.*]] = load i32*, i32** [[C]], align 4 27192 // CHECK16-NEXT: [[TMP74:%.*]] = load i32, i32* [[I59]], align 4 27193 // CHECK16-NEXT: [[ARRAYIDX64:%.*]] = getelementptr inbounds i32, i32* [[TMP73]], i32 [[TMP74]] 27194 // CHECK16-NEXT: [[TMP75:%.*]] = load i32, i32* [[ARRAYIDX64]], align 4 27195 // CHECK16-NEXT: [[ADD65:%.*]] = add nsw i32 [[TMP72]], [[TMP75]] 27196 // CHECK16-NEXT: [[TMP76:%.*]] = load i32*, i32** [[A]], align 4 27197 // CHECK16-NEXT: [[TMP77:%.*]] = load i32, i32* [[I59]], align 4 27198 // CHECK16-NEXT: [[ARRAYIDX66:%.*]] = getelementptr inbounds i32, i32* [[TMP76]], i32 [[TMP77]] 27199 // CHECK16-NEXT: store i32 [[ADD65]], i32* [[ARRAYIDX66]], align 4 27200 // CHECK16-NEXT: br label [[FOR_INC67:%.*]] 27201 // CHECK16: for.inc67: 27202 // CHECK16-NEXT: [[TMP78:%.*]] = load i32, i32* [[I59]], align 4 27203 // CHECK16-NEXT: [[INC68:%.*]] = add nsw i32 [[TMP78]], 1 27204 // CHECK16-NEXT: store i32 [[INC68]], i32* [[I59]], align 4 27205 // CHECK16-NEXT: br label [[FOR_COND60]], !llvm.loop [[LOOP17:![0-9]+]] 27206 // CHECK16: for.end69: 27207 // CHECK16-NEXT: ret i32 0 27208 // 27209