1 #![expect(non_snake_case, reason = "DSL style here")] 2 3 use crate::cdsl::instructions::{ 4 AllInstructions, InstructionBuilder as Inst, InstructionGroupBuilder, 5 }; 6 use crate::cdsl::operands::Operand; 7 use crate::cdsl::types::{LaneType, ValueType}; 8 use crate::cdsl::typevar::{Interval, TypeSetBuilder, TypeVar}; 9 use crate::shared::formats::Formats; 10 use crate::shared::types; 11 use crate::shared::{entities::EntityRefs, immediates::Immediates}; 12 13 #[inline(never)] 14 fn define_control_flow( 15 ig: &mut InstructionGroupBuilder, 16 formats: &Formats, 17 imm: &Immediates, 18 entities: &EntityRefs, 19 ) { 20 ig.push( 21 Inst::new( 22 "jump", 23 r#" 24 Jump. 25 26 Unconditionally jump to a basic block, passing the specified 27 block arguments. The number and types of arguments must match the 28 destination block. 29 "#, 30 &formats.jump, 31 ) 32 .operands_in(vec![ 33 Operand::new("block_call", &entities.block_call) 34 .with_doc("Destination basic block, with its arguments provided"), 35 ]) 36 .branches(), 37 ); 38 39 let ScalarTruthy = &TypeVar::new( 40 "ScalarTruthy", 41 "A scalar truthy type", 42 TypeSetBuilder::new().ints(Interval::All).build(), 43 ); 44 45 ig.push( 46 Inst::new( 47 "brif", 48 r#" 49 Conditional branch when cond is non-zero. 50 51 Take the ``then`` branch when ``c != 0``, and the ``else`` branch otherwise. 52 "#, 53 &formats.brif, 54 ) 55 .operands_in(vec![ 56 Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"), 57 Operand::new("block_then", &entities.block_then).with_doc("Then block"), 58 Operand::new("block_else", &entities.block_else).with_doc("Else block"), 59 ]) 60 .branches(), 61 ); 62 63 { 64 let _i32 = &TypeVar::new( 65 "i32", 66 "A 32 bit scalar integer type", 67 TypeSetBuilder::new().ints(32..32).build(), 68 ); 69 70 ig.push( 71 Inst::new( 72 "br_table", 73 r#" 74 Indirect branch via jump table. 75 76 Use ``x`` as an unsigned index into the jump table ``JT``. If a jump 77 table entry is found, branch to the corresponding block. If no entry was 78 found or the index is out-of-bounds, branch to the default block of the 79 table. 80 81 Note that this branch instruction can't pass arguments to the targeted 82 blocks. Split critical edges as needed to work around this. 83 84 Do not confuse this with "tables" in WebAssembly. ``br_table`` is for 85 jump tables with destinations within the current function only -- think 86 of a ``match`` in Rust or a ``switch`` in C. If you want to call a 87 function in a dynamic library, that will typically use 88 ``call_indirect``. 89 "#, 90 &formats.branch_table, 91 ) 92 .operands_in(vec![ 93 Operand::new("x", _i32).with_doc("i32 index into jump table"), 94 Operand::new("JT", &entities.jump_table), 95 ]) 96 .branches(), 97 ); 98 } 99 100 let iAddr = &TypeVar::new( 101 "iAddr", 102 "An integer address type", 103 TypeSetBuilder::new().ints(32..64).build(), 104 ); 105 106 ig.push( 107 Inst::new( 108 "debugtrap", 109 r#" 110 Encodes an assembly debug trap. 111 "#, 112 &formats.nullary, 113 ) 114 .other_side_effects() 115 .can_load() 116 .can_store(), 117 ); 118 119 ig.push( 120 Inst::new( 121 "trap", 122 r#" 123 Terminate execution unconditionally. 124 "#, 125 &formats.trap, 126 ) 127 .operands_in(vec![Operand::new("code", &imm.trapcode)]) 128 .can_trap() 129 .terminates_block(), 130 ); 131 132 ig.push( 133 Inst::new( 134 "trapz", 135 r#" 136 Trap when zero. 137 138 if ``c`` is non-zero, execution continues at the following instruction. 139 "#, 140 &formats.cond_trap, 141 ) 142 .operands_in(vec![ 143 Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"), 144 Operand::new("code", &imm.trapcode), 145 ]) 146 .can_trap() 147 // When one `trapz` dominates another `trapz` and they have identical 148 // conditions and trap codes, it is safe to deduplicate them (like GVN, 149 // although there is not actually any value being numbered). Either the 150 // first `trapz` raised a trap and execution halted, or it didn't and 151 // therefore the dominated `trapz` will not raise a trap either. 152 .side_effects_idempotent(), 153 ); 154 155 ig.push( 156 Inst::new( 157 "trapnz", 158 r#" 159 Trap when non-zero. 160 161 If ``c`` is zero, execution continues at the following instruction. 162 "#, 163 &formats.cond_trap, 164 ) 165 .operands_in(vec![ 166 Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"), 167 Operand::new("code", &imm.trapcode), 168 ]) 169 .can_trap() 170 // See the above comment for `trapz` and idempotent side effects. 171 .side_effects_idempotent(), 172 ); 173 174 ig.push( 175 Inst::new( 176 "return", 177 r#" 178 Return from the function. 179 180 Unconditionally transfer control to the calling function, passing the 181 provided return values. The list of return values must match the 182 function signature's return types. 183 "#, 184 &formats.multiary, 185 ) 186 .operands_in(vec![ 187 Operand::new("rvals", &entities.varargs).with_doc("return values"), 188 ]) 189 .returns(), 190 ); 191 192 ig.push( 193 Inst::new( 194 "call", 195 r#" 196 Direct function call. 197 198 Call a function which has been declared in the preamble. The argument 199 types must match the function's signature. 200 "#, 201 &formats.call, 202 ) 203 .operands_in(vec![ 204 Operand::new("FN", &entities.func_ref) 205 .with_doc("function to call, declared by `function`"), 206 Operand::new("args", &entities.varargs).with_doc("call arguments"), 207 ]) 208 .operands_out(vec![ 209 Operand::new("rvals", &entities.varargs).with_doc("return values"), 210 ]) 211 .call(), 212 ); 213 214 ig.push( 215 Inst::new( 216 "call_indirect", 217 r#" 218 Indirect function call. 219 220 Call the function pointed to by `callee` with the given arguments. The 221 called function must match the specified signature. 222 223 Note that this is different from WebAssembly's ``call_indirect``; the 224 callee is a native address, rather than a table index. For WebAssembly, 225 `table_addr` and `load` are used to obtain a native address 226 from a table. 227 "#, 228 &formats.call_indirect, 229 ) 230 .operands_in(vec![ 231 Operand::new("SIG", &entities.sig_ref).with_doc("function signature"), 232 Operand::new("callee", iAddr).with_doc("address of function to call"), 233 Operand::new("args", &entities.varargs).with_doc("call arguments"), 234 ]) 235 .operands_out(vec![ 236 Operand::new("rvals", &entities.varargs).with_doc("return values"), 237 ]) 238 .call(), 239 ); 240 241 ig.push( 242 Inst::new( 243 "return_call", 244 r#" 245 Direct tail call. 246 247 Tail call a function which has been declared in the preamble. The 248 argument types must match the function's signature, the caller and 249 callee calling conventions must be the same, and must be a calling 250 convention that supports tail calls. 251 252 This instruction is a block terminator. 253 "#, 254 &formats.call, 255 ) 256 .operands_in(vec![ 257 Operand::new("FN", &entities.func_ref) 258 .with_doc("function to call, declared by `function`"), 259 Operand::new("args", &entities.varargs).with_doc("call arguments"), 260 ]) 261 .returns() 262 .call(), 263 ); 264 265 ig.push( 266 Inst::new( 267 "return_call_indirect", 268 r#" 269 Indirect tail call. 270 271 Call the function pointed to by `callee` with the given arguments. The 272 argument types must match the function's signature, the caller and 273 callee calling conventions must be the same, and must be a calling 274 convention that supports tail calls. 275 276 This instruction is a block terminator. 277 278 Note that this is different from WebAssembly's ``tail_call_indirect``; 279 the callee is a native address, rather than a table index. For 280 WebAssembly, `table_addr` and `load` are used to obtain a native address 281 from a table. 282 "#, 283 &formats.call_indirect, 284 ) 285 .operands_in(vec![ 286 Operand::new("SIG", &entities.sig_ref).with_doc("function signature"), 287 Operand::new("callee", iAddr).with_doc("address of function to call"), 288 Operand::new("args", &entities.varargs).with_doc("call arguments"), 289 ]) 290 .returns() 291 .call(), 292 ); 293 294 ig.push( 295 Inst::new( 296 "func_addr", 297 r#" 298 Get the address of a function. 299 300 Compute the absolute address of a function declared in the preamble. 301 The returned address can be used as a ``callee`` argument to 302 `call_indirect`. This is also a method for calling functions that 303 are too far away to be addressable by a direct `call` 304 instruction. 305 "#, 306 &formats.func_addr, 307 ) 308 .operands_in(vec![ 309 Operand::new("FN", &entities.func_ref) 310 .with_doc("function to call, declared by `function`"), 311 ]) 312 .operands_out(vec![Operand::new("addr", iAddr)]), 313 ); 314 315 ig.push( 316 Inst::new( 317 "try_call", 318 r#" 319 Call a function, catching the specified exceptions. 320 321 Call the function pointed to by `callee` with the given arguments. On 322 normal return, branch to the first target, with function returns 323 available as `retN` block arguments. On exceptional return, 324 look up the thrown exception tag in the provided exception table; 325 if the tag matches one of the targets, branch to the matching 326 target with the exception payloads available as `exnN` block arguments. 327 If no tag matches, then propagate the exception up the stack. 328 329 It is the Cranelift embedder's responsibility to define the meaning 330 of tags: they are accepted by this instruction and passed through 331 to unwind metadata tables in Cranelift's output. Actual unwinding is 332 outside the purview of the core Cranelift compiler. 333 334 Payload values on exception are passed in fixed register(s) that are 335 defined by the platform and ABI. See the documentation on `CallConv` 336 for details. 337 "#, 338 &formats.try_call, 339 ) 340 .operands_in(vec![ 341 Operand::new("callee", &entities.func_ref) 342 .with_doc("function to call, declared by `function`"), 343 Operand::new("args", &entities.varargs).with_doc("call arguments"), 344 Operand::new("ET", &entities.exception_table).with_doc("exception table"), 345 ]) 346 .call() 347 .branches(), 348 ); 349 350 ig.push( 351 Inst::new( 352 "try_call_indirect", 353 r#" 354 Call a function, catching the specified exceptions. 355 356 Call the function pointed to by `callee` with the given arguments. On 357 normal return, branch to the first target, with function returns 358 available as `retN` block arguments. On exceptional return, 359 look up the thrown exception tag in the provided exception table; 360 if the tag matches one of the targets, branch to the matching 361 target with the exception payloads available as `exnN` block arguments. 362 If no tag matches, then propagate the exception up the stack. 363 364 It is the Cranelift embedder's responsibility to define the meaning 365 of tags: they are accepted by this instruction and passed through 366 to unwind metadata tables in Cranelift's output. Actual unwinding is 367 outside the purview of the core Cranelift compiler. 368 369 Payload values on exception are passed in fixed register(s) that are 370 defined by the platform and ABI. See the documentation on `CallConv` 371 for details. 372 "#, 373 &formats.try_call_indirect, 374 ) 375 .operands_in(vec![ 376 Operand::new("callee", iAddr).with_doc("address of function to call"), 377 Operand::new("args", &entities.varargs).with_doc("call arguments"), 378 Operand::new("ET", &entities.exception_table).with_doc("exception table"), 379 ]) 380 .call() 381 .branches(), 382 ); 383 } 384 385 #[inline(never)] 386 fn define_simd_lane_access( 387 ig: &mut InstructionGroupBuilder, 388 formats: &Formats, 389 imm: &Immediates, 390 _: &EntityRefs, 391 ) { 392 let TxN = &TypeVar::new( 393 "TxN", 394 "A SIMD vector type", 395 TypeSetBuilder::new() 396 .ints(Interval::All) 397 .floats(Interval::All) 398 .simd_lanes(Interval::All) 399 .dynamic_simd_lanes(Interval::All) 400 .includes_scalars(false) 401 .build(), 402 ); 403 404 ig.push( 405 Inst::new( 406 "splat", 407 r#" 408 Vector splat. 409 410 Return a vector whose lanes are all ``x``. 411 "#, 412 &formats.unary, 413 ) 414 .operands_in(vec![ 415 Operand::new("x", &TxN.lane_of()).with_doc("Value to splat to all lanes"), 416 ]) 417 .operands_out(vec![Operand::new("a", TxN)]), 418 ); 419 420 let I8x16 = &TypeVar::new( 421 "I8x16", 422 "A SIMD vector type consisting of 16 lanes of 8-bit integers", 423 TypeSetBuilder::new() 424 .ints(8..8) 425 .simd_lanes(16..16) 426 .includes_scalars(false) 427 .build(), 428 ); 429 430 ig.push( 431 Inst::new( 432 "swizzle", 433 r#" 434 Vector swizzle. 435 436 Returns a new vector with byte-width lanes selected from the lanes of the first input 437 vector ``x`` specified in the second input vector ``s``. The indices ``i`` in range 438 ``[0, 15]`` select the ``i``-th element of ``x``. For indices outside of the range the 439 resulting lane is 0. Note that this operates on byte-width lanes. 440 "#, 441 &formats.binary, 442 ) 443 .operands_in(vec![ 444 Operand::new("x", I8x16).with_doc("Vector to modify by re-arranging lanes"), 445 Operand::new("y", I8x16).with_doc("Mask for re-arranging lanes"), 446 ]) 447 .operands_out(vec![Operand::new("a", I8x16)]), 448 ); 449 450 ig.push( 451 Inst::new( 452 "x86_pshufb", 453 r#" 454 A vector swizzle lookalike which has the semantics of `pshufb` on x64. 455 456 This instruction will permute the 8-bit lanes of `x` with the indices 457 specified in `y`. Each lane in the mask, `y`, uses the bottom four 458 bits for selecting the lane from `x` unless the most significant bit 459 is set, in which case the lane is zeroed. The output vector will have 460 the following contents when the element of `y` is in these ranges: 461 462 * `[0, 127]` -> `x[y[i] % 16]` 463 * `[128, 255]` -> 0 464 "#, 465 &formats.binary, 466 ) 467 .operands_in(vec![ 468 Operand::new("x", I8x16).with_doc("Vector to modify by re-arranging lanes"), 469 Operand::new("y", I8x16).with_doc("Mask for re-arranging lanes"), 470 ]) 471 .operands_out(vec![Operand::new("a", I8x16)]), 472 ); 473 474 ig.push( 475 Inst::new( 476 "insertlane", 477 r#" 478 Insert ``y`` as lane ``Idx`` in x. 479 480 The lane index, ``Idx``, is an immediate value, not an SSA value. It 481 must indicate a valid lane index for the type of ``x``. 482 "#, 483 &formats.ternary_imm8, 484 ) 485 .operands_in(vec![ 486 Operand::new("x", TxN).with_doc("The vector to modify"), 487 Operand::new("y", &TxN.lane_of()).with_doc("New lane value"), 488 Operand::new("Idx", &imm.uimm8).with_doc("Lane index"), 489 ]) 490 .operands_out(vec![Operand::new("a", TxN)]), 491 ); 492 493 ig.push( 494 Inst::new( 495 "extractlane", 496 r#" 497 Extract lane ``Idx`` from ``x``. 498 499 The lane index, ``Idx``, is an immediate value, not an SSA value. It 500 must indicate a valid lane index for the type of ``x``. Note that the upper bits of ``a`` 501 may or may not be zeroed depending on the ISA but the type system should prevent using 502 ``a`` as anything other than the extracted value. 503 "#, 504 &formats.binary_imm8, 505 ) 506 .operands_in(vec![ 507 Operand::new("x", TxN), 508 Operand::new("Idx", &imm.uimm8).with_doc("Lane index"), 509 ]) 510 .operands_out(vec![Operand::new("a", &TxN.lane_of())]), 511 ); 512 } 513 514 #[inline(never)] 515 fn define_simd_arithmetic( 516 ig: &mut InstructionGroupBuilder, 517 formats: &Formats, 518 _: &Immediates, 519 _: &EntityRefs, 520 ) { 521 let Int = &TypeVar::new( 522 "Int", 523 "A scalar or vector integer type", 524 TypeSetBuilder::new() 525 .ints(Interval::All) 526 .simd_lanes(Interval::All) 527 .build(), 528 ); 529 530 ig.push( 531 Inst::new( 532 "smin", 533 r#" 534 Signed integer minimum. 535 "#, 536 &formats.binary, 537 ) 538 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 539 .operands_out(vec![Operand::new("a", Int)]), 540 ); 541 542 ig.push( 543 Inst::new( 544 "umin", 545 r#" 546 Unsigned integer minimum. 547 "#, 548 &formats.binary, 549 ) 550 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 551 .operands_out(vec![Operand::new("a", Int)]), 552 ); 553 554 ig.push( 555 Inst::new( 556 "smax", 557 r#" 558 Signed integer maximum. 559 "#, 560 &formats.binary, 561 ) 562 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 563 .operands_out(vec![Operand::new("a", Int)]), 564 ); 565 566 ig.push( 567 Inst::new( 568 "umax", 569 r#" 570 Unsigned integer maximum. 571 "#, 572 &formats.binary, 573 ) 574 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 575 .operands_out(vec![Operand::new("a", Int)]), 576 ); 577 578 let IxN = &TypeVar::new( 579 "IxN", 580 "A SIMD vector type containing integers", 581 TypeSetBuilder::new() 582 .ints(Interval::All) 583 .simd_lanes(Interval::All) 584 .includes_scalars(false) 585 .build(), 586 ); 587 588 ig.push( 589 Inst::new( 590 "avg_round", 591 r#" 592 Unsigned average with rounding: `a := (x + y + 1) // 2` 593 594 The addition does not lose any information (such as from overflow). 595 "#, 596 &formats.binary, 597 ) 598 .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)]) 599 .operands_out(vec![Operand::new("a", IxN)]), 600 ); 601 602 ig.push( 603 Inst::new( 604 "uadd_sat", 605 r#" 606 Add with unsigned saturation. 607 608 This is similar to `iadd` but the operands are interpreted as unsigned integers and their 609 summed result, instead of wrapping, will be saturated to the highest unsigned integer for 610 the controlling type (e.g. `0xFF` for i8). 611 "#, 612 &formats.binary, 613 ) 614 .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)]) 615 .operands_out(vec![Operand::new("a", IxN)]), 616 ); 617 618 ig.push( 619 Inst::new( 620 "sadd_sat", 621 r#" 622 Add with signed saturation. 623 624 This is similar to `iadd` but the operands are interpreted as signed integers and their 625 summed result, instead of wrapping, will be saturated to the lowest or highest 626 signed integer for the controlling type (e.g. `0x80` or `0x7F` for i8). For example, 627 since an `sadd_sat.i8` of `0x70` and `0x70` is greater than `0x7F`, the result will be 628 clamped to `0x7F`. 629 "#, 630 &formats.binary, 631 ) 632 .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)]) 633 .operands_out(vec![Operand::new("a", IxN)]), 634 ); 635 636 ig.push( 637 Inst::new( 638 "usub_sat", 639 r#" 640 Subtract with unsigned saturation. 641 642 This is similar to `isub` but the operands are interpreted as unsigned integers and their 643 difference, instead of wrapping, will be saturated to the lowest unsigned integer for 644 the controlling type (e.g. `0x00` for i8). 645 "#, 646 &formats.binary, 647 ) 648 .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)]) 649 .operands_out(vec![Operand::new("a", IxN)]), 650 ); 651 652 ig.push( 653 Inst::new( 654 "ssub_sat", 655 r#" 656 Subtract with signed saturation. 657 658 This is similar to `isub` but the operands are interpreted as signed integers and their 659 difference, instead of wrapping, will be saturated to the lowest or highest 660 signed integer for the controlling type (e.g. `0x80` or `0x7F` for i8). 661 "#, 662 &formats.binary, 663 ) 664 .operands_in(vec![Operand::new("x", IxN), Operand::new("y", IxN)]) 665 .operands_out(vec![Operand::new("a", IxN)]), 666 ); 667 } 668 669 pub(crate) fn define( 670 all_instructions: &mut AllInstructions, 671 formats: &Formats, 672 imm: &Immediates, 673 entities: &EntityRefs, 674 ) { 675 let mut ig = InstructionGroupBuilder::new(all_instructions); 676 677 define_control_flow(&mut ig, formats, imm, entities); 678 define_simd_lane_access(&mut ig, formats, imm, entities); 679 define_simd_arithmetic(&mut ig, formats, imm, entities); 680 681 // Operand kind shorthands. 682 let i8: &TypeVar = &ValueType::from(LaneType::from(types::Int::I8)).into(); 683 let f16_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F16)).into(); 684 let f32_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F32)).into(); 685 let f64_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F64)).into(); 686 let f128_: &TypeVar = &ValueType::from(LaneType::from(types::Float::F128)).into(); 687 688 // Starting definitions. 689 let Int = &TypeVar::new( 690 "Int", 691 "A scalar or vector integer type", 692 TypeSetBuilder::new() 693 .ints(Interval::All) 694 .simd_lanes(Interval::All) 695 .dynamic_simd_lanes(Interval::All) 696 .build(), 697 ); 698 699 let NarrowInt = &TypeVar::new( 700 "NarrowInt", 701 "An integer type of width up to `i64`", 702 TypeSetBuilder::new().ints(8..64).build(), 703 ); 704 705 let ScalarTruthy = &TypeVar::new( 706 "ScalarTruthy", 707 "A scalar truthy type", 708 TypeSetBuilder::new().ints(Interval::All).build(), 709 ); 710 711 let iB = &TypeVar::new( 712 "iB", 713 "A scalar integer type", 714 TypeSetBuilder::new().ints(Interval::All).build(), 715 ); 716 717 let iSwappable = &TypeVar::new( 718 "iSwappable", 719 "A multi byte scalar integer type", 720 TypeSetBuilder::new().ints(16..128).build(), 721 ); 722 723 let iAddr = &TypeVar::new( 724 "iAddr", 725 "An integer address type", 726 TypeSetBuilder::new().ints(32..64).build(), 727 ); 728 729 let TxN = &TypeVar::new( 730 "TxN", 731 "A SIMD vector type", 732 TypeSetBuilder::new() 733 .ints(Interval::All) 734 .floats(Interval::All) 735 .simd_lanes(Interval::All) 736 .includes_scalars(false) 737 .build(), 738 ); 739 let Any = &TypeVar::new( 740 "Any", 741 "Any integer, float, or reference scalar or vector type", 742 TypeSetBuilder::new() 743 .ints(Interval::All) 744 .floats(Interval::All) 745 .simd_lanes(Interval::All) 746 .includes_scalars(true) 747 .build(), 748 ); 749 750 let Mem = &TypeVar::new( 751 "Mem", 752 "Any type that can be stored in memory", 753 TypeSetBuilder::new() 754 .ints(Interval::All) 755 .floats(Interval::All) 756 .simd_lanes(Interval::All) 757 .dynamic_simd_lanes(Interval::All) 758 .build(), 759 ); 760 761 let MemTo = &TypeVar::copy_from(Mem, "MemTo".to_string()); 762 763 ig.push( 764 Inst::new( 765 "load", 766 r#" 767 Load from memory at ``p + Offset``. 768 769 This is a polymorphic instruction that can load any value type which 770 has a memory representation. 771 "#, 772 &formats.load, 773 ) 774 .operands_in(vec![ 775 Operand::new("MemFlags", &imm.memflags), 776 Operand::new("p", iAddr), 777 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 778 ]) 779 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]) 780 .can_load(), 781 ); 782 783 ig.push( 784 Inst::new( 785 "store", 786 r#" 787 Store ``x`` to memory at ``p + Offset``. 788 789 This is a polymorphic instruction that can store any value type with a 790 memory representation. 791 "#, 792 &formats.store, 793 ) 794 .operands_in(vec![ 795 Operand::new("MemFlags", &imm.memflags), 796 Operand::new("x", Mem).with_doc("Value to be stored"), 797 Operand::new("p", iAddr), 798 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 799 ]) 800 .can_store(), 801 ); 802 803 let iExt8 = &TypeVar::new( 804 "iExt8", 805 "An integer type with more than 8 bits", 806 TypeSetBuilder::new().ints(16..64).build(), 807 ); 808 809 ig.push( 810 Inst::new( 811 "uload8", 812 r#" 813 Load 8 bits from memory at ``p + Offset`` and zero-extend. 814 815 This is equivalent to ``load.i8`` followed by ``uextend``. 816 "#, 817 &formats.load, 818 ) 819 .operands_in(vec![ 820 Operand::new("MemFlags", &imm.memflags), 821 Operand::new("p", iAddr), 822 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 823 ]) 824 .operands_out(vec![Operand::new("a", iExt8)]) 825 .can_load(), 826 ); 827 828 ig.push( 829 Inst::new( 830 "sload8", 831 r#" 832 Load 8 bits from memory at ``p + Offset`` and sign-extend. 833 834 This is equivalent to ``load.i8`` followed by ``sextend``. 835 "#, 836 &formats.load, 837 ) 838 .operands_in(vec![ 839 Operand::new("MemFlags", &imm.memflags), 840 Operand::new("p", iAddr), 841 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 842 ]) 843 .operands_out(vec![Operand::new("a", iExt8)]) 844 .can_load(), 845 ); 846 847 ig.push( 848 Inst::new( 849 "istore8", 850 r#" 851 Store the low 8 bits of ``x`` to memory at ``p + Offset``. 852 853 This is equivalent to ``ireduce.i8`` followed by ``store.i8``. 854 "#, 855 &formats.store, 856 ) 857 .operands_in(vec![ 858 Operand::new("MemFlags", &imm.memflags), 859 Operand::new("x", iExt8), 860 Operand::new("p", iAddr), 861 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 862 ]) 863 .can_store(), 864 ); 865 866 let iExt16 = &TypeVar::new( 867 "iExt16", 868 "An integer type with more than 16 bits", 869 TypeSetBuilder::new().ints(32..64).build(), 870 ); 871 872 ig.push( 873 Inst::new( 874 "uload16", 875 r#" 876 Load 16 bits from memory at ``p + Offset`` and zero-extend. 877 878 This is equivalent to ``load.i16`` followed by ``uextend``. 879 "#, 880 &formats.load, 881 ) 882 .operands_in(vec![ 883 Operand::new("MemFlags", &imm.memflags), 884 Operand::new("p", iAddr), 885 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 886 ]) 887 .operands_out(vec![Operand::new("a", iExt16)]) 888 .can_load(), 889 ); 890 891 ig.push( 892 Inst::new( 893 "sload16", 894 r#" 895 Load 16 bits from memory at ``p + Offset`` and sign-extend. 896 897 This is equivalent to ``load.i16`` followed by ``sextend``. 898 "#, 899 &formats.load, 900 ) 901 .operands_in(vec![ 902 Operand::new("MemFlags", &imm.memflags), 903 Operand::new("p", iAddr), 904 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 905 ]) 906 .operands_out(vec![Operand::new("a", iExt16)]) 907 .can_load(), 908 ); 909 910 ig.push( 911 Inst::new( 912 "istore16", 913 r#" 914 Store the low 16 bits of ``x`` to memory at ``p + Offset``. 915 916 This is equivalent to ``ireduce.i16`` followed by ``store.i16``. 917 "#, 918 &formats.store, 919 ) 920 .operands_in(vec![ 921 Operand::new("MemFlags", &imm.memflags), 922 Operand::new("x", iExt16), 923 Operand::new("p", iAddr), 924 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 925 ]) 926 .can_store(), 927 ); 928 929 let iExt32 = &TypeVar::new( 930 "iExt32", 931 "An integer type with more than 32 bits", 932 TypeSetBuilder::new().ints(64..64).build(), 933 ); 934 935 ig.push( 936 Inst::new( 937 "uload32", 938 r#" 939 Load 32 bits from memory at ``p + Offset`` and zero-extend. 940 941 This is equivalent to ``load.i32`` followed by ``uextend``. 942 "#, 943 &formats.load, 944 ) 945 .operands_in(vec![ 946 Operand::new("MemFlags", &imm.memflags), 947 Operand::new("p", iAddr), 948 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 949 ]) 950 .operands_out(vec![Operand::new("a", iExt32)]) 951 .can_load(), 952 ); 953 954 ig.push( 955 Inst::new( 956 "sload32", 957 r#" 958 Load 32 bits from memory at ``p + Offset`` and sign-extend. 959 960 This is equivalent to ``load.i32`` followed by ``sextend``. 961 "#, 962 &formats.load, 963 ) 964 .operands_in(vec![ 965 Operand::new("MemFlags", &imm.memflags), 966 Operand::new("p", iAddr), 967 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 968 ]) 969 .operands_out(vec![Operand::new("a", iExt32)]) 970 .can_load(), 971 ); 972 973 ig.push( 974 Inst::new( 975 "istore32", 976 r#" 977 Store the low 32 bits of ``x`` to memory at ``p + Offset``. 978 979 This is equivalent to ``ireduce.i32`` followed by ``store.i32``. 980 "#, 981 &formats.store, 982 ) 983 .operands_in(vec![ 984 Operand::new("MemFlags", &imm.memflags), 985 Operand::new("x", iExt32), 986 Operand::new("p", iAddr), 987 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 988 ]) 989 .can_store(), 990 ); 991 ig.push( 992 Inst::new( 993 "stack_switch", 994 r#" 995 Suspends execution of the current stack and resumes execution of another 996 one. 997 998 The target stack to switch to is identified by the data stored at 999 ``load_context_ptr``. Before switching, this instruction stores 1000 analogous information about the 1001 current (i.e., original) stack at ``store_context_ptr``, to 1002 enabled switching back to the original stack at a later point. 1003 1004 The size, alignment and layout of the information stored at 1005 ``load_context_ptr`` and ``store_context_ptr`` is platform-dependent. 1006 The instruction assumes that ``load_context_ptr`` and 1007 ``store_context_ptr`` are valid pointers to memory with said layout and 1008 alignment, and does not perform any checks on these pointers or the data 1009 stored there. 1010 1011 The instruction is experimental and only supported on x64 Linux at the 1012 moment. 1013 1014 When switching from a stack A to a stack B, one of the following cases 1015 must apply: 1016 1. Stack B was previously suspended using a ``stack_switch`` instruction. 1017 2. Stack B is a newly initialized stack. The necessary initialization is 1018 platform-dependent and will generally involve running some kind of 1019 trampoline to start execution of a function on the new stack. 1020 1021 In both cases, the ``in_payload`` argument of the ``stack_switch`` 1022 instruction executed on A is passed to stack B. In the first case above, 1023 it will be the result value of the earlier ``stack_switch`` instruction 1024 executed on stack B. In the second case, the value will be accessible to 1025 the trampoline in a platform-dependent register. 1026 1027 The pointers ``load_context_ptr`` and ``store_context_ptr`` are allowed 1028 to be equal; the instruction ensures that all data is loaded from the 1029 former before writing to the latter. 1030 1031 Stack switching is one-shot in the sense that each ``stack_switch`` 1032 operation effectively consumes the context identified by 1033 ``load_context_ptr``. In other words, performing two ``stack_switches`` 1034 using the same ``load_context_ptr`` causes undefined behavior, unless 1035 the context at ``load_context_ptr`` is overwritten by another 1036 `stack_switch` in between. 1037 "#, 1038 &formats.ternary, 1039 ) 1040 .operands_in(vec![ 1041 Operand::new("store_context_ptr", iAddr), 1042 Operand::new("load_context_ptr", iAddr), 1043 Operand::new("in_payload0", iAddr), 1044 ]) 1045 .operands_out(vec![Operand::new("out_payload0", iAddr)]) 1046 .other_side_effects() 1047 .can_load() 1048 .can_store() 1049 .call(), 1050 ); 1051 1052 let I16x8 = &TypeVar::new( 1053 "I16x8", 1054 "A SIMD vector with exactly 8 lanes of 16-bit values", 1055 TypeSetBuilder::new() 1056 .ints(16..16) 1057 .simd_lanes(8..8) 1058 .includes_scalars(false) 1059 .build(), 1060 ); 1061 1062 ig.push( 1063 Inst::new( 1064 "uload8x8", 1065 r#" 1066 Load an 8x8 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i16x8 1067 vector. 1068 "#, 1069 &formats.load, 1070 ) 1071 .operands_in(vec![ 1072 Operand::new("MemFlags", &imm.memflags), 1073 Operand::new("p", iAddr), 1074 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1075 ]) 1076 .operands_out(vec![Operand::new("a", I16x8).with_doc("Value loaded")]) 1077 .can_load(), 1078 ); 1079 1080 ig.push( 1081 Inst::new( 1082 "sload8x8", 1083 r#" 1084 Load an 8x8 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i16x8 1085 vector. 1086 "#, 1087 &formats.load, 1088 ) 1089 .operands_in(vec![ 1090 Operand::new("MemFlags", &imm.memflags), 1091 Operand::new("p", iAddr), 1092 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1093 ]) 1094 .operands_out(vec![Operand::new("a", I16x8).with_doc("Value loaded")]) 1095 .can_load(), 1096 ); 1097 1098 let I32x4 = &TypeVar::new( 1099 "I32x4", 1100 "A SIMD vector with exactly 4 lanes of 32-bit values", 1101 TypeSetBuilder::new() 1102 .ints(32..32) 1103 .simd_lanes(4..4) 1104 .includes_scalars(false) 1105 .build(), 1106 ); 1107 1108 ig.push( 1109 Inst::new( 1110 "uload16x4", 1111 r#" 1112 Load a 16x4 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i32x4 1113 vector. 1114 "#, 1115 &formats.load, 1116 ) 1117 .operands_in(vec![ 1118 Operand::new("MemFlags", &imm.memflags), 1119 Operand::new("p", iAddr), 1120 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1121 ]) 1122 .operands_out(vec![Operand::new("a", I32x4).with_doc("Value loaded")]) 1123 .can_load(), 1124 ); 1125 1126 ig.push( 1127 Inst::new( 1128 "sload16x4", 1129 r#" 1130 Load a 16x4 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i32x4 1131 vector. 1132 "#, 1133 &formats.load, 1134 ) 1135 .operands_in(vec![ 1136 Operand::new("MemFlags", &imm.memflags), 1137 Operand::new("p", iAddr), 1138 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1139 ]) 1140 .operands_out(vec![Operand::new("a", I32x4).with_doc("Value loaded")]) 1141 .can_load(), 1142 ); 1143 1144 let I64x2 = &TypeVar::new( 1145 "I64x2", 1146 "A SIMD vector with exactly 2 lanes of 64-bit values", 1147 TypeSetBuilder::new() 1148 .ints(64..64) 1149 .simd_lanes(2..2) 1150 .includes_scalars(false) 1151 .build(), 1152 ); 1153 1154 ig.push( 1155 Inst::new( 1156 "uload32x2", 1157 r#" 1158 Load an 32x2 vector (64 bits) from memory at ``p + Offset`` and zero-extend into an i64x2 1159 vector. 1160 "#, 1161 &formats.load, 1162 ) 1163 .operands_in(vec![ 1164 Operand::new("MemFlags", &imm.memflags), 1165 Operand::new("p", iAddr), 1166 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1167 ]) 1168 .operands_out(vec![Operand::new("a", I64x2).with_doc("Value loaded")]) 1169 .can_load(), 1170 ); 1171 1172 ig.push( 1173 Inst::new( 1174 "sload32x2", 1175 r#" 1176 Load a 32x2 vector (64 bits) from memory at ``p + Offset`` and sign-extend into an i64x2 1177 vector. 1178 "#, 1179 &formats.load, 1180 ) 1181 .operands_in(vec![ 1182 Operand::new("MemFlags", &imm.memflags), 1183 Operand::new("p", iAddr), 1184 Operand::new("Offset", &imm.offset32).with_doc("Byte offset from base address"), 1185 ]) 1186 .operands_out(vec![Operand::new("a", I64x2).with_doc("Value loaded")]) 1187 .can_load(), 1188 ); 1189 1190 ig.push( 1191 Inst::new( 1192 "stack_load", 1193 r#" 1194 Load a value from a stack slot at the constant offset. 1195 1196 This is a polymorphic instruction that can load any value type which 1197 has a memory representation. 1198 1199 The offset is an immediate constant, not an SSA value. The memory 1200 access cannot go out of bounds, i.e. 1201 `sizeof(a) + Offset <= sizeof(SS)`. 1202 "#, 1203 &formats.stack_load, 1204 ) 1205 .operands_in(vec![ 1206 Operand::new("SS", &entities.stack_slot), 1207 Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"), 1208 ]) 1209 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]) 1210 .can_load(), 1211 ); 1212 1213 ig.push( 1214 Inst::new( 1215 "stack_store", 1216 r#" 1217 Store a value to a stack slot at a constant offset. 1218 1219 This is a polymorphic instruction that can store any value type with a 1220 memory representation. 1221 1222 The offset is an immediate constant, not an SSA value. The memory 1223 access cannot go out of bounds, i.e. 1224 `sizeof(a) + Offset <= sizeof(SS)`. 1225 "#, 1226 &formats.stack_store, 1227 ) 1228 .operands_in(vec![ 1229 Operand::new("x", Mem).with_doc("Value to be stored"), 1230 Operand::new("SS", &entities.stack_slot), 1231 Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"), 1232 ]) 1233 .can_store(), 1234 ); 1235 1236 ig.push( 1237 Inst::new( 1238 "stack_addr", 1239 r#" 1240 Get the address of a stack slot. 1241 1242 Compute the absolute address of a byte in a stack slot. The offset must 1243 refer to a byte inside the stack slot: 1244 `0 <= Offset < sizeof(SS)`. 1245 "#, 1246 &formats.stack_load, 1247 ) 1248 .operands_in(vec![ 1249 Operand::new("SS", &entities.stack_slot), 1250 Operand::new("Offset", &imm.offset32).with_doc("In-bounds offset into stack slot"), 1251 ]) 1252 .operands_out(vec![Operand::new("addr", iAddr)]), 1253 ); 1254 1255 ig.push( 1256 Inst::new( 1257 "dynamic_stack_load", 1258 r#" 1259 Load a value from a dynamic stack slot. 1260 1261 This is a polymorphic instruction that can load any value type which 1262 has a memory representation. 1263 "#, 1264 &formats.dynamic_stack_load, 1265 ) 1266 .operands_in(vec![Operand::new("DSS", &entities.dynamic_stack_slot)]) 1267 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]) 1268 .can_load(), 1269 ); 1270 1271 ig.push( 1272 Inst::new( 1273 "dynamic_stack_store", 1274 r#" 1275 Store a value to a dynamic stack slot. 1276 1277 This is a polymorphic instruction that can store any dynamic value type with a 1278 memory representation. 1279 "#, 1280 &formats.dynamic_stack_store, 1281 ) 1282 .operands_in(vec![ 1283 Operand::new("x", Mem).with_doc("Value to be stored"), 1284 Operand::new("DSS", &entities.dynamic_stack_slot), 1285 ]) 1286 .can_store(), 1287 ); 1288 1289 ig.push( 1290 Inst::new( 1291 "dynamic_stack_addr", 1292 r#" 1293 Get the address of a dynamic stack slot. 1294 1295 Compute the absolute address of the first byte of a dynamic stack slot. 1296 "#, 1297 &formats.dynamic_stack_load, 1298 ) 1299 .operands_in(vec![Operand::new("DSS", &entities.dynamic_stack_slot)]) 1300 .operands_out(vec![Operand::new("addr", iAddr)]), 1301 ); 1302 1303 ig.push( 1304 Inst::new( 1305 "global_value", 1306 r#" 1307 Compute the value of global GV. 1308 "#, 1309 &formats.unary_global_value, 1310 ) 1311 .operands_in(vec![Operand::new("GV", &entities.global_value)]) 1312 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]), 1313 ); 1314 1315 ig.push( 1316 Inst::new( 1317 "symbol_value", 1318 r#" 1319 Compute the value of global GV, which is a symbolic value. 1320 "#, 1321 &formats.unary_global_value, 1322 ) 1323 .operands_in(vec![Operand::new("GV", &entities.global_value)]) 1324 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]), 1325 ); 1326 1327 ig.push( 1328 Inst::new( 1329 "tls_value", 1330 r#" 1331 Compute the value of global GV, which is a TLS (thread local storage) value. 1332 "#, 1333 &formats.unary_global_value, 1334 ) 1335 .operands_in(vec![Operand::new("GV", &entities.global_value)]) 1336 .operands_out(vec![Operand::new("a", Mem).with_doc("Value loaded")]), 1337 ); 1338 1339 // Note this instruction is marked as having other side-effects, so GVN won't try to hoist it, 1340 // which would result in it being subject to spilling. While not hoisting would generally hurt 1341 // performance, since a computed value used many times may need to be regenerated before each 1342 // use, it is not the case here: this instruction doesn't generate any code. That's because, 1343 // by definition the pinned register is never used by the register allocator, but is written to 1344 // and read explicitly and exclusively by set_pinned_reg and get_pinned_reg. 1345 ig.push( 1346 Inst::new( 1347 "get_pinned_reg", 1348 r#" 1349 Gets the content of the pinned register, when it's enabled. 1350 "#, 1351 &formats.nullary, 1352 ) 1353 .operands_out(vec![Operand::new("addr", iAddr)]) 1354 .other_side_effects(), 1355 ); 1356 1357 ig.push( 1358 Inst::new( 1359 "set_pinned_reg", 1360 r#" 1361 Sets the content of the pinned register, when it's enabled. 1362 "#, 1363 &formats.unary, 1364 ) 1365 .operands_in(vec![Operand::new("addr", iAddr)]) 1366 .other_side_effects(), 1367 ); 1368 1369 ig.push( 1370 Inst::new( 1371 "get_frame_pointer", 1372 r#" 1373 Get the address in the frame pointer register. 1374 1375 Usage of this instruction requires setting `preserve_frame_pointers` to `true`. 1376 "#, 1377 &formats.nullary, 1378 ) 1379 .operands_out(vec![Operand::new("addr", iAddr)]), 1380 ); 1381 1382 ig.push( 1383 Inst::new( 1384 "get_stack_pointer", 1385 r#" 1386 Get the address in the stack pointer register. 1387 "#, 1388 &formats.nullary, 1389 ) 1390 .operands_out(vec![Operand::new("addr", iAddr)]), 1391 ); 1392 1393 ig.push( 1394 Inst::new( 1395 "get_return_address", 1396 r#" 1397 Get the PC where this function will transfer control to when it returns. 1398 1399 Usage of this instruction requires setting `preserve_frame_pointers` to `true`. 1400 "#, 1401 &formats.nullary, 1402 ) 1403 .operands_out(vec![Operand::new("addr", iAddr)]), 1404 ); 1405 1406 ig.push( 1407 Inst::new( 1408 "get_exception_handler_address", 1409 r#" 1410 Get the handler PC for the given exceptional edge for an 1411 exception return from the given `try_call`-terminated block. 1412 1413 This instruction provides the PC for the handler resume point, 1414 as defined by the exception-handling aspect of the given 1415 callee ABI, for a return from the given calling block. It can 1416 be used when the exception unwind mechanism requires manual 1417 plumbing for this information which must be set up before the call 1418 itself: for example, if the resume address needs to be stored in 1419 some context structure for a runtime to resume to on error. 1420 1421 The given caller block must end in a `try_call` and the given 1422 exception-handling block must be one of its exceptional 1423 successors in the associated exception-handling table. The 1424 returned PC is *only* valid to resume to when the `try_call` 1425 is on the stack having called the callee; in other words, when 1426 a normal exception unwinder might otherwise resume to that 1427 handler. 1428 "#, 1429 &formats.exception_handler_address, 1430 ) 1431 .operands_in(vec![ 1432 Operand::new("block", &entities.raw_block), 1433 Operand::new("index", &imm.imm64), 1434 ]) 1435 .operands_out(vec![Operand::new("addr", iAddr)]), 1436 ); 1437 1438 ig.push( 1439 Inst::new( 1440 "iconst", 1441 r#" 1442 Integer constant. 1443 1444 Create a scalar integer SSA value with an immediate constant value, or 1445 an integer vector where all the lanes have the same value. 1446 "#, 1447 &formats.unary_imm, 1448 ) 1449 .operands_in(vec![Operand::new("N", &imm.imm64)]) 1450 .operands_out(vec![ 1451 Operand::new("a", NarrowInt).with_doc("A constant integer scalar or vector value"), 1452 ]), 1453 ); 1454 1455 ig.push( 1456 Inst::new( 1457 "f16const", 1458 r#" 1459 Floating point constant. 1460 1461 Create a `f16` SSA value with an immediate constant value. 1462 "#, 1463 &formats.unary_ieee16, 1464 ) 1465 .operands_in(vec![Operand::new("N", &imm.ieee16)]) 1466 .operands_out(vec![ 1467 Operand::new("a", f16_).with_doc("A constant f16 scalar value"), 1468 ]), 1469 ); 1470 1471 ig.push( 1472 Inst::new( 1473 "f32const", 1474 r#" 1475 Floating point constant. 1476 1477 Create a `f32` SSA value with an immediate constant value. 1478 "#, 1479 &formats.unary_ieee32, 1480 ) 1481 .operands_in(vec![Operand::new("N", &imm.ieee32)]) 1482 .operands_out(vec![ 1483 Operand::new("a", f32_).with_doc("A constant f32 scalar value"), 1484 ]), 1485 ); 1486 1487 ig.push( 1488 Inst::new( 1489 "f64const", 1490 r#" 1491 Floating point constant. 1492 1493 Create a `f64` SSA value with an immediate constant value. 1494 "#, 1495 &formats.unary_ieee64, 1496 ) 1497 .operands_in(vec![Operand::new("N", &imm.ieee64)]) 1498 .operands_out(vec![ 1499 Operand::new("a", f64_).with_doc("A constant f64 scalar value"), 1500 ]), 1501 ); 1502 1503 ig.push( 1504 Inst::new( 1505 "f128const", 1506 r#" 1507 Floating point constant. 1508 1509 Create a `f128` SSA value with an immediate constant value. 1510 "#, 1511 &formats.unary_const, 1512 ) 1513 .operands_in(vec![Operand::new("N", &entities.pool_constant)]) 1514 .operands_out(vec![ 1515 Operand::new("a", f128_).with_doc("A constant f128 scalar value"), 1516 ]), 1517 ); 1518 1519 ig.push( 1520 Inst::new( 1521 "vconst", 1522 r#" 1523 SIMD vector constant. 1524 1525 Construct a vector with the given immediate bytes. 1526 "#, 1527 &formats.unary_const, 1528 ) 1529 .operands_in(vec![ 1530 Operand::new("N", &entities.pool_constant) 1531 .with_doc("The 16 immediate bytes of a 128-bit vector"), 1532 ]) 1533 .operands_out(vec![ 1534 Operand::new("a", TxN).with_doc("A constant vector value"), 1535 ]), 1536 ); 1537 1538 let Tx16 = &TypeVar::new( 1539 "Tx16", 1540 "A SIMD vector with exactly 16 lanes of 8-bit values; eventually this may support other \ 1541 lane counts and widths", 1542 TypeSetBuilder::new() 1543 .ints(8..8) 1544 .simd_lanes(16..16) 1545 .includes_scalars(false) 1546 .build(), 1547 ); 1548 1549 ig.push( 1550 Inst::new( 1551 "shuffle", 1552 r#" 1553 SIMD vector shuffle. 1554 1555 Shuffle two vectors using the given immediate bytes. For each of the 16 bytes of the 1556 immediate, a value i of 0-15 selects the i-th element of the first vector and a value i of 1557 16-31 selects the (i-16)th element of the second vector. Immediate values outside of the 1558 0-31 range are not valid. 1559 "#, 1560 &formats.shuffle, 1561 ) 1562 .operands_in(vec![ 1563 Operand::new("a", Tx16).with_doc("A vector value"), 1564 Operand::new("b", Tx16).with_doc("A vector value"), 1565 Operand::new("mask", &entities.uimm128) 1566 .with_doc("The 16 immediate bytes used for selecting the elements to shuffle"), 1567 ]) 1568 .operands_out(vec![Operand::new("a", Tx16).with_doc("A vector value")]), 1569 ); 1570 1571 ig.push(Inst::new( 1572 "nop", 1573 r#" 1574 Just a dummy instruction. 1575 1576 Note: this doesn't compile to a machine code nop. 1577 "#, 1578 &formats.nullary, 1579 )); 1580 1581 ig.push( 1582 Inst::new( 1583 "select", 1584 r#" 1585 Conditional select. 1586 1587 This instruction selects whole values. Use `bitselect` to choose each 1588 bit according to a mask. 1589 "#, 1590 &formats.ternary, 1591 ) 1592 .operands_in(vec![ 1593 Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"), 1594 Operand::new("x", Any).with_doc("Value to use when `c` is true"), 1595 Operand::new("y", Any).with_doc("Value to use when `c` is false"), 1596 ]) 1597 .operands_out(vec![Operand::new("a", Any)]), 1598 ); 1599 1600 ig.push( 1601 Inst::new( 1602 "select_spectre_guard", 1603 r#" 1604 Conditional select intended for Spectre guards. 1605 1606 This operation is semantically equivalent to a select instruction. 1607 However, this instruction prohibits all speculation on the 1608 controlling value when determining which input to use as the result. 1609 As such, it is suitable for use in Spectre guards. 1610 1611 For example, on a target which may speculatively execute branches, 1612 the lowering of this instruction is guaranteed to not conditionally 1613 branch. Instead it will typically lower to a conditional move 1614 instruction. (No Spectre-vulnerable processors are known to perform 1615 value speculation on conditional move instructions.) 1616 1617 Ensure that the instruction you're trying to protect from Spectre 1618 attacks has a data dependency on the result of this instruction. 1619 That prevents an out-of-order CPU from evaluating that instruction 1620 until the result of this one is known, which in turn will be blocked 1621 until the controlling value is known. 1622 1623 Typical usage is to use a bounds-check as the controlling value, 1624 and select between either a null pointer if the bounds-check 1625 fails, or an in-bounds address otherwise, so that dereferencing 1626 the resulting address with a load or store instruction will trap if 1627 the bounds-check failed. When this instruction is used in this way, 1628 any microarchitectural side effects of the memory access will only 1629 occur after the bounds-check finishes, which ensures that no Spectre 1630 vulnerability will exist. 1631 1632 Optimization opportunities for this instruction are limited compared 1633 to a normal select instruction, but it is allowed to be replaced 1634 by other values which are functionally equivalent as long as doing 1635 so does not introduce any new opportunities to speculate on the 1636 controlling value. 1637 "#, 1638 &formats.ternary, 1639 ) 1640 .operands_in(vec![ 1641 Operand::new("c", ScalarTruthy).with_doc("Controlling value to test"), 1642 Operand::new("x", Any).with_doc("Value to use when `c` is true"), 1643 Operand::new("y", Any).with_doc("Value to use when `c` is false"), 1644 ]) 1645 .operands_out(vec![Operand::new("a", Any)]), 1646 ); 1647 1648 ig.push( 1649 Inst::new( 1650 "bitselect", 1651 r#" 1652 Conditional select of bits. 1653 1654 For each bit in `c`, this instruction selects the corresponding bit from `x` if the bit 1655 in `x` is 1 and the corresponding bit from `y` if the bit in `c` is 0. See also: 1656 `select`. 1657 "#, 1658 &formats.ternary, 1659 ) 1660 .operands_in(vec![ 1661 Operand::new("c", Any).with_doc("Controlling value to test"), 1662 Operand::new("x", Any).with_doc("Value to use when `c` is true"), 1663 Operand::new("y", Any).with_doc("Value to use when `c` is false"), 1664 ]) 1665 .operands_out(vec![Operand::new("a", Any)]), 1666 ); 1667 1668 ig.push( 1669 Inst::new( 1670 "blendv", 1671 r#" 1672 A bitselect-lookalike instruction except with the semantics of 1673 `blendv`-related instructions on x86. 1674 1675 This instruction will use the top bit of each lane in `c`, the condition 1676 mask. If the bit is 1 then the corresponding lane from `x` is chosen. 1677 Otherwise the corresponding lane from `y` is chosen. 1678 1679 "#, 1680 &formats.ternary, 1681 ) 1682 .operands_in(vec![ 1683 Operand::new("c", Any).with_doc("Controlling value to test"), 1684 Operand::new("x", Any).with_doc("Value to use when `c` is true"), 1685 Operand::new("y", Any).with_doc("Value to use when `c` is false"), 1686 ]) 1687 .operands_out(vec![Operand::new("a", Any)]), 1688 ); 1689 1690 ig.push( 1691 Inst::new( 1692 "vany_true", 1693 r#" 1694 Reduce a vector to a scalar boolean. 1695 1696 Return a scalar boolean true if any lane in ``a`` is non-zero, false otherwise. 1697 "#, 1698 &formats.unary, 1699 ) 1700 .operands_in(vec![Operand::new("a", TxN)]) 1701 .operands_out(vec![Operand::new("s", i8)]), 1702 ); 1703 1704 ig.push( 1705 Inst::new( 1706 "vall_true", 1707 r#" 1708 Reduce a vector to a scalar boolean. 1709 1710 Return a scalar boolean true if all lanes in ``i`` are non-zero, false otherwise. 1711 "#, 1712 &formats.unary, 1713 ) 1714 .operands_in(vec![Operand::new("a", TxN)]) 1715 .operands_out(vec![Operand::new("s", i8)]), 1716 ); 1717 1718 ig.push( 1719 Inst::new( 1720 "vhigh_bits", 1721 r#" 1722 Reduce a vector to a scalar integer. 1723 1724 Return a scalar integer, consisting of the concatenation of the most significant bit 1725 of each lane of ``a``. 1726 "#, 1727 &formats.unary, 1728 ) 1729 .operands_in(vec![Operand::new("a", TxN)]) 1730 .operands_out(vec![Operand::new("x", NarrowInt)]), 1731 ); 1732 1733 ig.push( 1734 Inst::new( 1735 "icmp", 1736 r#" 1737 Integer comparison. 1738 1739 The condition code determines if the operands are interpreted as signed 1740 or unsigned integers. 1741 1742 | Signed | Unsigned | Condition | 1743 |--------|----------|-----------------------| 1744 | eq | eq | Equal | 1745 | ne | ne | Not equal | 1746 | slt | ult | Less than | 1747 | sge | uge | Greater than or equal | 1748 | sgt | ugt | Greater than | 1749 | sle | ule | Less than or equal | 1750 1751 When this instruction compares integer vectors, it returns a vector of 1752 lane-wise comparisons. 1753 1754 When comparing scalars, the result is: 1755 - `1` if the condition holds. 1756 - `0` if the condition does not hold. 1757 1758 When comparing vectors, the result is: 1759 - `-1` (i.e. all ones) in each lane where the condition holds. 1760 - `0` in each lane where the condition does not hold. 1761 "#, 1762 &formats.int_compare, 1763 ) 1764 .operands_in(vec![ 1765 Operand::new("Cond", &imm.intcc), 1766 Operand::new("x", Int), 1767 Operand::new("y", Int), 1768 ]) 1769 .operands_out(vec![Operand::new("a", &Int.as_truthy())]), 1770 ); 1771 1772 ig.push( 1773 Inst::new( 1774 "icmp_imm", 1775 r#" 1776 Compare scalar integer to a constant. 1777 1778 This is the same as the `icmp` instruction, except one operand is 1779 a sign extended 64 bit immediate constant. 1780 1781 This instruction can only compare scalars. Use `icmp` for 1782 lane-wise vector comparisons. 1783 "#, 1784 &formats.int_compare_imm, 1785 ) 1786 .operands_in(vec![ 1787 Operand::new("Cond", &imm.intcc), 1788 Operand::new("x", iB), 1789 Operand::new("Y", &imm.imm64), 1790 ]) 1791 .operands_out(vec![Operand::new("a", i8)]), 1792 ); 1793 1794 ig.push( 1795 Inst::new( 1796 "iadd", 1797 r#" 1798 Wrapping integer addition: `a := x + y \pmod{2^B}`. 1799 1800 This instruction does not depend on the signed/unsigned interpretation 1801 of the operands. 1802 "#, 1803 &formats.binary, 1804 ) 1805 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 1806 .operands_out(vec![Operand::new("a", Int)]), 1807 ); 1808 1809 ig.push( 1810 Inst::new( 1811 "isub", 1812 r#" 1813 Wrapping integer subtraction: `a := x - y \pmod{2^B}`. 1814 1815 This instruction does not depend on the signed/unsigned interpretation 1816 of the operands. 1817 "#, 1818 &formats.binary, 1819 ) 1820 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 1821 .operands_out(vec![Operand::new("a", Int)]), 1822 ); 1823 1824 ig.push( 1825 Inst::new( 1826 "ineg", 1827 r#" 1828 Integer negation: `a := -x \pmod{2^B}`. 1829 "#, 1830 &formats.unary, 1831 ) 1832 .operands_in(vec![Operand::new("x", Int)]) 1833 .operands_out(vec![Operand::new("a", Int)]), 1834 ); 1835 1836 ig.push( 1837 Inst::new( 1838 "iabs", 1839 r#" 1840 Integer absolute value with wrapping: `a := |x|`. 1841 "#, 1842 &formats.unary, 1843 ) 1844 .operands_in(vec![Operand::new("x", Int)]) 1845 .operands_out(vec![Operand::new("a", Int)]), 1846 ); 1847 1848 ig.push( 1849 Inst::new( 1850 "imul", 1851 r#" 1852 Wrapping integer multiplication: `a := x y \pmod{2^B}`. 1853 1854 This instruction does not depend on the signed/unsigned interpretation 1855 of the operands. 1856 1857 Polymorphic over all integer types (vector and scalar). 1858 "#, 1859 &formats.binary, 1860 ) 1861 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 1862 .operands_out(vec![Operand::new("a", Int)]), 1863 ); 1864 1865 ig.push( 1866 Inst::new( 1867 "umulhi", 1868 r#" 1869 Unsigned integer multiplication, producing the high half of a 1870 double-length result. 1871 1872 Polymorphic over all integer types (vector and scalar). 1873 "#, 1874 &formats.binary, 1875 ) 1876 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 1877 .operands_out(vec![Operand::new("a", Int)]), 1878 ); 1879 1880 ig.push( 1881 Inst::new( 1882 "smulhi", 1883 r#" 1884 Signed integer multiplication, producing the high half of a 1885 double-length result. 1886 1887 Polymorphic over all integer types (vector and scalar). 1888 "#, 1889 &formats.binary, 1890 ) 1891 .operands_in(vec![Operand::new("x", Int), Operand::new("y", Int)]) 1892 .operands_out(vec![Operand::new("a", Int)]), 1893 ); 1894 1895 let I16or32 = &TypeVar::new( 1896 "I16or32", 1897 "A vector integer type with 16- or 32-bit numbers", 1898 TypeSetBuilder::new().ints(16..32).simd_lanes(4..8).build(), 1899 ); 1900 1901 ig.push( 1902 Inst::new( 1903 "sqmul_round_sat", 1904 r#" 1905 Fixed-point multiplication of numbers in the QN format, where N + 1 1906 is the number bitwidth: 1907 `a := signed_saturate((x * y + (1 << (Q - 1))) >> Q)` 1908 1909 Polymorphic over all integer vector types with 16- or 32-bit numbers. 1910 "#, 1911 &formats.binary, 1912 ) 1913 .operands_in(vec![Operand::new("x", I16or32), Operand::new("y", I16or32)]) 1914 .operands_out(vec![Operand::new("a", I16or32)]), 1915 ); 1916 1917 ig.push( 1918 Inst::new( 1919 "x86_pmulhrsw", 1920 r#" 1921 A similar instruction to `sqmul_round_sat` except with the semantics 1922 of x86's `pmulhrsw` instruction. 1923 1924 This is the same as `sqmul_round_sat` except when both input lanes are 1925 `i16::MIN`. 1926 "#, 1927 &formats.binary, 1928 ) 1929 .operands_in(vec![Operand::new("x", I16or32), Operand::new("y", I16or32)]) 1930 .operands_out(vec![Operand::new("a", I16or32)]), 1931 ); 1932 1933 // Integer division and remainder are scalar-only; most 1934 // hardware does not directly support vector integer division. 1935 1936 ig.push( 1937 Inst::new( 1938 "udiv", 1939 r#" 1940 Unsigned integer division: `a := \lfloor {x \over y} \rfloor`. 1941 1942 This operation traps if the divisor is zero. 1943 "#, 1944 &formats.binary, 1945 ) 1946 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 1947 .operands_out(vec![Operand::new("a", iB)]) 1948 .can_trap() 1949 .side_effects_idempotent(), 1950 ); 1951 1952 ig.push( 1953 Inst::new( 1954 "sdiv", 1955 r#" 1956 Signed integer division rounded toward zero: `a := sign(xy) 1957 \lfloor {|x| \over |y|}\rfloor`. 1958 1959 This operation traps if the divisor is zero, or if the result is not 1960 representable in `B` bits two's complement. This only happens 1961 when `x = -2^{B-1}, y = -1`. 1962 "#, 1963 &formats.binary, 1964 ) 1965 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 1966 .operands_out(vec![Operand::new("a", iB)]) 1967 .can_trap() 1968 .side_effects_idempotent(), 1969 ); 1970 1971 ig.push( 1972 Inst::new( 1973 "urem", 1974 r#" 1975 Unsigned integer remainder. 1976 1977 This operation traps if the divisor is zero. 1978 "#, 1979 &formats.binary, 1980 ) 1981 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 1982 .operands_out(vec![Operand::new("a", iB)]) 1983 .can_trap() 1984 .side_effects_idempotent(), 1985 ); 1986 1987 ig.push( 1988 Inst::new( 1989 "srem", 1990 r#" 1991 Signed integer remainder. The result has the sign of the dividend. 1992 1993 This operation traps if the divisor is zero. 1994 "#, 1995 &formats.binary, 1996 ) 1997 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 1998 .operands_out(vec![Operand::new("a", iB)]) 1999 .can_trap() 2000 .side_effects_idempotent(), 2001 ); 2002 2003 ig.push( 2004 Inst::new( 2005 "iadd_imm", 2006 r#" 2007 Add immediate integer. 2008 2009 Same as `iadd`, but one operand is a sign extended 64 bit immediate constant. 2010 2011 Polymorphic over all scalar integer types, but does not support vector 2012 types. 2013 "#, 2014 &formats.binary_imm64, 2015 ) 2016 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2017 .operands_out(vec![Operand::new("a", iB)]), 2018 ); 2019 2020 ig.push( 2021 Inst::new( 2022 "imul_imm", 2023 r#" 2024 Integer multiplication by immediate constant. 2025 2026 Same as `imul`, but one operand is a sign extended 64 bit immediate constant. 2027 2028 Polymorphic over all scalar integer types, but does not support vector 2029 types. 2030 "#, 2031 &formats.binary_imm64, 2032 ) 2033 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2034 .operands_out(vec![Operand::new("a", iB)]), 2035 ); 2036 2037 ig.push( 2038 Inst::new( 2039 "udiv_imm", 2040 r#" 2041 Unsigned integer division by an immediate constant. 2042 2043 Same as `udiv`, but one operand is a zero extended 64 bit immediate constant. 2044 2045 This operation traps if the divisor is zero. 2046 "#, 2047 &formats.binary_imm64, 2048 ) 2049 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2050 .operands_out(vec![Operand::new("a", iB)]), 2051 ); 2052 2053 ig.push( 2054 Inst::new( 2055 "sdiv_imm", 2056 r#" 2057 Signed integer division by an immediate constant. 2058 2059 Same as `sdiv`, but one operand is a sign extended 64 bit immediate constant. 2060 2061 This operation traps if the divisor is zero, or if the result is not 2062 representable in `B` bits two's complement. This only happens 2063 when `x = -2^{B-1}, Y = -1`. 2064 "#, 2065 &formats.binary_imm64, 2066 ) 2067 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2068 .operands_out(vec![Operand::new("a", iB)]), 2069 ); 2070 2071 ig.push( 2072 Inst::new( 2073 "urem_imm", 2074 r#" 2075 Unsigned integer remainder with immediate divisor. 2076 2077 Same as `urem`, but one operand is a zero extended 64 bit immediate constant. 2078 2079 This operation traps if the divisor is zero. 2080 "#, 2081 &formats.binary_imm64, 2082 ) 2083 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2084 .operands_out(vec![Operand::new("a", iB)]), 2085 ); 2086 2087 ig.push( 2088 Inst::new( 2089 "srem_imm", 2090 r#" 2091 Signed integer remainder with immediate divisor. 2092 2093 Same as `srem`, but one operand is a sign extended 64 bit immediate constant. 2094 2095 This operation traps if the divisor is zero. 2096 "#, 2097 &formats.binary_imm64, 2098 ) 2099 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2100 .operands_out(vec![Operand::new("a", iB)]), 2101 ); 2102 2103 ig.push( 2104 Inst::new( 2105 "irsub_imm", 2106 r#" 2107 Immediate reverse wrapping subtraction: `a := Y - x \pmod{2^B}`. 2108 2109 The immediate operand is a sign extended 64 bit constant. 2110 2111 Also works as integer negation when `Y = 0`. Use `iadd_imm` 2112 with a negative immediate operand for the reverse immediate 2113 subtraction. 2114 2115 Polymorphic over all scalar integer types, but does not support vector 2116 types. 2117 "#, 2118 &formats.binary_imm64, 2119 ) 2120 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2121 .operands_out(vec![Operand::new("a", iB)]), 2122 ); 2123 2124 ig.push( 2125 Inst::new( 2126 "sadd_overflow_cin", 2127 r#" 2128 Add signed integers with carry in and overflow out. 2129 2130 Same as `sadd_overflow` with an additional carry input. The `c_in` type 2131 is interpreted as 1 if it's nonzero or 0 if it's zero. 2132 "#, 2133 &formats.ternary, 2134 ) 2135 .operands_in(vec![ 2136 Operand::new("x", iB), 2137 Operand::new("y", iB), 2138 Operand::new("c_in", i8).with_doc("Input carry flag"), 2139 ]) 2140 .operands_out(vec![ 2141 Operand::new("a", iB), 2142 Operand::new("c_out", i8).with_doc("Output carry flag"), 2143 ]), 2144 ); 2145 2146 ig.push( 2147 Inst::new( 2148 "uadd_overflow_cin", 2149 r#" 2150 Add unsigned integers with carry in and overflow out. 2151 2152 Same as `uadd_overflow` with an additional carry input. The `c_in` type 2153 is interpreted as 1 if it's nonzero or 0 if it's zero. 2154 "#, 2155 &formats.ternary, 2156 ) 2157 .operands_in(vec![ 2158 Operand::new("x", iB), 2159 Operand::new("y", iB), 2160 Operand::new("c_in", i8).with_doc("Input carry flag"), 2161 ]) 2162 .operands_out(vec![ 2163 Operand::new("a", iB), 2164 Operand::new("c_out", i8).with_doc("Output carry flag"), 2165 ]), 2166 ); 2167 2168 { 2169 let of_out = Operand::new("of", i8).with_doc("Overflow flag"); 2170 ig.push( 2171 Inst::new( 2172 "uadd_overflow", 2173 r#" 2174 Add integers unsigned with overflow out. 2175 ``of`` is set when the addition overflowed. 2176 ```text 2177 a &= x + y \pmod 2^B \\ 2178 of &= x+y >= 2^B 2179 ``` 2180 Polymorphic over all scalar integer types, but does not support vector 2181 types. 2182 "#, 2183 &formats.binary, 2184 ) 2185 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 2186 .operands_out(vec![Operand::new("a", iB), of_out.clone()]), 2187 ); 2188 2189 ig.push( 2190 Inst::new( 2191 "sadd_overflow", 2192 r#" 2193 Add integers signed with overflow out. 2194 ``of`` is set when the addition over- or underflowed. 2195 Polymorphic over all scalar integer types, but does not support vector 2196 types. 2197 "#, 2198 &formats.binary, 2199 ) 2200 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 2201 .operands_out(vec![Operand::new("a", iB), of_out.clone()]), 2202 ); 2203 2204 ig.push( 2205 Inst::new( 2206 "usub_overflow", 2207 r#" 2208 Subtract integers unsigned with overflow out. 2209 ``of`` is set when the subtraction underflowed. 2210 ```text 2211 a &= x - y \pmod 2^B \\ 2212 of &= x - y < 0 2213 ``` 2214 Polymorphic over all scalar integer types, but does not support vector 2215 types. 2216 "#, 2217 &formats.binary, 2218 ) 2219 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 2220 .operands_out(vec![Operand::new("a", iB), of_out.clone()]), 2221 ); 2222 2223 ig.push( 2224 Inst::new( 2225 "ssub_overflow", 2226 r#" 2227 Subtract integers signed with overflow out. 2228 ``of`` is set when the subtraction over- or underflowed. 2229 Polymorphic over all scalar integer types, but does not support vector 2230 types. 2231 "#, 2232 &formats.binary, 2233 ) 2234 .operands_in(vec![Operand::new("x", iB), Operand::new("y", iB)]) 2235 .operands_out(vec![Operand::new("a", iB), of_out.clone()]), 2236 ); 2237 2238 { 2239 let NarrowScalar = &TypeVar::new( 2240 "NarrowScalar", 2241 "A scalar integer type up to 64 bits", 2242 TypeSetBuilder::new().ints(8..64).build(), 2243 ); 2244 2245 ig.push( 2246 Inst::new( 2247 "umul_overflow", 2248 r#" 2249 Multiply integers unsigned with overflow out. 2250 ``of`` is set when the multiplication overflowed. 2251 ```text 2252 a &= x * y \pmod 2^B \\ 2253 of &= x * y > 2^B 2254 ``` 2255 Polymorphic over all scalar integer types except i128, but does not support vector 2256 types. 2257 "#, 2258 &formats.binary, 2259 ) 2260 .operands_in(vec![ 2261 Operand::new("x", NarrowScalar), 2262 Operand::new("y", NarrowScalar), 2263 ]) 2264 .operands_out(vec![Operand::new("a", NarrowScalar), of_out.clone()]), 2265 ); 2266 2267 ig.push( 2268 Inst::new( 2269 "smul_overflow", 2270 r#" 2271 Multiply integers signed with overflow out. 2272 ``of`` is set when the multiplication over- or underflowed. 2273 Polymorphic over all scalar integer types except i128, but does not support vector 2274 types. 2275 "#, 2276 &formats.binary, 2277 ) 2278 .operands_in(vec![ 2279 Operand::new("x", NarrowScalar), 2280 Operand::new("y", NarrowScalar), 2281 ]) 2282 .operands_out(vec![Operand::new("a", NarrowScalar), of_out.clone()]), 2283 ); 2284 } 2285 } 2286 2287 let i32_64 = &TypeVar::new( 2288 "i32_64", 2289 "A 32 or 64-bit scalar integer type", 2290 TypeSetBuilder::new().ints(32..64).build(), 2291 ); 2292 2293 ig.push( 2294 Inst::new( 2295 "uadd_overflow_trap", 2296 r#" 2297 Unsigned addition of x and y, trapping if the result overflows. 2298 2299 Accepts 32 or 64-bit integers, and does not support vector types. 2300 "#, 2301 &formats.int_add_trap, 2302 ) 2303 .operands_in(vec![ 2304 Operand::new("x", i32_64), 2305 Operand::new("y", i32_64), 2306 Operand::new("code", &imm.trapcode), 2307 ]) 2308 .operands_out(vec![Operand::new("a", i32_64)]) 2309 .can_trap() 2310 .side_effects_idempotent(), 2311 ); 2312 2313 ig.push( 2314 Inst::new( 2315 "ssub_overflow_bin", 2316 r#" 2317 Subtract signed integers with borrow in and overflow out. 2318 2319 Same as `ssub_overflow` with an additional borrow input. The `b_in` type 2320 is interpreted as 1 if it's nonzero or 0 if it's zero. The computation 2321 performed here is `x - (y + (b_in != 0))`. 2322 "#, 2323 &formats.ternary, 2324 ) 2325 .operands_in(vec![ 2326 Operand::new("x", iB), 2327 Operand::new("y", iB), 2328 Operand::new("b_in", i8).with_doc("Input borrow flag"), 2329 ]) 2330 .operands_out(vec![ 2331 Operand::new("a", iB), 2332 Operand::new("b_out", i8).with_doc("Output borrow flag"), 2333 ]), 2334 ); 2335 2336 ig.push( 2337 Inst::new( 2338 "usub_overflow_bin", 2339 r#" 2340 Subtract unsigned integers with borrow in and overflow out. 2341 2342 Same as `usub_overflow` with an additional borrow input. The `b_in` type 2343 is interpreted as 1 if it's nonzero or 0 if it's zero. The computation 2344 performed here is `x - (y + (b_in != 0))`. 2345 "#, 2346 &formats.ternary, 2347 ) 2348 .operands_in(vec![ 2349 Operand::new("x", iB), 2350 Operand::new("y", iB), 2351 Operand::new("b_in", i8).with_doc("Input borrow flag"), 2352 ]) 2353 .operands_out(vec![ 2354 Operand::new("a", iB), 2355 Operand::new("b_out", i8).with_doc("Output borrow flag"), 2356 ]), 2357 ); 2358 2359 let bits = &TypeVar::new( 2360 "bits", 2361 "Any integer, float, or vector type", 2362 TypeSetBuilder::new() 2363 .ints(Interval::All) 2364 .floats(Interval::All) 2365 .simd_lanes(Interval::All) 2366 .includes_scalars(true) 2367 .build(), 2368 ); 2369 2370 ig.push( 2371 Inst::new( 2372 "band", 2373 r#" 2374 Bitwise and. 2375 "#, 2376 &formats.binary, 2377 ) 2378 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2379 .operands_out(vec![Operand::new("a", bits)]), 2380 ); 2381 2382 ig.push( 2383 Inst::new( 2384 "bor", 2385 r#" 2386 Bitwise or. 2387 "#, 2388 &formats.binary, 2389 ) 2390 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2391 .operands_out(vec![Operand::new("a", bits)]), 2392 ); 2393 2394 ig.push( 2395 Inst::new( 2396 "bxor", 2397 r#" 2398 Bitwise xor. 2399 "#, 2400 &formats.binary, 2401 ) 2402 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2403 .operands_out(vec![Operand::new("a", bits)]), 2404 ); 2405 2406 ig.push( 2407 Inst::new( 2408 "bnot", 2409 r#" 2410 Bitwise not. 2411 "#, 2412 &formats.unary, 2413 ) 2414 .operands_in(vec![Operand::new("x", bits)]) 2415 .operands_out(vec![Operand::new("a", bits)]), 2416 ); 2417 2418 ig.push( 2419 Inst::new( 2420 "band_not", 2421 r#" 2422 Bitwise and not. 2423 2424 Computes `x & ~y`. 2425 "#, 2426 &formats.binary, 2427 ) 2428 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2429 .operands_out(vec![Operand::new("a", bits)]), 2430 ); 2431 2432 ig.push( 2433 Inst::new( 2434 "bor_not", 2435 r#" 2436 Bitwise or not. 2437 2438 Computes `x | ~y`. 2439 "#, 2440 &formats.binary, 2441 ) 2442 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2443 .operands_out(vec![Operand::new("a", bits)]), 2444 ); 2445 2446 ig.push( 2447 Inst::new( 2448 "bxor_not", 2449 r#" 2450 Bitwise xor not. 2451 2452 Computes `x ^ ~y`. 2453 "#, 2454 &formats.binary, 2455 ) 2456 .operands_in(vec![Operand::new("x", bits), Operand::new("y", bits)]) 2457 .operands_out(vec![Operand::new("a", bits)]), 2458 ); 2459 2460 ig.push( 2461 Inst::new( 2462 "band_imm", 2463 r#" 2464 Bitwise and with immediate. 2465 2466 Same as `band`, but one operand is a zero extended 64 bit immediate constant. 2467 2468 Polymorphic over all scalar integer types, but does not support vector 2469 types. 2470 "#, 2471 &formats.binary_imm64, 2472 ) 2473 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2474 .operands_out(vec![Operand::new("a", iB)]), 2475 ); 2476 2477 ig.push( 2478 Inst::new( 2479 "bor_imm", 2480 r#" 2481 Bitwise or with immediate. 2482 2483 Same as `bor`, but one operand is a zero extended 64 bit immediate constant. 2484 2485 Polymorphic over all scalar integer types, but does not support vector 2486 types. 2487 "#, 2488 &formats.binary_imm64, 2489 ) 2490 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2491 .operands_out(vec![Operand::new("a", iB)]), 2492 ); 2493 2494 ig.push( 2495 Inst::new( 2496 "bxor_imm", 2497 r#" 2498 Bitwise xor with immediate. 2499 2500 Same as `bxor`, but one operand is a zero extended 64 bit immediate constant. 2501 2502 Polymorphic over all scalar integer types, but does not support vector 2503 types. 2504 "#, 2505 &formats.binary_imm64, 2506 ) 2507 .operands_in(vec![Operand::new("x", iB), Operand::new("Y", &imm.imm64)]) 2508 .operands_out(vec![Operand::new("a", iB)]), 2509 ); 2510 2511 ig.push( 2512 Inst::new( 2513 "rotl", 2514 r#" 2515 Rotate left. 2516 2517 Rotate the bits in ``x`` by ``y`` places. 2518 "#, 2519 &formats.binary, 2520 ) 2521 .operands_in(vec![ 2522 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2523 Operand::new("y", iB).with_doc("Number of bits to shift"), 2524 ]) 2525 .operands_out(vec![Operand::new("a", Int)]), 2526 ); 2527 2528 ig.push( 2529 Inst::new( 2530 "rotr", 2531 r#" 2532 Rotate right. 2533 2534 Rotate the bits in ``x`` by ``y`` places. 2535 "#, 2536 &formats.binary, 2537 ) 2538 .operands_in(vec![ 2539 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2540 Operand::new("y", iB).with_doc("Number of bits to shift"), 2541 ]) 2542 .operands_out(vec![Operand::new("a", Int)]), 2543 ); 2544 2545 ig.push( 2546 Inst::new( 2547 "rotl_imm", 2548 r#" 2549 Rotate left by immediate. 2550 2551 Same as `rotl`, but one operand is a zero extended 64 bit immediate constant. 2552 "#, 2553 &formats.binary_imm64, 2554 ) 2555 .operands_in(vec![ 2556 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2557 Operand::new("Y", &imm.imm64), 2558 ]) 2559 .operands_out(vec![Operand::new("a", Int)]), 2560 ); 2561 2562 ig.push( 2563 Inst::new( 2564 "rotr_imm", 2565 r#" 2566 Rotate right by immediate. 2567 2568 Same as `rotr`, but one operand is a zero extended 64 bit immediate constant. 2569 "#, 2570 &formats.binary_imm64, 2571 ) 2572 .operands_in(vec![ 2573 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2574 Operand::new("Y", &imm.imm64), 2575 ]) 2576 .operands_out(vec![Operand::new("a", Int)]), 2577 ); 2578 2579 ig.push( 2580 Inst::new( 2581 "ishl", 2582 r#" 2583 Integer shift left. Shift the bits in ``x`` towards the MSB by ``y`` 2584 places. Shift in zero bits to the LSB. 2585 2586 The shift amount is masked to the size of ``x``. 2587 2588 When shifting a B-bits integer type, this instruction computes: 2589 2590 ```text 2591 s &:= y \pmod B, 2592 a &:= x \cdot 2^s \pmod{2^B}. 2593 ``` 2594 "#, 2595 &formats.binary, 2596 ) 2597 .operands_in(vec![ 2598 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2599 Operand::new("y", iB).with_doc("Number of bits to shift"), 2600 ]) 2601 .operands_out(vec![Operand::new("a", Int)]), 2602 ); 2603 2604 ig.push( 2605 Inst::new( 2606 "ushr", 2607 r#" 2608 Unsigned shift right. Shift bits in ``x`` towards the LSB by ``y`` 2609 places, shifting in zero bits to the MSB. Also called a *logical 2610 shift*. 2611 2612 The shift amount is masked to the size of ``x``. 2613 2614 When shifting a B-bits integer type, this instruction computes: 2615 2616 ```text 2617 s &:= y \pmod B, 2618 a &:= \lfloor x \cdot 2^{-s} \rfloor. 2619 ``` 2620 "#, 2621 &formats.binary, 2622 ) 2623 .operands_in(vec![ 2624 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2625 Operand::new("y", iB).with_doc("Number of bits to shift"), 2626 ]) 2627 .operands_out(vec![Operand::new("a", Int)]), 2628 ); 2629 2630 ig.push( 2631 Inst::new( 2632 "sshr", 2633 r#" 2634 Signed shift right. Shift bits in ``x`` towards the LSB by ``y`` 2635 places, shifting in sign bits to the MSB. Also called an *arithmetic 2636 shift*. 2637 2638 The shift amount is masked to the size of ``x``. 2639 "#, 2640 &formats.binary, 2641 ) 2642 .operands_in(vec![ 2643 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2644 Operand::new("y", iB).with_doc("Number of bits to shift"), 2645 ]) 2646 .operands_out(vec![Operand::new("a", Int)]), 2647 ); 2648 2649 ig.push( 2650 Inst::new( 2651 "ishl_imm", 2652 r#" 2653 Integer shift left by immediate. 2654 2655 The shift amount is masked to the size of ``x``. 2656 "#, 2657 &formats.binary_imm64, 2658 ) 2659 .operands_in(vec![ 2660 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2661 Operand::new("Y", &imm.imm64), 2662 ]) 2663 .operands_out(vec![Operand::new("a", Int)]), 2664 ); 2665 2666 ig.push( 2667 Inst::new( 2668 "ushr_imm", 2669 r#" 2670 Unsigned shift right by immediate. 2671 2672 The shift amount is masked to the size of ``x``. 2673 "#, 2674 &formats.binary_imm64, 2675 ) 2676 .operands_in(vec![ 2677 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2678 Operand::new("Y", &imm.imm64), 2679 ]) 2680 .operands_out(vec![Operand::new("a", Int)]), 2681 ); 2682 2683 ig.push( 2684 Inst::new( 2685 "sshr_imm", 2686 r#" 2687 Signed shift right by immediate. 2688 2689 The shift amount is masked to the size of ``x``. 2690 "#, 2691 &formats.binary_imm64, 2692 ) 2693 .operands_in(vec![ 2694 Operand::new("x", Int).with_doc("Scalar or vector value to shift"), 2695 Operand::new("Y", &imm.imm64), 2696 ]) 2697 .operands_out(vec![Operand::new("a", Int)]), 2698 ); 2699 2700 ig.push( 2701 Inst::new( 2702 "bitrev", 2703 r#" 2704 Reverse the bits of a integer. 2705 2706 Reverses the bits in ``x``. 2707 "#, 2708 &formats.unary, 2709 ) 2710 .operands_in(vec![Operand::new("x", iB)]) 2711 .operands_out(vec![Operand::new("a", iB)]), 2712 ); 2713 2714 ig.push( 2715 Inst::new( 2716 "clz", 2717 r#" 2718 Count leading zero bits. 2719 2720 Starting from the MSB in ``x``, count the number of zero bits before 2721 reaching the first one bit. When ``x`` is zero, returns the size of x 2722 in bits. 2723 "#, 2724 &formats.unary, 2725 ) 2726 .operands_in(vec![Operand::new("x", iB)]) 2727 .operands_out(vec![Operand::new("a", iB)]), 2728 ); 2729 2730 ig.push( 2731 Inst::new( 2732 "cls", 2733 r#" 2734 Count leading sign bits. 2735 2736 Starting from the MSB after the sign bit in ``x``, count the number of 2737 consecutive bits identical to the sign bit. When ``x`` is 0 or -1, 2738 returns one less than the size of x in bits. 2739 "#, 2740 &formats.unary, 2741 ) 2742 .operands_in(vec![Operand::new("x", iB)]) 2743 .operands_out(vec![Operand::new("a", iB)]), 2744 ); 2745 2746 ig.push( 2747 Inst::new( 2748 "ctz", 2749 r#" 2750 Count trailing zeros. 2751 2752 Starting from the LSB in ``x``, count the number of zero bits before 2753 reaching the first one bit. When ``x`` is zero, returns the size of x 2754 in bits. 2755 "#, 2756 &formats.unary, 2757 ) 2758 .operands_in(vec![Operand::new("x", iB)]) 2759 .operands_out(vec![Operand::new("a", iB)]), 2760 ); 2761 2762 ig.push( 2763 Inst::new( 2764 "bswap", 2765 r#" 2766 Reverse the byte order of an integer. 2767 2768 Reverses the bytes in ``x``. 2769 "#, 2770 &formats.unary, 2771 ) 2772 .operands_in(vec![Operand::new("x", iSwappable)]) 2773 .operands_out(vec![Operand::new("a", iSwappable)]), 2774 ); 2775 2776 ig.push( 2777 Inst::new( 2778 "popcnt", 2779 r#" 2780 Population count 2781 2782 Count the number of one bits in ``x``. 2783 "#, 2784 &formats.unary, 2785 ) 2786 .operands_in(vec![Operand::new("x", Int)]) 2787 .operands_out(vec![Operand::new("a", Int)]), 2788 ); 2789 2790 let Float = &TypeVar::new( 2791 "Float", 2792 "A scalar or vector floating point number", 2793 TypeSetBuilder::new() 2794 .floats(Interval::All) 2795 .simd_lanes(Interval::All) 2796 .dynamic_simd_lanes(Interval::All) 2797 .build(), 2798 ); 2799 2800 ig.push( 2801 Inst::new( 2802 "fcmp", 2803 r#" 2804 Floating point comparison. 2805 2806 Two IEEE 754-2008 floating point numbers, `x` and `y`, relate to each 2807 other in exactly one of four ways: 2808 2809 ```text 2810 == ========================================== 2811 UN Unordered when one or both numbers is NaN. 2812 EQ When `x = y`. (And `0.0 = -0.0`). 2813 LT When `x < y`. 2814 GT When `x > y`. 2815 == ========================================== 2816 ``` 2817 2818 The 14 `floatcc` condition codes each correspond to a subset of 2819 the four relations, except for the empty set which would always be 2820 false, and the full set which would always be true. 2821 2822 The condition codes are divided into 7 'ordered' conditions which don't 2823 include UN, and 7 unordered conditions which all include UN. 2824 2825 ```text 2826 +-------+------------+---------+------------+-------------------------+ 2827 |Ordered |Unordered |Condition | 2828 +=======+============+=========+============+=========================+ 2829 |ord |EQ | LT | GT|uno |UN |NaNs absent / present. | 2830 +-------+------------+---------+------------+-------------------------+ 2831 |eq |EQ |ueq |UN | EQ |Equal | 2832 +-------+------------+---------+------------+-------------------------+ 2833 |one |LT | GT |ne |UN | LT | GT|Not equal | 2834 +-------+------------+---------+------------+-------------------------+ 2835 |lt |LT |ult |UN | LT |Less than | 2836 +-------+------------+---------+------------+-------------------------+ 2837 |le |LT | EQ |ule |UN | LT | EQ|Less than or equal | 2838 +-------+------------+---------+------------+-------------------------+ 2839 |gt |GT |ugt |UN | GT |Greater than | 2840 +-------+------------+---------+------------+-------------------------+ 2841 |ge |GT | EQ |uge |UN | GT | EQ|Greater than or equal | 2842 +-------+------------+---------+------------+-------------------------+ 2843 ``` 2844 2845 The standard C comparison operators, `<, <=, >, >=`, are all ordered, 2846 so they are false if either operand is NaN. The C equality operator, 2847 `==`, is ordered, and since inequality is defined as the logical 2848 inverse it is *unordered*. They map to the `floatcc` condition 2849 codes as follows: 2850 2851 ```text 2852 ==== ====== ============ 2853 C `Cond` Subset 2854 ==== ====== ============ 2855 `==` eq EQ 2856 `!=` ne UN | LT | GT 2857 `<` lt LT 2858 `<=` le LT | EQ 2859 `>` gt GT 2860 `>=` ge GT | EQ 2861 ==== ====== ============ 2862 ``` 2863 2864 This subset of condition codes also corresponds to the WebAssembly 2865 floating point comparisons of the same name. 2866 2867 When this instruction compares floating point vectors, it returns a 2868 vector with the results of lane-wise comparisons. 2869 2870 When comparing scalars, the result is: 2871 - `1` if the condition holds. 2872 - `0` if the condition does not hold. 2873 2874 When comparing vectors, the result is: 2875 - `-1` (i.e. all ones) in each lane where the condition holds. 2876 - `0` in each lane where the condition does not hold. 2877 "#, 2878 &formats.float_compare, 2879 ) 2880 .operands_in(vec![ 2881 Operand::new("Cond", &imm.floatcc), 2882 Operand::new("x", Float), 2883 Operand::new("y", Float), 2884 ]) 2885 .operands_out(vec![Operand::new("a", &Float.as_truthy())]), 2886 ); 2887 2888 ig.push( 2889 Inst::new( 2890 "fadd", 2891 r#" 2892 Floating point addition. 2893 "#, 2894 &formats.binary, 2895 ) 2896 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 2897 .operands_out(vec![ 2898 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2899 ]), 2900 ); 2901 2902 ig.push( 2903 Inst::new( 2904 "fsub", 2905 r#" 2906 Floating point subtraction. 2907 "#, 2908 &formats.binary, 2909 ) 2910 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 2911 .operands_out(vec![ 2912 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2913 ]), 2914 ); 2915 2916 ig.push( 2917 Inst::new( 2918 "fmul", 2919 r#" 2920 Floating point multiplication. 2921 "#, 2922 &formats.binary, 2923 ) 2924 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 2925 .operands_out(vec![ 2926 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2927 ]), 2928 ); 2929 2930 ig.push( 2931 Inst::new( 2932 "fdiv", 2933 r#" 2934 Floating point division. 2935 2936 Unlike the integer division instructions ` and 2937 `udiv`, this can't trap. Division by zero is infinity or 2938 NaN, depending on the dividend. 2939 "#, 2940 &formats.binary, 2941 ) 2942 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 2943 .operands_out(vec![ 2944 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2945 ]), 2946 ); 2947 2948 ig.push( 2949 Inst::new( 2950 "sqrt", 2951 r#" 2952 Floating point square root. 2953 "#, 2954 &formats.unary, 2955 ) 2956 .operands_in(vec![Operand::new("x", Float)]) 2957 .operands_out(vec![ 2958 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2959 ]), 2960 ); 2961 2962 ig.push( 2963 Inst::new( 2964 "fma", 2965 r#" 2966 Floating point fused multiply-and-add. 2967 2968 Computes `a := xy+z` without any intermediate rounding of the 2969 product. 2970 "#, 2971 &formats.ternary, 2972 ) 2973 .operands_in(vec![ 2974 Operand::new("x", Float), 2975 Operand::new("y", Float), 2976 Operand::new("z", Float), 2977 ]) 2978 .operands_out(vec![ 2979 Operand::new("a", Float).with_doc("Result of applying operator to each lane"), 2980 ]), 2981 ); 2982 2983 ig.push( 2984 Inst::new( 2985 "fneg", 2986 r#" 2987 Floating point negation. 2988 2989 Note that this is a pure bitwise operation. 2990 "#, 2991 &formats.unary, 2992 ) 2993 .operands_in(vec![Operand::new("x", Float)]) 2994 .operands_out(vec![ 2995 Operand::new("a", Float).with_doc("``x`` with its sign bit inverted"), 2996 ]), 2997 ); 2998 2999 ig.push( 3000 Inst::new( 3001 "fabs", 3002 r#" 3003 Floating point absolute value. 3004 3005 Note that this is a pure bitwise operation. 3006 "#, 3007 &formats.unary, 3008 ) 3009 .operands_in(vec![Operand::new("x", Float)]) 3010 .operands_out(vec![ 3011 Operand::new("a", Float).with_doc("``x`` with its sign bit cleared"), 3012 ]), 3013 ); 3014 3015 ig.push( 3016 Inst::new( 3017 "fcopysign", 3018 r#" 3019 Floating point copy sign. 3020 3021 Note that this is a pure bitwise operation. The sign bit from ``y`` is 3022 copied to the sign bit of ``x``. 3023 "#, 3024 &formats.binary, 3025 ) 3026 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 3027 .operands_out(vec![ 3028 Operand::new("a", Float).with_doc("``x`` with its sign bit changed to that of ``y``"), 3029 ]), 3030 ); 3031 3032 ig.push( 3033 Inst::new( 3034 "fmin", 3035 r#" 3036 Floating point minimum, propagating NaNs using the WebAssembly rules. 3037 3038 If either operand is NaN, this returns NaN with an unspecified sign. Furthermore, if 3039 each input NaN consists of a mantissa whose most significant bit is 1 and the rest is 3040 0, then the output has the same form. Otherwise, the output mantissa's most significant 3041 bit is 1 and the rest is unspecified. 3042 "#, 3043 &formats.binary, 3044 ) 3045 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 3046 .operands_out(vec![ 3047 Operand::new("a", Float).with_doc("The smaller of ``x`` and ``y``"), 3048 ]), 3049 ); 3050 3051 ig.push( 3052 Inst::new( 3053 "fmax", 3054 r#" 3055 Floating point maximum, propagating NaNs using the WebAssembly rules. 3056 3057 If either operand is NaN, this returns NaN with an unspecified sign. Furthermore, if 3058 each input NaN consists of a mantissa whose most significant bit is 1 and the rest is 3059 0, then the output has the same form. Otherwise, the output mantissa's most significant 3060 bit is 1 and the rest is unspecified. 3061 "#, 3062 &formats.binary, 3063 ) 3064 .operands_in(vec![Operand::new("x", Float), Operand::new("y", Float)]) 3065 .operands_out(vec![ 3066 Operand::new("a", Float).with_doc("The larger of ``x`` and ``y``"), 3067 ]), 3068 ); 3069 3070 ig.push( 3071 Inst::new( 3072 "ceil", 3073 r#" 3074 Round floating point round to integral, towards positive infinity. 3075 "#, 3076 &formats.unary, 3077 ) 3078 .operands_in(vec![Operand::new("x", Float)]) 3079 .operands_out(vec![ 3080 Operand::new("a", Float).with_doc("``x`` rounded to integral value"), 3081 ]), 3082 ); 3083 3084 ig.push( 3085 Inst::new( 3086 "floor", 3087 r#" 3088 Round floating point round to integral, towards negative infinity. 3089 "#, 3090 &formats.unary, 3091 ) 3092 .operands_in(vec![Operand::new("x", Float)]) 3093 .operands_out(vec![ 3094 Operand::new("a", Float).with_doc("``x`` rounded to integral value"), 3095 ]), 3096 ); 3097 3098 ig.push( 3099 Inst::new( 3100 "trunc", 3101 r#" 3102 Round floating point round to integral, towards zero. 3103 "#, 3104 &formats.unary, 3105 ) 3106 .operands_in(vec![Operand::new("x", Float)]) 3107 .operands_out(vec![ 3108 Operand::new("a", Float).with_doc("``x`` rounded to integral value"), 3109 ]), 3110 ); 3111 3112 ig.push( 3113 Inst::new( 3114 "nearest", 3115 r#" 3116 Round floating point round to integral, towards nearest with ties to 3117 even. 3118 "#, 3119 &formats.unary, 3120 ) 3121 .operands_in(vec![Operand::new("x", Float)]) 3122 .operands_out(vec![ 3123 Operand::new("a", Float).with_doc("``x`` rounded to integral value"), 3124 ]), 3125 ); 3126 3127 ig.push( 3128 Inst::new( 3129 "bitcast", 3130 r#" 3131 Reinterpret the bits in `x` as a different type. 3132 3133 The input and output types must be storable to memory and of the same 3134 size. A bitcast is equivalent to storing one type and loading the other 3135 type from the same address, both using the specified MemFlags. 3136 3137 Note that this operation only supports the `big` or `little` MemFlags. 3138 The specified byte order only affects the result in the case where 3139 input and output types differ in lane count/size. In this case, the 3140 operation is only valid if a byte order specifier is provided. 3141 "#, 3142 &formats.load_no_offset, 3143 ) 3144 .operands_in(vec![ 3145 Operand::new("MemFlags", &imm.memflags), 3146 Operand::new("x", Mem), 3147 ]) 3148 .operands_out(vec![ 3149 Operand::new("a", MemTo).with_doc("Bits of `x` reinterpreted"), 3150 ]), 3151 ); 3152 3153 ig.push( 3154 Inst::new( 3155 "scalar_to_vector", 3156 r#" 3157 Copies a scalar value to a vector value. The scalar is copied into the 3158 least significant lane of the vector, and all other lanes will be zero. 3159 "#, 3160 &formats.unary, 3161 ) 3162 .operands_in(vec![ 3163 Operand::new("s", &TxN.lane_of()).with_doc("A scalar value"), 3164 ]) 3165 .operands_out(vec![Operand::new("a", TxN).with_doc("A vector value")]), 3166 ); 3167 3168 let Truthy = &TypeVar::new( 3169 "Truthy", 3170 "A scalar whose values are truthy", 3171 TypeSetBuilder::new().ints(Interval::All).build(), 3172 ); 3173 let IntTo = &TypeVar::new( 3174 "IntTo", 3175 "An integer type", 3176 TypeSetBuilder::new().ints(Interval::All).build(), 3177 ); 3178 3179 ig.push( 3180 Inst::new( 3181 "bmask", 3182 r#" 3183 Convert `x` to an integer mask. 3184 3185 Non-zero maps to all 1s and zero maps to all 0s. 3186 "#, 3187 &formats.unary, 3188 ) 3189 .operands_in(vec![Operand::new("x", Truthy)]) 3190 .operands_out(vec![Operand::new("a", IntTo)]), 3191 ); 3192 3193 let Int = &TypeVar::new( 3194 "Int", 3195 "A scalar integer type", 3196 TypeSetBuilder::new().ints(Interval::All).build(), 3197 ); 3198 3199 ig.push( 3200 Inst::new( 3201 "ireduce", 3202 r#" 3203 Convert `x` to a smaller integer type by discarding 3204 the most significant bits. 3205 3206 This is the same as reducing modulo `2^n`. 3207 "#, 3208 &formats.unary, 3209 ) 3210 .operands_in(vec![ 3211 Operand::new("x", &Int.wider()) 3212 .with_doc("A scalar integer type, wider than the controlling type"), 3213 ]) 3214 .operands_out(vec![Operand::new("a", Int)]), 3215 ); 3216 3217 let I16or32or64xN = &TypeVar::new( 3218 "I16or32or64xN", 3219 "A SIMD vector type containing integer lanes 16, 32, or 64 bits wide", 3220 TypeSetBuilder::new() 3221 .ints(16..64) 3222 .simd_lanes(2..8) 3223 .dynamic_simd_lanes(2..8) 3224 .includes_scalars(false) 3225 .build(), 3226 ); 3227 3228 ig.push( 3229 Inst::new( 3230 "snarrow", 3231 r#" 3232 Combine `x` and `y` into a vector with twice the lanes but half the integer width while 3233 saturating overflowing values to the signed maximum and minimum. 3234 3235 The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4` 3236 and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value 3237 returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`. 3238 "#, 3239 &formats.binary, 3240 ) 3241 .operands_in(vec![ 3242 Operand::new("x", I16or32or64xN), 3243 Operand::new("y", I16or32or64xN), 3244 ]) 3245 .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]), 3246 ); 3247 3248 ig.push( 3249 Inst::new( 3250 "unarrow", 3251 r#" 3252 Combine `x` and `y` into a vector with twice the lanes but half the integer width while 3253 saturating overflowing values to the unsigned maximum and minimum. 3254 3255 Note that all input lanes are considered signed: any negative lanes will overflow and be 3256 replaced with the unsigned minimum, `0x00`. 3257 3258 The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4` 3259 and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value 3260 returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`. 3261 "#, 3262 &formats.binary, 3263 ) 3264 .operands_in(vec![ 3265 Operand::new("x", I16or32or64xN), 3266 Operand::new("y", I16or32or64xN), 3267 ]) 3268 .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]), 3269 ); 3270 3271 ig.push( 3272 Inst::new( 3273 "uunarrow", 3274 r#" 3275 Combine `x` and `y` into a vector with twice the lanes but half the integer width while 3276 saturating overflowing values to the unsigned maximum and minimum. 3277 3278 Note that all input lanes are considered unsigned: any negative values will be interpreted as unsigned, overflowing and being replaced with the unsigned maximum. 3279 3280 The lanes will be concatenated after narrowing. For example, when `x` and `y` are `i32x4` 3281 and `x = [x3, x2, x1, x0]` and `y = [y3, y2, y1, y0]`, then after narrowing the value 3282 returned is an `i16x8`: `a = [y3', y2', y1', y0', x3', x2', x1', x0']`. 3283 "#, 3284 &formats.binary, 3285 ) 3286 .operands_in(vec![Operand::new("x", I16or32or64xN), Operand::new("y", I16or32or64xN)]) 3287 .operands_out(vec![Operand::new("a", &I16or32or64xN.split_lanes())]), 3288 ); 3289 3290 let I8or16or32xN = &TypeVar::new( 3291 "I8or16or32xN", 3292 "A SIMD vector type containing integer lanes 8, 16, or 32 bits wide.", 3293 TypeSetBuilder::new() 3294 .ints(8..32) 3295 .simd_lanes(2..16) 3296 .dynamic_simd_lanes(2..16) 3297 .includes_scalars(false) 3298 .build(), 3299 ); 3300 3301 ig.push( 3302 Inst::new( 3303 "swiden_low", 3304 r#" 3305 Widen the low lanes of `x` using signed extension. 3306 3307 This will double the lane width and halve the number of lanes. 3308 "#, 3309 &formats.unary, 3310 ) 3311 .operands_in(vec![Operand::new("x", I8or16or32xN)]) 3312 .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]), 3313 ); 3314 3315 ig.push( 3316 Inst::new( 3317 "swiden_high", 3318 r#" 3319 Widen the high lanes of `x` using signed extension. 3320 3321 This will double the lane width and halve the number of lanes. 3322 "#, 3323 &formats.unary, 3324 ) 3325 .operands_in(vec![Operand::new("x", I8or16or32xN)]) 3326 .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]), 3327 ); 3328 3329 ig.push( 3330 Inst::new( 3331 "uwiden_low", 3332 r#" 3333 Widen the low lanes of `x` using unsigned extension. 3334 3335 This will double the lane width and halve the number of lanes. 3336 "#, 3337 &formats.unary, 3338 ) 3339 .operands_in(vec![Operand::new("x", I8or16or32xN)]) 3340 .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]), 3341 ); 3342 3343 ig.push( 3344 Inst::new( 3345 "uwiden_high", 3346 r#" 3347 Widen the high lanes of `x` using unsigned extension. 3348 3349 This will double the lane width and halve the number of lanes. 3350 "#, 3351 &formats.unary, 3352 ) 3353 .operands_in(vec![Operand::new("x", I8or16or32xN)]) 3354 .operands_out(vec![Operand::new("a", &I8or16or32xN.merge_lanes())]), 3355 ); 3356 3357 ig.push( 3358 Inst::new( 3359 "iadd_pairwise", 3360 r#" 3361 Does lane-wise integer pairwise addition on two operands, putting the 3362 combined results into a single vector result. Here a pair refers to adjacent 3363 lanes in a vector, i.e. i*2 + (i*2+1) for i == num_lanes/2. The first operand 3364 pairwise add results will make up the low half of the resulting vector while 3365 the second operand pairwise add results will make up the upper half of the 3366 resulting vector. 3367 "#, 3368 &formats.binary, 3369 ) 3370 .operands_in(vec![ 3371 Operand::new("x", I8or16or32xN), 3372 Operand::new("y", I8or16or32xN), 3373 ]) 3374 .operands_out(vec![Operand::new("a", I8or16or32xN)]), 3375 ); 3376 3377 let I8x16 = &TypeVar::new( 3378 "I8x16", 3379 "A SIMD vector type consisting of 16 lanes of 8-bit integers", 3380 TypeSetBuilder::new() 3381 .ints(8..8) 3382 .simd_lanes(16..16) 3383 .includes_scalars(false) 3384 .build(), 3385 ); 3386 3387 ig.push( 3388 Inst::new( 3389 "x86_pmaddubsw", 3390 r#" 3391 An instruction with equivalent semantics to `pmaddubsw` on x86. 3392 3393 This instruction will take signed bytes from the first argument and 3394 multiply them against unsigned bytes in the second argument. Adjacent 3395 pairs are then added, with saturating, to a 16-bit value and are packed 3396 into the result. 3397 "#, 3398 &formats.binary, 3399 ) 3400 .operands_in(vec![Operand::new("x", I8x16), Operand::new("y", I8x16)]) 3401 .operands_out(vec![Operand::new("a", I16x8)]), 3402 ); 3403 3404 ig.push( 3405 Inst::new( 3406 "uextend", 3407 r#" 3408 Convert `x` to a larger integer type by zero-extending. 3409 3410 Each lane in `x` is converted to a larger integer type by adding 3411 zeroes. The result has the same numerical value as `x` when both are 3412 interpreted as unsigned integers. 3413 3414 The result type must have the same number of vector lanes as the input, 3415 and each lane must not have fewer bits that the input lanes. If the 3416 input and output types are the same, this is a no-op. 3417 "#, 3418 &formats.unary, 3419 ) 3420 .operands_in(vec![Operand::new("x", &Int.narrower()).with_doc( 3421 "A scalar integer type, narrower than the controlling type", 3422 )]) 3423 .operands_out(vec![Operand::new("a", Int)]), 3424 ); 3425 3426 ig.push( 3427 Inst::new( 3428 "sextend", 3429 r#" 3430 Convert `x` to a larger integer type by sign-extending. 3431 3432 Each lane in `x` is converted to a larger integer type by replicating 3433 the sign bit. The result has the same numerical value as `x` when both 3434 are interpreted as signed integers. 3435 3436 The result type must have the same number of vector lanes as the input, 3437 and each lane must not have fewer bits that the input lanes. If the 3438 input and output types are the same, this is a no-op. 3439 "#, 3440 &formats.unary, 3441 ) 3442 .operands_in(vec![Operand::new("x", &Int.narrower()).with_doc( 3443 "A scalar integer type, narrower than the controlling type", 3444 )]) 3445 .operands_out(vec![Operand::new("a", Int)]), 3446 ); 3447 3448 let FloatScalar = &TypeVar::new( 3449 "FloatScalar", 3450 "A scalar only floating point number", 3451 TypeSetBuilder::new().floats(Interval::All).build(), 3452 ); 3453 3454 ig.push( 3455 Inst::new( 3456 "fpromote", 3457 r#" 3458 Convert `x` to a larger floating point format. 3459 3460 Each lane in `x` is converted to the destination floating point format. 3461 This is an exact operation. 3462 3463 Cranelift currently only supports two floating point formats 3464 - `f32` and `f64`. This may change in the future. 3465 3466 The result type must have the same number of vector lanes as the input, 3467 and the result lanes must not have fewer bits than the input lanes. 3468 "#, 3469 &formats.unary, 3470 ) 3471 .operands_in(vec![Operand::new("x", &FloatScalar.narrower()).with_doc( 3472 "A scalar only floating point number, narrower than the controlling type", 3473 )]) 3474 .operands_out(vec![Operand::new("a", FloatScalar)]), 3475 ); 3476 3477 ig.push( 3478 Inst::new( 3479 "fdemote", 3480 r#" 3481 Convert `x` to a smaller floating point format. 3482 3483 Each lane in `x` is converted to the destination floating point format 3484 by rounding to nearest, ties to even. 3485 3486 Cranelift currently only supports two floating point formats 3487 - `f32` and `f64`. This may change in the future. 3488 3489 The result type must have the same number of vector lanes as the input, 3490 and the result lanes must not have more bits than the input lanes. 3491 "#, 3492 &formats.unary, 3493 ) 3494 .operands_in(vec![Operand::new("x", &FloatScalar.wider()).with_doc( 3495 "A scalar only floating point number, wider than the controlling type", 3496 )]) 3497 .operands_out(vec![Operand::new("a", FloatScalar)]), 3498 ); 3499 3500 let F64x2 = &TypeVar::new( 3501 "F64x2", 3502 "A SIMD vector type consisting of 2 lanes of 64-bit floats", 3503 TypeSetBuilder::new() 3504 .floats(64..64) 3505 .simd_lanes(2..2) 3506 .includes_scalars(false) 3507 .build(), 3508 ); 3509 let F32x4 = &TypeVar::new( 3510 "F32x4", 3511 "A SIMD vector type consisting of 4 lanes of 32-bit floats", 3512 TypeSetBuilder::new() 3513 .floats(32..32) 3514 .simd_lanes(4..4) 3515 .includes_scalars(false) 3516 .build(), 3517 ); 3518 3519 ig.push( 3520 Inst::new( 3521 "fvdemote", 3522 r#" 3523 Convert `x` to a smaller floating point format. 3524 3525 Each lane in `x` is converted to the destination floating point format 3526 by rounding to nearest, ties to even. 3527 3528 Cranelift currently only supports two floating point formats 3529 - `f32` and `f64`. This may change in the future. 3530 3531 Fvdemote differs from fdemote in that with fvdemote it targets vectors. 3532 Fvdemote is constrained to having the input type being F64x2 and the result 3533 type being F32x4. The result lane that was the upper half of the input lane 3534 is initialized to zero. 3535 "#, 3536 &formats.unary, 3537 ) 3538 .operands_in(vec![Operand::new("x", F64x2)]) 3539 .operands_out(vec![Operand::new("a", F32x4)]), 3540 ); 3541 3542 ig.push( 3543 Inst::new( 3544 "fvpromote_low", 3545 r#" 3546 Converts packed single precision floating point to packed double precision floating point. 3547 3548 Considering only the lower half of the register, the low lanes in `x` are interpreted as 3549 single precision floats that are then converted to a double precision floats. 3550 3551 The result type will have half the number of vector lanes as the input. Fvpromote_low is 3552 constrained to input F32x4 with a result type of F64x2. 3553 "#, 3554 &formats.unary, 3555 ) 3556 .operands_in(vec![Operand::new("a", F32x4)]) 3557 .operands_out(vec![Operand::new("x", F64x2)]), 3558 ); 3559 3560 let IntTo = &TypeVar::new( 3561 "IntTo", 3562 "An scalar only integer type", 3563 TypeSetBuilder::new().ints(Interval::All).build(), 3564 ); 3565 3566 ig.push( 3567 Inst::new( 3568 "fcvt_to_uint", 3569 r#" 3570 Converts floating point scalars to unsigned integer. 3571 3572 Only operates on `x` if it is a scalar. If `x` is NaN or if 3573 the unsigned integral value cannot be represented in the result 3574 type, this instruction traps. 3575 3576 "#, 3577 &formats.unary, 3578 ) 3579 .operands_in(vec![Operand::new("x", FloatScalar)]) 3580 .operands_out(vec![Operand::new("a", IntTo)]) 3581 .can_trap() 3582 .side_effects_idempotent(), 3583 ); 3584 3585 ig.push( 3586 Inst::new( 3587 "fcvt_to_sint", 3588 r#" 3589 Converts floating point scalars to signed integer. 3590 3591 Only operates on `x` if it is a scalar. If `x` is NaN or if 3592 the unsigned integral value cannot be represented in the result 3593 type, this instruction traps. 3594 3595 "#, 3596 &formats.unary, 3597 ) 3598 .operands_in(vec![Operand::new("x", FloatScalar)]) 3599 .operands_out(vec![Operand::new("a", IntTo)]) 3600 .can_trap() 3601 .side_effects_idempotent(), 3602 ); 3603 3604 let IntTo = &TypeVar::new( 3605 "IntTo", 3606 "A larger integer type with the same number of lanes", 3607 TypeSetBuilder::new() 3608 .ints(Interval::All) 3609 .simd_lanes(Interval::All) 3610 .build(), 3611 ); 3612 3613 ig.push( 3614 Inst::new( 3615 "fcvt_to_uint_sat", 3616 r#" 3617 Convert floating point to unsigned integer as fcvt_to_uint does, but 3618 saturates the input instead of trapping. NaN and negative values are 3619 converted to 0. 3620 "#, 3621 &formats.unary, 3622 ) 3623 .operands_in(vec![Operand::new("x", Float)]) 3624 .operands_out(vec![Operand::new("a", IntTo)]), 3625 ); 3626 3627 ig.push( 3628 Inst::new( 3629 "fcvt_to_sint_sat", 3630 r#" 3631 Convert floating point to signed integer as fcvt_to_sint does, but 3632 saturates the input instead of trapping. NaN values are converted to 0. 3633 "#, 3634 &formats.unary, 3635 ) 3636 .operands_in(vec![Operand::new("x", Float)]) 3637 .operands_out(vec![Operand::new("a", IntTo)]), 3638 ); 3639 3640 ig.push( 3641 Inst::new( 3642 "x86_cvtt2dq", 3643 r#" 3644 A float-to-integer conversion instruction for vectors-of-floats which 3645 has the same semantics as `cvttp{s,d}2dq` on x86. This specifically 3646 returns `INT_MIN` for NaN or out-of-bounds lanes. 3647 "#, 3648 &formats.unary, 3649 ) 3650 .operands_in(vec![Operand::new("x", Float)]) 3651 .operands_out(vec![Operand::new("a", IntTo)]), 3652 ); 3653 3654 let Int = &TypeVar::new( 3655 "Int", 3656 "A scalar or vector integer type", 3657 TypeSetBuilder::new() 3658 .ints(Interval::All) 3659 .simd_lanes(Interval::All) 3660 .build(), 3661 ); 3662 3663 let FloatTo = &TypeVar::new( 3664 "FloatTo", 3665 "A scalar or vector floating point number", 3666 TypeSetBuilder::new() 3667 .floats(Interval::All) 3668 .simd_lanes(Interval::All) 3669 .build(), 3670 ); 3671 3672 ig.push( 3673 Inst::new( 3674 "fcvt_from_uint", 3675 r#" 3676 Convert unsigned integer to floating point. 3677 3678 Each lane in `x` is interpreted as an unsigned integer and converted to 3679 floating point using round to nearest, ties to even. 3680 3681 The result type must have the same number of vector lanes as the input. 3682 "#, 3683 &formats.unary, 3684 ) 3685 .operands_in(vec![Operand::new("x", Int)]) 3686 .operands_out(vec![Operand::new("a", FloatTo)]), 3687 ); 3688 3689 ig.push( 3690 Inst::new( 3691 "fcvt_from_sint", 3692 r#" 3693 Convert signed integer to floating point. 3694 3695 Each lane in `x` is interpreted as a signed integer and converted to 3696 floating point using round to nearest, ties to even. 3697 3698 The result type must have the same number of vector lanes as the input. 3699 "#, 3700 &formats.unary, 3701 ) 3702 .operands_in(vec![Operand::new("x", Int)]) 3703 .operands_out(vec![Operand::new("a", FloatTo)]), 3704 ); 3705 3706 let WideInt = &TypeVar::new( 3707 "WideInt", 3708 "An integer type of width `i16` upwards", 3709 TypeSetBuilder::new().ints(16..128).build(), 3710 ); 3711 3712 ig.push( 3713 Inst::new( 3714 "isplit", 3715 r#" 3716 Split an integer into low and high parts. 3717 3718 Vectors of integers are split lane-wise, so the results have the same 3719 number of lanes as the input, but the lanes are half the size. 3720 3721 Returns the low half of `x` and the high half of `x` as two independent 3722 values. 3723 "#, 3724 &formats.unary, 3725 ) 3726 .operands_in(vec![Operand::new("x", WideInt)]) 3727 .operands_out(vec![ 3728 Operand::new("lo", &WideInt.half_width()).with_doc("The low bits of `x`"), 3729 Operand::new("hi", &WideInt.half_width()).with_doc("The high bits of `x`"), 3730 ]), 3731 ); 3732 3733 ig.push( 3734 Inst::new( 3735 "iconcat", 3736 r#" 3737 Concatenate low and high bits to form a larger integer type. 3738 3739 Vectors of integers are concatenated lane-wise such that the result has 3740 the same number of lanes as the inputs, but the lanes are twice the 3741 size. 3742 "#, 3743 &formats.binary, 3744 ) 3745 .operands_in(vec![ 3746 Operand::new("lo", NarrowInt), 3747 Operand::new("hi", NarrowInt), 3748 ]) 3749 .operands_out(vec![ 3750 Operand::new("a", &NarrowInt.double_width()) 3751 .with_doc("The concatenation of `lo` and `hi`"), 3752 ]), 3753 ); 3754 3755 // Instructions relating to atomic memory accesses and fences 3756 let AtomicMem = &TypeVar::new( 3757 "AtomicMem", 3758 "Any type that can be stored in memory, which can be used in an atomic operation", 3759 TypeSetBuilder::new().ints(8..128).build(), 3760 ); 3761 3762 ig.push( 3763 Inst::new( 3764 "atomic_rmw", 3765 r#" 3766 Atomically read-modify-write memory at `p`, with second operand `x`. The old value is 3767 returned. `p` has the type of the target word size, and `x` may be any integer type; note 3768 that some targets require specific target features to be enabled in order to support 128-bit 3769 integer atomics. The type of the returned value is the same as the type of `x`. This 3770 operation is sequentially consistent and creates happens-before edges that order normal 3771 (non-atomic) loads and stores. 3772 "#, 3773 &formats.atomic_rmw, 3774 ) 3775 .operands_in(vec![ 3776 Operand::new("MemFlags", &imm.memflags), 3777 Operand::new("AtomicRmwOp", &imm.atomic_rmw_op), 3778 Operand::new("p", iAddr), 3779 Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"), 3780 ]) 3781 .operands_out(vec![ 3782 Operand::new("a", AtomicMem).with_doc("Value atomically loaded"), 3783 ]) 3784 .can_load() 3785 .can_store() 3786 .other_side_effects(), 3787 ); 3788 3789 ig.push( 3790 Inst::new( 3791 "atomic_cas", 3792 r#" 3793 Perform an atomic compare-and-swap operation on memory at `p`, with expected value `e`, 3794 storing `x` if the value at `p` equals `e`. The old value at `p` is returned, 3795 regardless of whether the operation succeeds or fails. `p` has the type of the target 3796 word size, and `x` and `e` must have the same type and the same size, which may be any 3797 integer type; note that some targets require specific target features to be enabled in order 3798 to support 128-bit integer atomics. The type of the returned value is the same as the type 3799 of `x` and `e`. This operation is sequentially consistent and creates happens-before edges 3800 that order normal (non-atomic) loads and stores. 3801 "#, 3802 &formats.atomic_cas, 3803 ) 3804 .operands_in(vec![ 3805 Operand::new("MemFlags", &imm.memflags), 3806 Operand::new("p", iAddr), 3807 Operand::new("e", AtomicMem).with_doc("Expected value in CAS"), 3808 Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"), 3809 ]) 3810 .operands_out(vec![ 3811 Operand::new("a", AtomicMem).with_doc("Value atomically loaded"), 3812 ]) 3813 .can_load() 3814 .can_store() 3815 .other_side_effects(), 3816 ); 3817 3818 ig.push( 3819 Inst::new( 3820 "atomic_load", 3821 r#" 3822 Atomically load from memory at `p`. 3823 3824 This is a polymorphic instruction that can load any value type which has a memory 3825 representation. It can only be used for integer types; note that some targets require 3826 specific target features to be enabled in order to support 128-bit integer atomics. This 3827 operation is sequentially consistent and creates happens-before edges that order normal 3828 (non-atomic) loads and stores. 3829 "#, 3830 &formats.load_no_offset, 3831 ) 3832 .operands_in(vec![ 3833 Operand::new("MemFlags", &imm.memflags), 3834 Operand::new("p", iAddr), 3835 ]) 3836 .operands_out(vec![ 3837 Operand::new("a", AtomicMem).with_doc("Value atomically loaded"), 3838 ]) 3839 .can_load() 3840 .other_side_effects(), 3841 ); 3842 3843 ig.push( 3844 Inst::new( 3845 "atomic_store", 3846 r#" 3847 Atomically store `x` to memory at `p`. 3848 3849 This is a polymorphic instruction that can store any value type with a memory 3850 representation. It can only be used for integer types; note that some targets require 3851 specific target features to be enabled in order to support 128-bit integer atomics This 3852 operation is sequentially consistent and creates happens-before edges that order normal 3853 (non-atomic) loads and stores. 3854 "#, 3855 &formats.store_no_offset, 3856 ) 3857 .operands_in(vec![ 3858 Operand::new("MemFlags", &imm.memflags), 3859 Operand::new("x", AtomicMem).with_doc("Value to be atomically stored"), 3860 Operand::new("p", iAddr), 3861 ]) 3862 .can_store() 3863 .other_side_effects(), 3864 ); 3865 3866 ig.push( 3867 Inst::new( 3868 "fence", 3869 r#" 3870 A memory fence. This must provide ordering to ensure that, at a minimum, neither loads 3871 nor stores of any kind may move forwards or backwards across the fence. This operation 3872 is sequentially consistent. 3873 "#, 3874 &formats.nullary, 3875 ) 3876 .other_side_effects(), 3877 ); 3878 3879 let TxN = &TypeVar::new( 3880 "TxN", 3881 "A dynamic vector type", 3882 TypeSetBuilder::new() 3883 .ints(Interval::All) 3884 .floats(Interval::All) 3885 .dynamic_simd_lanes(Interval::All) 3886 .build(), 3887 ); 3888 3889 ig.push( 3890 Inst::new( 3891 "extract_vector", 3892 r#" 3893 Return a fixed length sub vector, extracted from a dynamic vector. 3894 "#, 3895 &formats.binary_imm8, 3896 ) 3897 .operands_in(vec![ 3898 Operand::new("x", TxN).with_doc("The dynamic vector to extract from"), 3899 Operand::new("y", &imm.uimm8).with_doc("128-bit vector index"), 3900 ]) 3901 .operands_out(vec![ 3902 Operand::new("a", &TxN.dynamic_to_vector()).with_doc("New fixed vector"), 3903 ]), 3904 ); 3905 3906 ig.push( 3907 Inst::new( 3908 "sequence_point", 3909 r#" 3910 A compiler barrier that acts as an immovable marker from IR input to machine-code output. 3911 3912 This "sequence point" can have debug tags attached to it, and these tags will be 3913 noted in the output `MachBuffer`. 3914 3915 It prevents motion of any other side-effects across this boundary. 3916 "#, 3917 &formats.nullary, 3918 ) 3919 .other_side_effects(), 3920 ); 3921 } 3922