1 //===-- llvm/CodeGen/ISDOpcodes.h - CodeGen opcodes -------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file declares codegen opcodes and related utilities.
11 //===----------------------------------------------------------------------===//
13 #ifndef LLVM_CODEGEN_ISDOPCODES_H
14 #define LLVM_CODEGEN_ISDOPCODES_H
18 /// ISD namespace - This namespace contains an enum which represents all of the
19 /// SelectionDAG node types and value types.
23 //===--------------------------------------------------------------------===//
24 /// ISD::NodeType enum - This enum defines the target-independent operators
25 /// for a SelectionDAG.
27 /// Targets may also define target-dependent operator codes for SDNodes. For
28 /// example, on x86, these are the enum values in the X86ISD namespace.
29 /// Targets should aim to use target-independent operators to model their
30 /// instruction sets as much as possible, and only use target-dependent
31 /// operators when they have special requirements.
33 /// Finally, during and after selection proper, SNodes may use special
34 /// operator codes that correspond directly with MachineInstr opcodes. These
35 /// are used to represent selected instructions. See the isMachineOpcode()
36 /// and getMachineOpcode() member functions of SDNode.
39 /// DELETED_NODE - This is an illegal value that is used to catch
40 /// errors. This opcode is not a legal opcode for any node.
43 /// EntryToken - This is the marker used to indicate the start of a region.
46 /// TokenFactor - This node takes multiple tokens as input and produces a
47 /// single token result. This is used to represent the fact that the operand
48 /// operators are independent of each other.
51 /// AssertSext, AssertZext - These nodes record if a register contains a
52 /// value that has already been zero or sign extended from a narrower type.
53 /// These nodes take two operands. The first is the node that has already
54 /// been extended, and the second is a value type node indicating the width
56 AssertSext
, AssertZext
,
58 /// Various leaf nodes.
59 BasicBlock
, VALUETYPE
, CONDCODE
, Register
, RegisterMask
,
61 GlobalAddress
, GlobalTLSAddress
, FrameIndex
,
62 JumpTable
, ConstantPool
, ExternalSymbol
, BlockAddress
,
64 /// The address of the GOT
67 /// FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and
68 /// llvm.returnaddress on the DAG. These nodes take one operand, the index
69 /// of the frame or return address to return. An index of zero corresponds
70 /// to the current function's frame or return address, an index of one to
71 /// the parent's frame or return address, and so on.
72 FRAMEADDR
, RETURNADDR
, ADDROFRETURNADDR
, SPONENTRY
,
74 /// LOCAL_RECOVER - Represents the llvm.localrecover intrinsic.
75 /// Materializes the offset from the local object pointer of another
76 /// function to a particular local object passed to llvm.localescape. The
77 /// operand is the MCSymbol label used to represent this offset, since
78 /// typically the offset is not known until after code generation of the
82 /// READ_REGISTER, WRITE_REGISTER - This node represents llvm.register on
83 /// the DAG, which implements the named register global variables extension.
87 /// FRAME_TO_ARGS_OFFSET - This node represents offset from frame pointer to
88 /// first (possible) on-stack argument. This is needed for correct stack
89 /// adjustment during unwind.
92 /// EH_DWARF_CFA - This node represents the pointer to the DWARF Canonical
93 /// Frame Address (CFA), generally the value of the stack pointer at the
94 /// call site in the previous frame.
97 /// OUTCHAIN = EH_RETURN(INCHAIN, OFFSET, HANDLER) - This node represents
98 /// 'eh_return' gcc dwarf builtin, which is used to return from
99 /// exception. The general meaning is: adjust stack by OFFSET and pass
100 /// execution to HANDLER. Many platform-related details also :)
103 /// RESULT, OUTCHAIN = EH_SJLJ_SETJMP(INCHAIN, buffer)
104 /// This corresponds to the eh.sjlj.setjmp intrinsic.
105 /// It takes an input chain and a pointer to the jump buffer as inputs
106 /// and returns an outchain.
109 /// OUTCHAIN = EH_SJLJ_LONGJMP(INCHAIN, buffer)
110 /// This corresponds to the eh.sjlj.longjmp intrinsic.
111 /// It takes an input chain and a pointer to the jump buffer as inputs
112 /// and returns an outchain.
115 /// OUTCHAIN = EH_SJLJ_SETUP_DISPATCH(INCHAIN)
116 /// The target initializes the dispatch table here.
117 EH_SJLJ_SETUP_DISPATCH
,
119 /// TargetConstant* - Like Constant*, but the DAG does not do any folding,
120 /// simplification, or lowering of the constant. They are used for constants
121 /// which are known to fit in the immediate fields of their users, or for
122 /// carrying magic numbers which are not values which need to be
123 /// materialized in registers.
127 /// TargetGlobalAddress - Like GlobalAddress, but the DAG does no folding or
128 /// anything else with this node, and this is valid in the target-specific
129 /// dag, turning into a GlobalAddress operand.
131 TargetGlobalTLSAddress
,
135 TargetExternalSymbol
,
140 /// TargetIndex - Like a constant pool entry, but with completely
141 /// target-dependent semantics. Holds target flags, a 32-bit index, and a
142 /// 64-bit index. Targets can use this however they like.
145 /// RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...)
146 /// This node represents a target intrinsic function with no side effects.
147 /// The first operand is the ID number of the intrinsic from the
148 /// llvm::Intrinsic namespace. The operands to the intrinsic follow. The
149 /// node returns the result of the intrinsic.
152 /// RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...)
153 /// This node represents a target intrinsic function with side effects that
154 /// returns a result. The first operand is a chain pointer. The second is
155 /// the ID number of the intrinsic from the llvm::Intrinsic namespace. The
156 /// operands to the intrinsic follow. The node has two results, the result
157 /// of the intrinsic and an output chain.
160 /// OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...)
161 /// This node represents a target intrinsic function with side effects that
162 /// does not return a result. The first operand is a chain pointer. The
163 /// second is the ID number of the intrinsic from the llvm::Intrinsic
164 /// namespace. The operands to the intrinsic follow.
167 /// CopyToReg - This node has three operands: a chain, a register number to
168 /// set to this value, and a value.
171 /// CopyFromReg - This node indicates that the input value is a virtual or
172 /// physical register that is defined outside of the scope of this
173 /// SelectionDAG. The register is available from the RegisterSDNode object.
176 /// UNDEF - An undefined node.
179 /// EXTRACT_ELEMENT - This is used to get the lower or upper (determined by
180 /// a Constant, which is required to be operand #1) half of the integer or
181 /// float value specified as operand #0. This is only for use before
182 /// legalization, for values that will be broken into multiple registers.
185 /// BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
186 /// Given two values of the same integer value type, this produces a value
187 /// twice as big. Like EXTRACT_ELEMENT, this can only be used before
188 /// legalization. The lower part of the composite value should be in
189 /// element 0 and the upper part should be in element 1.
192 /// MERGE_VALUES - This node takes multiple discrete operands and returns
193 /// them all as its individual results. This nodes has exactly the same
194 /// number of inputs and outputs. This node is useful for some pieces of the
195 /// code generator that want to think about a single node with multiple
196 /// results, not multiple nodes.
199 /// Simple integer binary arithmetic operators.
200 ADD
, SUB
, MUL
, SDIV
, UDIV
, SREM
, UREM
,
202 /// SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing
203 /// a signed/unsigned value of type i[2*N], and return the full value as
204 /// two results, each of type iN.
205 SMUL_LOHI
, UMUL_LOHI
,
207 /// SDIVREM/UDIVREM - Divide two integers and produce both a quotient and
208 /// remainder result.
211 /// CARRY_FALSE - This node is used when folding other nodes,
212 /// like ADDC/SUBC, which indicate the carry result is always false.
215 /// Carry-setting nodes for multiple precision addition and subtraction.
216 /// These nodes take two operands of the same value type, and produce two
217 /// results. The first result is the normal add or sub result, the second
218 /// result is the carry flag result.
219 /// FIXME: These nodes are deprecated in favor of ADDCARRY and SUBCARRY.
220 /// They are kept around for now to provide a smooth transition path
221 /// toward the use of ADDCARRY/SUBCARRY and will eventually be removed.
224 /// Carry-using nodes for multiple precision addition and subtraction. These
225 /// nodes take three operands: The first two are the normal lhs and rhs to
226 /// the add or sub, and the third is the input carry flag. These nodes
227 /// produce two results; the normal result of the add or sub, and the output
228 /// carry flag. These nodes both read and write a carry flag to allow them
229 /// to them to be chained together for add and sub of arbitrarily large
233 /// Carry-using nodes for multiple precision addition and subtraction.
234 /// These nodes take three operands: The first two are the normal lhs and
235 /// rhs to the add or sub, and the third is a boolean indicating if there
236 /// is an incoming carry. These nodes produce two results: the normal
237 /// result of the add or sub, and the output carry so they can be chained
238 /// together. The use of this opcode is preferable to adde/sube if the
239 /// target supports it, as the carry is a regular value rather than a
240 /// glue, which allows further optimisation.
243 /// RESULT, BOOL = [SU]ADDO(LHS, RHS) - Overflow-aware nodes for addition.
244 /// These nodes take two operands: the normal LHS and RHS to the add. They
245 /// produce two results: the normal result of the add, and a boolean that
246 /// indicates if an overflow occurred (*not* a flag, because it may be store
247 /// to memory, etc.). If the type of the boolean is not i1 then the high
248 /// bits conform to getBooleanContents.
249 /// These nodes are generated from llvm.[su]add.with.overflow intrinsics.
252 /// Same for subtraction.
255 /// Same for multiplication.
258 /// RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2
259 /// integers with the same bit width (W). If the true value of LHS + RHS
260 /// exceeds the largest value that can be represented by W bits, the
261 /// resulting value is this maximum value. Otherwise, if this value is less
262 /// than the smallest value that can be represented by W bits, the
263 /// resulting value is this minimum value.
266 /// RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2
267 /// integers with the same bit width (W). If the true value of LHS - RHS
268 /// exceeds the largest value that can be represented by W bits, the
269 /// resulting value is this maximum value. Otherwise, if this value is less
270 /// than the smallest value that can be represented by W bits, the
271 /// resulting value is this minimum value.
274 /// RESULT = [US]MULFIX(LHS, RHS, SCALE) - Perform fixed point multiplication on
275 /// 2 integers with the same width and scale. SCALE represents the scale of
276 /// both operands as fixed point numbers. This SCALE parameter must be a
277 /// constant integer. A scale of zero is effectively performing
278 /// multiplication on 2 integers.
281 /// Same as the corresponding unsaturated fixed point instructions, but the
282 /// result is clamped between the min and max values representable by the
283 /// bits of the first 2 operands.
284 SMULFIXSAT
, UMULFIXSAT
,
286 /// Simple binary floating point operators.
287 FADD
, FSUB
, FMUL
, FDIV
, FREM
,
289 /// Constrained versions of the binary floating point operators.
290 /// These will be lowered to the simple operators before final selection.
291 /// They are used to limit optimizations while the DAG is being
293 STRICT_FADD
, STRICT_FSUB
, STRICT_FMUL
, STRICT_FDIV
, STRICT_FREM
,
296 /// Constrained versions of libm-equivalent floating point intrinsics.
297 /// These will be lowered to the equivalent non-constrained pseudo-op
298 /// (or expanded to the equivalent library call) before final selection.
299 /// They are used to limit optimizations while the DAG is being optimized.
300 STRICT_FSQRT
, STRICT_FPOW
, STRICT_FPOWI
, STRICT_FSIN
, STRICT_FCOS
,
301 STRICT_FEXP
, STRICT_FEXP2
, STRICT_FLOG
, STRICT_FLOG10
, STRICT_FLOG2
,
302 STRICT_FRINT
, STRICT_FNEARBYINT
, STRICT_FMAXNUM
, STRICT_FMINNUM
,
303 STRICT_FCEIL
, STRICT_FFLOOR
, STRICT_FROUND
, STRICT_FTRUNC
,
304 STRICT_LROUND
, STRICT_LLROUND
, STRICT_LRINT
, STRICT_LLRINT
,
306 /// STRICT_FP_TO_[US]INT - Convert a floating point value to a signed or
307 /// unsigned integer. These have the same semantics as fptosi and fptoui
309 /// They are used to limit optimizations while the DAG is being optimized.
313 /// X = STRICT_FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating
314 /// point type down to the precision of the destination VT. TRUNC is a
315 /// flag, which is always an integer that is zero or one. If TRUNC is 0,
316 /// this is a normal rounding, if it is 1, this FP_ROUND is known to not
317 /// change the value of Y.
319 /// The TRUNC = 1 case is used in cases where we know that the value will
320 /// not be modified by the node, because Y is not using any of the extra
321 /// precision of source type. This allows certain transformations like
322 /// STRICT_FP_EXTEND(STRICT_FP_ROUND(X,1)) -> X which are not safe for
323 /// STRICT_FP_EXTEND(STRICT_FP_ROUND(X,0)) because the extra bits aren't
325 /// It is used to limit optimizations while the DAG is being optimized.
328 /// X = STRICT_FP_EXTEND(Y) - Extend a smaller FP type into a larger FP
330 /// It is used to limit optimizations while the DAG is being optimized.
333 /// FMA - Perform a * b + c with no intermediate rounding step.
336 /// FMAD - Perform a * b + c, while getting the same result as the
337 /// separately rounded operations.
340 /// FCOPYSIGN(X, Y) - Return the value of X with the sign of Y. NOTE: This
341 /// DAG node does not require that X and Y have the same type, just that
342 /// they are both floating point. X and the result must have the same type.
343 /// FCOPYSIGN(f32, f64) is allowed.
346 /// INT = FGETSIGN(FP) - Return the sign bit of the specified floating point
347 /// value as an integer 0/1 value.
350 /// Returns platform specific canonical encoding of a floating point number.
353 /// BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a vector with the
354 /// specified, possibly variable, elements. The number of elements is
355 /// required to be a power of two. The types of the operands must all be
356 /// the same and must match the vector element type, except that integer
357 /// types are allowed to be larger than the element type, in which case
358 /// the operands are implicitly truncated.
361 /// INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element
362 /// at IDX replaced with VAL. If the type of VAL is larger than the vector
363 /// element type then VAL is truncated before replacement.
366 /// EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR
367 /// identified by the (potentially variable) element number IDX. If the
368 /// return type is an integer type larger than the element type of the
369 /// vector, the result is extended to the width of the return type. In
370 /// that case, the high bits are undefined.
373 /// CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of
374 /// vector type with the same length and element type, this produces a
375 /// concatenated vector result value, with length equal to the sum of the
376 /// lengths of the input vectors.
379 /// INSERT_SUBVECTOR(VECTOR1, VECTOR2, IDX) - Returns a vector
380 /// with VECTOR2 inserted into VECTOR1 at the (potentially
381 /// variable) element number IDX, which must be a multiple of the
382 /// VECTOR2 vector length. The elements of VECTOR1 starting at
383 /// IDX are overwritten with VECTOR2. Elements IDX through
384 /// vector_length(VECTOR2) must be valid VECTOR1 indices.
387 /// EXTRACT_SUBVECTOR(VECTOR, IDX) - Returns a subvector from VECTOR (an
388 /// vector value) starting with the element number IDX, which must be a
389 /// constant multiple of the result vector length.
392 /// VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as
393 /// VEC1/VEC2. A VECTOR_SHUFFLE node also contains an array of constant int
394 /// values that indicate which value (or undef) each result element will
395 /// get. These constant ints are accessible through the
396 /// ShuffleVectorSDNode class. This is quite similar to the Altivec
397 /// 'vperm' instruction, except that the indices must be constants and are
398 /// in terms of the element size of VEC1/VEC2, not in terms of bytes.
401 /// SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a
402 /// scalar value into element 0 of the resultant vector type. The top
403 /// elements 1 to N-1 of the N-element vector are undefined. The type
404 /// of the operand must match the vector element type, except when they
405 /// are integer types. In this case the operand is allowed to be wider
406 /// than the vector element type, and is implicitly truncated to it.
409 /// SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL
410 /// duplicated in all lanes. The type of the operand must match the vector
411 /// element type, except when they are integer types. In this case the
412 /// operand is allowed to be wider than the vector element type, and is
413 /// implicitly truncated to it.
416 /// MULHU/MULHS - Multiply high - Multiply two integers of type iN,
417 /// producing an unsigned/signed value of type i[2*N], then return the top
421 /// [US]{MIN/MAX} - Binary minimum or maximum or signed or unsigned
423 SMIN
, SMAX
, UMIN
, UMAX
,
425 /// Bitwise operators - logical and, logical or, logical xor.
428 /// ABS - Determine the unsigned absolute value of a signed integer value of
429 /// the same bitwidth.
430 /// Note: A value of INT_MIN will return INT_MIN, no saturation or overflow
434 /// Shift and rotation operations. After legalization, the type of the
435 /// shift amount is known to be TLI.getShiftAmountTy(). Before legalization
436 /// the shift amount can be any type, but care must be taken to ensure it is
437 /// large enough. TLI.getShiftAmountTy() is i8 on some targets, but before
438 /// legalization, types like i1024 can occur and i8 doesn't have enough bits
439 /// to represent the shift amount.
440 /// When the 1st operand is a vector, the shift amount must be in the same
441 /// type. (TLI.getShiftAmountTy() will return the same type when the input
442 /// type is a vector.)
443 /// For rotates and funnel shifts, the shift amount is treated as an unsigned
444 /// amount modulo the element size of the first operand.
446 /// Funnel 'double' shifts take 3 operands, 2 inputs and the shift amount.
447 /// fshl(X,Y,Z): (X << (Z % BW)) | (Y >> (BW - (Z % BW)))
448 /// fshr(X,Y,Z): (X << (BW - (Z % BW))) | (Y >> (Z % BW))
449 SHL
, SRA
, SRL
, ROTL
, ROTR
, FSHL
, FSHR
,
451 /// Byte Swap and Counting operators.
452 BSWAP
, CTTZ
, CTLZ
, CTPOP
, BITREVERSE
,
454 /// Bit counting operators with an undefined result for zero inputs.
455 CTTZ_ZERO_UNDEF
, CTLZ_ZERO_UNDEF
,
457 /// Select(COND, TRUEVAL, FALSEVAL). If the type of the boolean COND is not
458 /// i1 then the high bits must conform to getBooleanContents.
461 /// Select with a vector condition (op #0) and two vector operands (ops #1
462 /// and #2), returning a vector result. All vectors have the same length.
463 /// Much like the scalar select and setcc, each bit in the condition selects
464 /// whether the corresponding result element is taken from op #1 or op #2.
465 /// At first, the VSELECT condition is of vXi1 type. Later, targets may
466 /// change the condition type in order to match the VSELECT node using a
467 /// pattern. The condition follows the BooleanContent format of the target.
470 /// Select with condition operator - This selects between a true value and
471 /// a false value (ops #2 and #3) based on the boolean result of comparing
472 /// the lhs and rhs (ops #0 and #1) of a conditional expression with the
473 /// condition code in op #4, a CondCodeSDNode.
476 /// SetCC operator - This evaluates to a true value iff the condition is
477 /// true. If the result value type is not i1 then the high bits conform
478 /// to getBooleanContents. The operands to this are the left and right
479 /// operands to compare (ops #0, and #1) and the condition code to compare
480 /// them with (op #2) as a CondCodeSDNode. If the operands are vector types
481 /// then the result type must also be a vector type.
484 /// Like SetCC, ops #0 and #1 are the LHS and RHS operands to compare, but
485 /// op #2 is a boolean indicating if there is an incoming carry. This
486 /// operator checks the result of "LHS - RHS - Carry", and can be used to
487 /// compare two wide integers:
488 /// (setcccarry lhshi rhshi (subcarry lhslo rhslo) cc).
489 /// Only valid for integers.
492 /// SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded
493 /// integer shift operations. The operation ordering is:
494 /// [Lo,Hi] = op [LoLHS,HiLHS], Amt
495 SHL_PARTS
, SRA_PARTS
, SRL_PARTS
,
497 /// Conversion operators. These are all single input single output
498 /// operations. For all of these, the result type must be strictly
499 /// wider or narrower (depending on the operation) than the source
502 /// SIGN_EXTEND - Used for integer types, replicating the sign bit
506 /// ZERO_EXTEND - Used for integer types, zeroing the new bits.
509 /// ANY_EXTEND - Used for integer types. The high bits are undefined.
512 /// TRUNCATE - Completely drop the high bits.
515 /// [SU]INT_TO_FP - These operators convert integers (whose interpreted sign
516 /// depends on the first letter) to floating point.
520 /// SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to
521 /// sign extend a small value in a large integer register (e.g. sign
522 /// extending the low 8 bits of a 32-bit register to fill the top 24 bits
523 /// with the 7th bit). The size of the smaller type is indicated by the 1th
524 /// operand, a ValueType node.
527 /// ANY_EXTEND_VECTOR_INREG(Vector) - This operator represents an
528 /// in-register any-extension of the low lanes of an integer vector. The
529 /// result type must have fewer elements than the operand type, and those
530 /// elements must be larger integer types such that the total size of the
531 /// operand type is less than or equal to the size of the result type. Each
532 /// of the low operand elements is any-extended into the corresponding,
533 /// wider result elements with the high bits becoming undef.
534 /// NOTE: The type legalizer prefers to make the operand and result size
535 /// the same to allow expansion to shuffle vector during op legalization.
536 ANY_EXTEND_VECTOR_INREG
,
538 /// SIGN_EXTEND_VECTOR_INREG(Vector) - This operator represents an
539 /// in-register sign-extension of the low lanes of an integer vector. The
540 /// result type must have fewer elements than the operand type, and those
541 /// elements must be larger integer types such that the total size of the
542 /// operand type is less than or equal to the size of the result type. Each
543 /// of the low operand elements is sign-extended into the corresponding,
544 /// wider result elements.
545 /// NOTE: The type legalizer prefers to make the operand and result size
546 /// the same to allow expansion to shuffle vector during op legalization.
547 SIGN_EXTEND_VECTOR_INREG
,
549 /// ZERO_EXTEND_VECTOR_INREG(Vector) - This operator represents an
550 /// in-register zero-extension of the low lanes of an integer vector. The
551 /// result type must have fewer elements than the operand type, and those
552 /// elements must be larger integer types such that the total size of the
553 /// operand type is less than or equal to the size of the result type. Each
554 /// of the low operand elements is zero-extended into the corresponding,
555 /// wider result elements.
556 /// NOTE: The type legalizer prefers to make the operand and result size
557 /// the same to allow expansion to shuffle vector during op legalization.
558 ZERO_EXTEND_VECTOR_INREG
,
560 /// FP_TO_[US]INT - Convert a floating point value to a signed or unsigned
561 /// integer. These have the same semantics as fptosi and fptoui in IR. If
562 /// the FP value cannot fit in the integer type, the results are undefined.
566 /// X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type
567 /// down to the precision of the destination VT. TRUNC is a flag, which is
568 /// always an integer that is zero or one. If TRUNC is 0, this is a
569 /// normal rounding, if it is 1, this FP_ROUND is known to not change the
572 /// The TRUNC = 1 case is used in cases where we know that the value will
573 /// not be modified by the node, because Y is not using any of the extra
574 /// precision of source type. This allows certain transformations like
575 /// FP_EXTEND(FP_ROUND(X,1)) -> X which are not safe for
576 /// FP_EXTEND(FP_ROUND(X,0)) because the extra bits aren't removed.
579 /// FLT_ROUNDS_ - Returns current rounding mode:
582 /// 1 Round to nearest
587 /// X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
590 /// BITCAST - This operator converts between integer, vector and FP
591 /// values, as if the value was stored to memory with one type and loaded
592 /// from the same address with the other type (or equivalently for vector
593 /// format conversions, etc). The source and result are required to have
594 /// the same bit size (e.g. f32 <-> i32). This can also be used for
595 /// int-to-int or fp-to-fp conversions, but that is a noop, deleted by
598 /// This operator is subtly different from the bitcast instruction from
599 /// LLVM-IR since this node may change the bits in the register. For
600 /// example, this occurs on big-endian NEON and big-endian MSA where the
601 /// layout of the bits in the register depends on the vector type and this
602 /// operator acts as a shuffle operation for some vector type combinations.
605 /// ADDRSPACECAST - This operator converts between pointers of different
609 /// FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions
610 /// and truncation for half-precision (16 bit) floating numbers. These nodes
611 /// form a semi-softened interface for dealing with f16 (as an i16), which
612 /// is often a storage-only type but has native conversions.
613 FP16_TO_FP
, FP_TO_FP16
,
615 /// Perform various unary floating-point operations inspired by libm. For
616 /// FPOWI, the result is undefined if if the integer operand doesn't fit
618 FNEG
, FABS
, FSQRT
, FCBRT
, FSIN
, FCOS
, FPOWI
, FPOW
,
619 FLOG
, FLOG2
, FLOG10
, FEXP
, FEXP2
,
620 FCEIL
, FTRUNC
, FRINT
, FNEARBYINT
, FROUND
, FFLOOR
,
621 LROUND
, LLROUND
, LRINT
, LLRINT
,
623 /// FMINNUM/FMAXNUM - Perform floating-point minimum or maximum on two
626 /// In the case where a single input is a NaN (either signaling or quiet),
627 /// the non-NaN input is returned.
629 /// The return value of (FMINNUM 0.0, -0.0) could be either 0.0 or -0.0.
632 /// FMINNUM_IEEE/FMAXNUM_IEEE - Perform floating-point minimum or maximum on
633 /// two values, following the IEEE-754 2008 definition. This differs from
634 /// FMINNUM/FMAXNUM in the handling of signaling NaNs. If one input is a
635 /// signaling NaN, returns a quiet NaN.
636 FMINNUM_IEEE
, FMAXNUM_IEEE
,
638 /// FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0
639 /// as less than 0.0. While FMINNUM_IEEE/FMAXNUM_IEEE follow IEEE 754-2008
640 /// semantics, FMINIMUM/FMAXIMUM follow IEEE 754-2018 draft semantics.
643 /// FSINCOS - Compute both fsin and fcos as a single operation.
646 /// LOAD and STORE have token chains as their first operand, then the same
647 /// operands as an LLVM load/store instruction, then an offset node that
648 /// is added / subtracted from the base pointer to form the address (for
649 /// indexed memory ops).
652 /// DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned
653 /// to a specified boundary. This node always has two return values: a new
654 /// stack pointer value and a chain. The first operand is the token chain,
655 /// the second is the number of bytes to allocate, and the third is the
656 /// alignment boundary. The size is guaranteed to be a multiple of the
657 /// stack alignment, and the alignment is guaranteed to be bigger than the
658 /// stack alignment (if required) or 0 to get standard stack alignment.
661 /// Control flow instructions. These all have token chains.
663 /// BR - Unconditional branch. The first operand is the chain
664 /// operand, the second is the MBB to branch to.
667 /// BRIND - Indirect branch. The first operand is the chain, the second
668 /// is the value to branch to, which must be of the same type as the
669 /// target's pointer type.
672 /// BR_JT - Jumptable branch. The first operand is the chain, the second
673 /// is the jumptable index, the last one is the jumptable entry index.
676 /// BRCOND - Conditional branch. The first operand is the chain, the
677 /// second is the condition, the third is the block to branch to if the
678 /// condition is true. If the type of the condition is not i1, then the
679 /// high bits must conform to getBooleanContents.
682 /// BR_CC - Conditional branch. The behavior is like that of SELECT_CC, in
683 /// that the condition is represented as condition code, and two nodes to
684 /// compare, rather than as a combined SetCC node. The operands in order
685 /// are chain, cc, lhs, rhs, block to branch to if condition is true.
688 /// INLINEASM - Represents an inline asm block. This node always has two
689 /// return values: a chain and a flag result. The inputs are as follows:
690 /// Operand #0 : Input chain.
691 /// Operand #1 : a ExternalSymbolSDNode with a pointer to the asm string.
692 /// Operand #2 : a MDNodeSDNode with the !srcloc metadata.
693 /// Operand #3 : HasSideEffect, IsAlignStack bits.
694 /// After this, it is followed by a list of operands with this format:
695 /// ConstantSDNode: Flags that encode whether it is a mem or not, the
696 /// of operands that follow, etc. See InlineAsm.h.
697 /// ... however many operands ...
698 /// Operand #last: Optional, an incoming flag.
700 /// The variable width operands are required to represent target addressing
701 /// modes as a single "operand", even though they may have multiple
705 /// INLINEASM_BR - Terminator version of inline asm. Used by asm-goto.
708 /// EH_LABEL - Represents a label in mid basic block used to track
709 /// locations needed for debug and exception handling tables. These nodes
710 /// take a chain as input and return a chain.
713 /// ANNOTATION_LABEL - Represents a mid basic block label used by
714 /// annotations. This should remain within the basic block and be ordered
715 /// with respect to other call instructions, but loads and stores may float
719 /// CATCHPAD - Represents a catchpad instruction.
722 /// CATCHRET - Represents a return from a catch block funclet. Used for
723 /// MSVC compatible exception handling. Takes a chain operand and a
724 /// destination basic block operand.
727 /// CLEANUPRET - Represents a return from a cleanup block funclet. Used for
728 /// MSVC compatible exception handling. Takes only a chain operand.
731 /// STACKSAVE - STACKSAVE has one operand, an input chain. It produces a
732 /// value, the same type as the pointer type for the system, and an output
736 /// STACKRESTORE has two operands, an input chain and a pointer to restore
737 /// to it returns an output chain.
740 /// CALLSEQ_START/CALLSEQ_END - These operators mark the beginning and end
741 /// of a call sequence, and carry arbitrary information that target might
742 /// want to know. The first operand is a chain, the rest are specified by
743 /// the target and not touched by the DAG optimizers.
744 /// Targets that may use stack to pass call arguments define additional
746 /// - size of the call frame part that must be set up within the
747 /// CALLSEQ_START..CALLSEQ_END pair,
748 /// - part of the call frame prepared prior to CALLSEQ_START.
749 /// Both these parameters must be constants, their sum is the total call
751 /// CALLSEQ_START..CALLSEQ_END pairs may not be nested.
752 CALLSEQ_START
, // Beginning of a call sequence
753 CALLSEQ_END
, // End of a call sequence
755 /// VAARG - VAARG has four operands: an input chain, a pointer, a SRCVALUE,
756 /// and the alignment. It returns a pair of values: the vaarg value and a
760 /// VACOPY - VACOPY has 5 operands: an input chain, a destination pointer,
761 /// a source pointer, a SRCVALUE for the destination, and a SRCVALUE for the
765 /// VAEND, VASTART - VAEND and VASTART have three operands: an input chain,
766 /// pointer, and a SRCVALUE.
769 /// SRCVALUE - This is a node type that holds a Value* that is used to
770 /// make reference to a value in the LLVM IR.
773 /// MDNODE_SDNODE - This is a node that holdes an MDNode*, which is used to
774 /// reference metadata in the IR.
777 /// PCMARKER - This corresponds to the pcmarker intrinsic.
780 /// READCYCLECOUNTER - This corresponds to the readcyclecounter intrinsic.
781 /// It produces a chain and one i64 value. The only operand is a chain.
782 /// If i64 is not legal, the result will be expanded into smaller values.
783 /// Still, it returns an i64, so targets should set legality for i64.
784 /// The result is the content of the architecture-specific cycle
785 /// counter-like register (or other high accuracy low latency clock source).
788 /// HANDLENODE node - Used as a handle for various purposes.
791 /// INIT_TRAMPOLINE - This corresponds to the init_trampoline intrinsic. It
792 /// takes as input a token chain, the pointer to the trampoline, the pointer
793 /// to the nested function, the pointer to pass for the 'nest' parameter, a
794 /// SRCVALUE for the trampoline and another for the nested function
795 /// (allowing targets to access the original Function*).
796 /// It produces a token chain as output.
799 /// ADJUST_TRAMPOLINE - This corresponds to the adjust_trampoline intrinsic.
800 /// It takes a pointer to the trampoline and produces a (possibly) new
801 /// pointer to the same trampoline with platform-specific adjustments
802 /// applied. The pointer it returns points to an executable block of code.
805 /// TRAP - Trapping instruction
808 /// DEBUGTRAP - Trap intended to get the attention of a debugger.
811 /// PREFETCH - This corresponds to a prefetch intrinsic. The first operand
812 /// is the chain. The other operands are the address to prefetch,
813 /// read / write specifier, locality specifier and instruction / data cache
817 /// OUTCHAIN = ATOMIC_FENCE(INCHAIN, ordering, scope)
818 /// This corresponds to the fence instruction. It takes an input chain, and
819 /// two integer constants: an AtomicOrdering and a SynchronizationScope.
822 /// Val, OUTCHAIN = ATOMIC_LOAD(INCHAIN, ptr)
823 /// This corresponds to "load atomic" instruction.
826 /// OUTCHAIN = ATOMIC_STORE(INCHAIN, ptr, val)
827 /// This corresponds to "store atomic" instruction.
830 /// Val, OUTCHAIN = ATOMIC_CMP_SWAP(INCHAIN, ptr, cmp, swap)
831 /// For double-word atomic operations:
832 /// ValLo, ValHi, OUTCHAIN = ATOMIC_CMP_SWAP(INCHAIN, ptr, cmpLo, cmpHi,
834 /// This corresponds to the cmpxchg instruction.
837 /// Val, Success, OUTCHAIN
838 /// = ATOMIC_CMP_SWAP_WITH_SUCCESS(INCHAIN, ptr, cmp, swap)
839 /// N.b. this is still a strong cmpxchg operation, so
840 /// Success == "Val == cmp".
841 ATOMIC_CMP_SWAP_WITH_SUCCESS
,
843 /// Val, OUTCHAIN = ATOMIC_SWAP(INCHAIN, ptr, amt)
844 /// Val, OUTCHAIN = ATOMIC_LOAD_[OpName](INCHAIN, ptr, amt)
845 /// For double-word atomic operations:
846 /// ValLo, ValHi, OUTCHAIN = ATOMIC_SWAP(INCHAIN, ptr, amtLo, amtHi)
847 /// ValLo, ValHi, OUTCHAIN = ATOMIC_LOAD_[OpName](INCHAIN, ptr, amtLo, amtHi)
848 /// These correspond to the atomicrmw instruction.
864 // Masked load and store - consecutive vector load and store operations
865 // with additional mask operand that prevents memory accesses to the
868 // Val, OutChain = MLOAD(BasePtr, Mask, PassThru)
869 // OutChain = MSTORE(Value, BasePtr, Mask)
872 // Masked gather and scatter - load and store operations for a vector of
873 // random addresses with additional mask operand that prevents memory
874 // accesses to the masked-off lanes.
876 // Val, OutChain = GATHER(InChain, PassThru, Mask, BasePtr, Index, Scale)
877 // OutChain = SCATTER(InChain, Value, Mask, BasePtr, Index, Scale)
879 // The Index operand can have more vector elements than the other operands
880 // due to type legalization. The extra elements are ignored.
883 /// This corresponds to the llvm.lifetime.* intrinsics. The first operand
884 /// is the chain and the second operand is the alloca pointer.
885 LIFETIME_START
, LIFETIME_END
,
887 /// GC_TRANSITION_START/GC_TRANSITION_END - These operators mark the
888 /// beginning and end of GC transition sequence, and carry arbitrary
889 /// information that target might need for lowering. The first operand is
890 /// a chain, the rest are specified by the target and not touched by the DAG
891 /// optimizers. GC_TRANSITION_START..GC_TRANSITION_END pairs may not be
896 /// GET_DYNAMIC_AREA_OFFSET - get offset from native SP to the address of
897 /// the most recent dynamic alloca. For most targets that would be 0, but
898 /// for some others (e.g. PowerPC, PowerPC64) that would be compile-time
899 /// known nonzero constant. The only operand here is the chain.
900 GET_DYNAMIC_AREA_OFFSET
,
902 /// Generic reduction nodes. These nodes represent horizontal vector
903 /// reduction operations, producing a scalar result.
904 /// The STRICT variants perform reductions in sequential order. The first
905 /// operand is an initial scalar accumulator value, and the second operand
906 /// is the vector to reduce.
907 VECREDUCE_STRICT_FADD
, VECREDUCE_STRICT_FMUL
,
908 /// These reductions are non-strict, and have a single vector operand.
909 VECREDUCE_FADD
, VECREDUCE_FMUL
,
910 /// FMIN/FMAX nodes can have flags, for NaN/NoNaN variants.
911 VECREDUCE_FMAX
, VECREDUCE_FMIN
,
912 /// Integer reductions may have a result type larger than the vector element
913 /// type. However, the reduction is performed using the vector element type
914 /// and the value in the top bits is unspecified.
915 VECREDUCE_ADD
, VECREDUCE_MUL
,
916 VECREDUCE_AND
, VECREDUCE_OR
, VECREDUCE_XOR
,
917 VECREDUCE_SMAX
, VECREDUCE_SMIN
, VECREDUCE_UMAX
, VECREDUCE_UMIN
,
919 /// BUILTIN_OP_END - This must be the last enum value in this list.
920 /// The target-specific pre-isel opcode values start here.
924 /// FIRST_TARGET_MEMORY_OPCODE - Target-specific pre-isel operations
925 /// which do not reference a specific memory location should be less than
926 /// this value. Those that do must not be less than this value, and can
927 /// be used with SelectionDAG::getMemIntrinsicNode.
928 static const int FIRST_TARGET_MEMORY_OPCODE
= BUILTIN_OP_END
+400;
930 //===--------------------------------------------------------------------===//
931 /// MemIndexedMode enum - This enum defines the load / store indexed
932 /// addressing modes.
934 /// UNINDEXED "Normal" load / store. The effective address is already
935 /// computed and is available in the base pointer. The offset
936 /// operand is always undefined. In addition to producing a
937 /// chain, an unindexed load produces one value (result of the
938 /// load); an unindexed store does not produce a value.
940 /// PRE_INC Similar to the unindexed mode where the effective address is
941 /// PRE_DEC the value of the base pointer add / subtract the offset.
942 /// It considers the computation as being folded into the load /
943 /// store operation (i.e. the load / store does the address
944 /// computation as well as performing the memory transaction).
945 /// The base operand is always undefined. In addition to
946 /// producing a chain, pre-indexed load produces two values
947 /// (result of the load and the result of the address
948 /// computation); a pre-indexed store produces one value (result
949 /// of the address computation).
951 /// POST_INC The effective address is the value of the base pointer. The
952 /// POST_DEC value of the offset operand is then added to / subtracted
953 /// from the base after memory transaction. In addition to
954 /// producing a chain, post-indexed load produces two values
955 /// (the result of the load and the result of the base +/- offset
956 /// computation); a post-indexed store produces one value (the
957 /// the result of the base +/- offset computation).
958 enum MemIndexedMode
{
966 static const int LAST_INDEXED_MODE
= POST_DEC
+ 1;
968 //===--------------------------------------------------------------------===//
969 /// MemIndexType enum - This enum defines how to interpret MGATHER/SCATTER's
970 /// index parameter when calculating addresses.
972 /// SIGNED_SCALED Addr = Base + ((signed)Index * sizeof(element))
973 /// SIGNED_UNSCALED Addr = Base + (signed)Index
974 /// UNSIGNED_SCALED Addr = Base + ((unsigned)Index * sizeof(element))
975 /// UNSIGNED_UNSCALED Addr = Base + (unsigned)Index
983 static const int LAST_MEM_INDEX_TYPE
= UNSIGNED_UNSCALED
+ 1;
985 //===--------------------------------------------------------------------===//
986 /// LoadExtType enum - This enum defines the three variants of LOADEXT
987 /// (load with extension).
989 /// SEXTLOAD loads the integer operand and sign extends it to a larger
990 /// integer result type.
991 /// ZEXTLOAD loads the integer operand and zero extends it to a larger
992 /// integer result type.
993 /// EXTLOAD is used for two things: floating point extending loads and
994 /// integer extending loads [the top bits are undefined].
1002 static const int LAST_LOADEXT_TYPE
= ZEXTLOAD
+ 1;
1004 NodeType
getExtForLoadExtType(bool IsFP
, LoadExtType
);
1006 //===--------------------------------------------------------------------===//
1007 /// ISD::CondCode enum - These are ordered carefully to make the bitfields
1008 /// below work out, when considering SETFALSE (something that never exists
1009 /// dynamically) as 0. "U" -> Unsigned (for integer operands) or Unordered
1010 /// (for floating point), "L" -> Less than, "G" -> Greater than, "E" -> Equal
1011 /// to. If the "N" column is 1, the result of the comparison is undefined if
1012 /// the input is a NAN.
1014 /// All of these (except for the 'always folded ops') should be handled for
1015 /// floating point. For integer, only the SETEQ,SETNE,SETLT,SETLE,SETGT,
1016 /// SETGE,SETULT,SETULE,SETUGT, and SETUGE opcodes are used.
1018 /// Note that these are laid out in a specific order to allow bit-twiddling
1019 /// to transform conditions.
1021 // Opcode N U L G E Intuitive operation
1022 SETFALSE
, // 0 0 0 0 Always false (always folded)
1023 SETOEQ
, // 0 0 0 1 True if ordered and equal
1024 SETOGT
, // 0 0 1 0 True if ordered and greater than
1025 SETOGE
, // 0 0 1 1 True if ordered and greater than or equal
1026 SETOLT
, // 0 1 0 0 True if ordered and less than
1027 SETOLE
, // 0 1 0 1 True if ordered and less than or equal
1028 SETONE
, // 0 1 1 0 True if ordered and operands are unequal
1029 SETO
, // 0 1 1 1 True if ordered (no nans)
1030 SETUO
, // 1 0 0 0 True if unordered: isnan(X) | isnan(Y)
1031 SETUEQ
, // 1 0 0 1 True if unordered or equal
1032 SETUGT
, // 1 0 1 0 True if unordered or greater than
1033 SETUGE
, // 1 0 1 1 True if unordered, greater than, or equal
1034 SETULT
, // 1 1 0 0 True if unordered or less than
1035 SETULE
, // 1 1 0 1 True if unordered, less than, or equal
1036 SETUNE
, // 1 1 1 0 True if unordered or not equal
1037 SETTRUE
, // 1 1 1 1 Always true (always folded)
1038 // Don't care operations: undefined if the input is a nan.
1039 SETFALSE2
, // 1 X 0 0 0 Always false (always folded)
1040 SETEQ
, // 1 X 0 0 1 True if equal
1041 SETGT
, // 1 X 0 1 0 True if greater than
1042 SETGE
, // 1 X 0 1 1 True if greater than or equal
1043 SETLT
, // 1 X 1 0 0 True if less than
1044 SETLE
, // 1 X 1 0 1 True if less than or equal
1045 SETNE
, // 1 X 1 1 0 True if not equal
1046 SETTRUE2
, // 1 X 1 1 1 Always true (always folded)
1048 SETCC_INVALID
// Marker value.
1051 /// Return true if this is a setcc instruction that performs a signed
1052 /// comparison when used with integer operands.
1053 inline bool isSignedIntSetCC(CondCode Code
) {
1054 return Code
== SETGT
|| Code
== SETGE
|| Code
== SETLT
|| Code
== SETLE
;
1057 /// Return true if this is a setcc instruction that performs an unsigned
1058 /// comparison when used with integer operands.
1059 inline bool isUnsignedIntSetCC(CondCode Code
) {
1060 return Code
== SETUGT
|| Code
== SETUGE
|| Code
== SETULT
|| Code
== SETULE
;
1063 /// Return true if the specified condition returns true if the two operands to
1064 /// the condition are equal. Note that if one of the two operands is a NaN,
1065 /// this value is meaningless.
1066 inline bool isTrueWhenEqual(CondCode Cond
) {
1067 return ((int)Cond
& 1) != 0;
1070 /// This function returns 0 if the condition is always false if an operand is
1071 /// a NaN, 1 if the condition is always true if the operand is a NaN, and 2 if
1072 /// the condition is undefined if the operand is a NaN.
1073 inline unsigned getUnorderedFlavor(CondCode Cond
) {
1074 return ((int)Cond
>> 3) & 3;
1077 /// Return the operation corresponding to !(X op Y), where 'op' is a valid
1078 /// SetCC operation.
1079 CondCode
getSetCCInverse(CondCode Operation
, bool isInteger
);
1081 /// Return the operation corresponding to (Y op X) when given the operation
1083 CondCode
getSetCCSwappedOperands(CondCode Operation
);
1085 /// Return the result of a logical OR between different comparisons of
1086 /// identical values: ((X op1 Y) | (X op2 Y)). This function returns
1087 /// SETCC_INVALID if it is not possible to represent the resultant comparison.
1088 CondCode
getSetCCOrOperation(CondCode Op1
, CondCode Op2
, bool isInteger
);
1090 /// Return the result of a logical AND between different comparisons of
1091 /// identical values: ((X op1 Y) & (X op2 Y)). This function returns
1092 /// SETCC_INVALID if it is not possible to represent the resultant comparison.
1093 CondCode
getSetCCAndOperation(CondCode Op1
, CondCode Op2
, bool isInteger
);
1095 } // end llvm::ISD namespace
1097 } // end llvm namespace