;; Machine Description for LoongArch for GNU compiler.
;; Copyright (C) 2021-2024 Free Software Foundation, Inc.
;; Contributed by Loongson Ltd.
;; Based on MIPS target for GNU compiler.
;; This file is part of GCC.
;; GCC is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3, or (at your option)
;; any later version.
;; GCC is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GCC; see the file COPYING3. If not see
;; .
(define_c_enum "unspec" [
;; Integer operations that are too cumbersome to describe directly.
UNSPEC_REVB_2H
UNSPEC_REVB_4H
UNSPEC_REVH_D
;; Floating-point moves.
UNSPEC_LOAD_LOW
UNSPEC_LOAD_HIGH
UNSPEC_STORE_WORD
UNSPEC_MOVGR2FRH
UNSPEC_MOVFRH2GR
;; Floating point unspecs.
UNSPEC_FRINT
UNSPEC_FCLASS
UNSPEC_FMAX
UNSPEC_FMIN
UNSPEC_FTINT
UNSPEC_FTINTRM
UNSPEC_FTINTRP
UNSPEC_FSCALEB
UNSPEC_FLOGB
;; Override return address for exception handling.
UNSPEC_EH_RETURN
;; Bit operation
UNSPEC_BITREV_4B
UNSPEC_BITREV_8B
;; TLS
UNSPEC_TLS
UNSPEC_TLS_DESC
UNSPEC_TLS_DESC_OFF64
;; Stack tie
UNSPEC_TIE
;; RSQRT
UNSPEC_RSQRT
UNSPEC_RSQRTE
;; RECIP
UNSPEC_RECIPE
;; CRC
UNSPEC_CRC
UNSPEC_CRCC
UNSPEC_LOAD_FROM_GOT
UNSPEC_PCALAU12I
UNSPEC_PCALAU12I_GR
UNSPEC_ADD_TLS_LE_RELAX
UNSPEC_ORI_L_LO12
UNSPEC_LUI_L_HI20
UNSPEC_LUI_H_LO20
UNSPEC_LUI_H_HI12
UNSPEC_TLS_LOW
;; Fake div.w[u] mod.w[u]
UNSPEC_FAKE_ANY_DIV
UNSPEC_SIBCALL_VALUE_MULTIPLE_INTERNAL_1
UNSPEC_CALL_VALUE_MULTIPLE_INTERNAL_1
UNSPEC_LOAD_SYMBOL_OFFSET64
UNSPEC_LA_PCREL_64_PART1
UNSPEC_LA_PCREL_64_PART2
])
(define_c_enum "unspecv" [
;; Blockage and synchronisation.
UNSPECV_BLOCKAGE
UNSPECV_DBAR
UNSPECV_IBAR
;; Privileged instructions
UNSPECV_CSRRD
UNSPECV_CSRWR
UNSPECV_CSRXCHG
UNSPECV_IOCSRRD
UNSPECV_IOCSRWR
UNSPECV_CACOP
UNSPECV_LDDIR
UNSPECV_LDPTE
UNSPECV_ERTN
;; Stack checking.
UNSPECV_PROBE_STACK_RANGE
;; Floating-point environment.
UNSPECV_MOVFCSR2GR
UNSPECV_MOVGR2FCSR
;; Others
UNSPECV_CPUCFG
UNSPECV_ASRTLE_D
UNSPECV_ASRTGT_D
UNSPECV_SYSCALL
UNSPECV_BREAK
])
(define_constants
[(RETURN_ADDR_REGNUM 1)
(TP_REGNUM 2)
(T0_REGNUM 12)
(T1_REGNUM 13)
(S0_REGNUM 23)
(FCC0_REGNUM 64)
(FCC1_REGNUM 65)
(FCC2_REGNUM 66)
(FCC3_REGNUM 67)
(FCC4_REGNUM 68)
(FCC5_REGNUM 69)
(FCC6_REGNUM 70)
(FCC7_REGNUM 71)
;; Return path styles
(NORMAL_RETURN 0)
(SIBCALL_RETURN 1)
(EXCEPTION_RETURN 2)
;; PIC long branch sequences are never longer than 100 bytes.
(MAX_PIC_BRANCH_LENGTH 100)
])
(include "predicates.md")
(include "constraints.md")
;; ....................
;;
;; Attributes
;;
;; ....................
(define_attr "enabled" "no,yes" (const_string "yes"))
(define_attr "got" "unset,load"
(const_string "unset"))
;; For jirl instructions, this attribute is DIRECT when the target address
;; is symbolic and INDIRECT when it is a register.
(define_attr "jirl" "unset,direct,indirect"
(const_string "unset"))
;; Classification of moves, extensions and truncations. Most values
;; are as for "type" (see below) but there are also the following
;; move-specific values:
;;
;; sll0 "slli.w DEST,SRC,0", which on 64-bit targets is guaranteed
;; to produce a sign-extended DEST, even if SRC is not
;; properly sign-extended
;; pick_ins BSTRPICK.W, BSTRPICK.D, BSTRINS.W or BSTRINS.D instruction
;; andi a single ANDI instruction
;; shift_shift a shift left followed by a shift right
;;
;; This attribute is used to determine the instruction's length and
;; scheduling type. For doubleword moves, the attribute always describes
;; the split instructions; in some cases, it is more appropriate for the
;; scheduling type to be "multi" instead.
(define_attr "move_type"
"unknown,load,fpload,store,fpstore,mgtf,mftg,imul,move,fmove,
const,signext,pick_ins,logical,arith,sll0,andi,shift_shift"
(const_string "unknown"))
(define_attr "alu_type" "unknown,add,sub,not,nor,and,or,xor,simd_add"
(const_string "unknown"))
;; Main data type used by the insn
(define_attr "mode" "unknown,none,QI,HI,SI,DI,TI,SF,DF,TF,FCC,
V2DI,V4SI,V8HI,V16QI,V2DF,V4SF,V4DI,V8SI,V16HI,V32QI,V4DF,V8SF"
(const_string "unknown"))
;; True if the main data type is twice the size of a word.
(define_attr "dword_mode" "no,yes"
(cond [(and (eq_attr "mode" "DI,DF")
(not (match_test "TARGET_64BIT")))
(const_string "yes")
(and (eq_attr "mode" "TI,TF")
(match_test "TARGET_64BIT"))
(const_string "yes")]
(const_string "no")))
;; True if the main data type is four times of the size of a word.
(define_attr "qword_mode" "no,yes"
(cond [(and (eq_attr "mode" "TI,TF")
(not (match_test "TARGET_64BIT")))
(const_string "yes")]
(const_string "no")))
;; Classification of each insn.
;; branch conditional branch
;; jump unconditional jump
;; call unconditional call
;; load load instruction(s)
;; fpload floating point load
;; fpidxload floating point indexed load
;; store store instruction(s)
;; fpstore floating point store
;; fpidxstore floating point indexed store
;; prefetch memory prefetch (register + offset)
;; prefetchx memory indexed prefetch (register + register)
;; condmove conditional moves
;; mgtf move general-purpose register to floating point register
;; mftg move floating point register to general-purpose register
;; const load constant
;; arith integer arithmetic instructions
;; logical integer logical instructions
;; shift integer shift instructions
;; slt set less than instructions
;; signext sign extend instructions
;; clz the clz and clo instructions
;; trap trap if instructions
;; imul integer multiply
;; idiv integer divide
;; move integer move
;; fmove floating point register move
;; fadd floating point add/subtract
;; fmul floating point multiply
;; fmadd floating point multiply-add
;; fdiv floating point divide
;; frdiv floating point reciprocal divide
;; frecipe floating point approximate reciprocal
;; fabs floating point absolute value
;; flogb floating point exponent extract
;; fneg floating point negation
;; fcmp floating point compare
;; fcopysign floating point copysign
;; fcvt floating point convert
;; fscaleb floating point scale
;; fsqrt floating point square root
;; frsqrt floating point reciprocal square root
;; frsqrte floating point approximate reciprocal square root
;; multi multiword sequence (or user asm statements)
;; atomic atomic memory update instruction
;; syncloop memory atomic operation implemented as a sync loop
;; nop no operation
;; ghost an instruction that produces no real code
(define_attr "type"
"unknown,branch,jump,call,load,fpload,fpidxload,store,fpstore,fpidxstore,
prefetch,prefetchx,condmove,mgtf,mftg,const,arith,logical,
shift,slt,signext,clz,trap,imul,idiv,move,
fmove,fadd,fmul,fmadd,fdiv,frdiv,frecipe,fabs,flogb,fneg,fcmp,fcopysign,fcvt,
fscaleb,fsqrt,frsqrt,frsqrte,accext,accmod,multi,atomic,syncloop,nop,ghost,
simd_div,simd_fclass,simd_flog2,simd_fadd,simd_fcvt,simd_fmul,simd_fmadd,
simd_fdiv,simd_bitins,simd_bitmov,simd_insert,simd_sld,simd_mul,simd_fcmp,
simd_fexp2,simd_int_arith,simd_bit,simd_shift,simd_splat,simd_fill,
simd_permute,simd_shf,simd_sat,simd_pcnt,simd_copy,simd_branch,simd_clsx,
simd_fminmax,simd_logic,simd_move,simd_load,simd_store"
(cond [(eq_attr "jirl" "!unset") (const_string "call")
(eq_attr "got" "load") (const_string "load")
(eq_attr "alu_type" "add,sub") (const_string "arith")
(eq_attr "alu_type" "not,nor,and,or,xor") (const_string "logical")
;; If a doubleword move uses these expensive instructions,
;; it is usually better to schedule them in the same way
;; as the singleword form, rather than as "multi".
(eq_attr "move_type" "load") (const_string "load")
(eq_attr "move_type" "fpload") (const_string "fpload")
(eq_attr "move_type" "store") (const_string "store")
(eq_attr "move_type" "fpstore") (const_string "fpstore")
(eq_attr "move_type" "mgtf") (const_string "mgtf")
(eq_attr "move_type" "mftg") (const_string "mftg")
;; These types of move are always single insns.
(eq_attr "move_type" "imul") (const_string "imul")
(eq_attr "move_type" "fmove") (const_string "fmove")
(eq_attr "move_type" "signext") (const_string "signext")
(eq_attr "move_type" "pick_ins") (const_string "arith")
(eq_attr "move_type" "arith") (const_string "arith")
(eq_attr "move_type" "logical") (const_string "logical")
(eq_attr "move_type" "sll0") (const_string "shift")
(eq_attr "move_type" "andi") (const_string "logical")
;; These types of move are always split.
(eq_attr "move_type" "shift_shift")
(const_string "multi")
;; These types of move are split for quadword modes only.
(and (eq_attr "move_type" "move,const")
(eq_attr "qword_mode" "yes"))
(const_string "multi")
;; These types of move are split for doubleword modes only.
(and (eq_attr "move_type" "move,const")
(eq_attr "dword_mode" "yes"))
(const_string "multi")
(eq_attr "move_type" "move") (const_string "move")
(eq_attr "move_type" "const") (const_string "const")]
(const_string "unknown")))
;; Mode for conversion types (fcvt)
;; I2S integer to float single (SI/DI to SF)
;; I2D integer to float double (SI/DI to DF)
;; S2I float to integer (SF to SI/DI)
;; D2I float to integer (DF to SI/DI)
;; D2S double to float single
;; S2D float single to double
(define_attr "cnv_mode" "unknown,I2S,I2D,S2I,D2I,D2S,S2D"
(const_string "unknown"))
;; The number of individual instructions that a non-branch pattern generates
(define_attr "insn_count" ""
(cond [;; "Ghost" instructions occupy no space.
(eq_attr "type" "ghost")
(const_int 0)
;; Check for doubleword moves that are decomposed into two
;; instructions.
(and (eq_attr "move_type" "mgtf,mftg,move")
(eq_attr "dword_mode" "yes"))
(const_int 2)
;; Check for quadword moves that are decomposed into four
;; instructions.
(and (eq_attr "move_type" "mgtf,mftg,move")
(eq_attr "qword_mode" "yes"))
(const_int 4)
;; Constants, loads and stores are handled by external routines.
(and (eq_attr "move_type" "const")
(eq_attr "dword_mode" "yes"))
(symbol_ref "loongarch_split_const_insns (operands[1])")
(eq_attr "move_type" "const")
(symbol_ref "loongarch_const_insns (operands[1])")
(eq_attr "move_type" "load,fpload")
(symbol_ref "loongarch_load_store_insns (operands[1], insn)")
(eq_attr "move_type" "store,fpstore")
(symbol_ref "loongarch_load_store_insns (operands[0], insn)")
(eq_attr "type" "idiv")
(symbol_ref "loongarch_idiv_insns (GET_MODE (PATTERN (insn)))")]
(const_int 1)))
;; Length of instruction in bytes.
(define_attr "length" ""
(cond [
;; Branch futher than +/- 128 KiB require two instructions.
(eq_attr "type" "branch")
(if_then_else (and (le (minus (match_dup 0) (pc)) (const_int 131064))
(le (minus (pc) (match_dup 0)) (const_int 131068)))
(const_int 4)
(const_int 8))]
(symbol_ref "get_attr_insn_count (insn) * 4")))
;; Describe a user's asm statement.
(define_asm_attributes
[(set_attr "type" "multi")])
;; This mode iterator allows 32-bit and 64-bit GPR patterns to be generated
;; from the same template.
(define_mode_iterator GPR [SI (DI "TARGET_64BIT")])
;; A copy of GPR that can be used when a pattern has two independent
;; modes.
(define_mode_iterator GPR2 [SI (DI "TARGET_64BIT")])
;; This mode iterator allows 16-bit and 32-bit GPR patterns and 32-bit 64-bit
;; FPR patterns to be generated from the same template.
(define_mode_iterator JOIN_MODE [HI
SI
(SF "TARGET_HARD_FLOAT")
(DF "TARGET_DOUBLE_FLOAT")])
;; This mode iterator allows :P to be used for patterns that operate on
;; pointer-sized quantities. Exactly one of the two alternatives will match.
(define_mode_iterator P [(SI "Pmode == SImode") (DI "Pmode == DImode")])
;; Likewise, but for GRLEN-sized quantities.
(define_mode_iterator X [(SI "!TARGET_64BIT") (DI "TARGET_64BIT")])
;; 64-bit modes for which we provide move patterns.
(define_mode_iterator MOVE64 [DI DF])
;; 128-bit modes for which we provide move patterns on 64-bit targets.
(define_mode_iterator MOVE128 [TI TF])
;; Iterator for sub-32-bit integer modes.
(define_mode_iterator SHORT [QI HI])
;; Likewise the 64-bit truncate-and-shift patterns.
(define_mode_iterator SUBDI [QI HI SI])
;; Iterator for scalar fixed point modes.
(define_mode_iterator QHWD [QI HI SI (DI "TARGET_64BIT")])
;; Iterator for hardware-supported floating-point modes.
(define_mode_iterator ANYF [(SF "TARGET_HARD_FLOAT")
(DF "TARGET_DOUBLE_FLOAT")])
;; Iterator for fixed-point modes which can be hold by a hardware
;; floating-point register.
(define_mode_iterator ANYFI [(SI "TARGET_HARD_FLOAT")
(DI "TARGET_DOUBLE_FLOAT")])
;; A mode for which moves involving FPRs may need to be split.
(define_mode_iterator SPLITF
[(DF "!TARGET_64BIT && TARGET_DOUBLE_FLOAT")
(DI "!TARGET_64BIT && TARGET_DOUBLE_FLOAT")
(TF "TARGET_64BIT && TARGET_DOUBLE_FLOAT")])
;; A mode for anything with 32 bits or more, and able to be loaded with
;; the same addressing mode as ld.w.
(define_mode_iterator LD_AT_LEAST_32_BIT [GPR ANYF])
;; A mode for anything able to be stored with the same addressing mode as
;; st.w.
(define_mode_iterator ST_ANY [QHWD ANYF])
;; A mode for anything legal as a input of a div or mod instruction.
(define_mode_iterator DIV [(DI "TARGET_64BIT")
(SI "!TARGET_64BIT || ISA_HAS_DIV32")])
;; In GPR templates, a string like "mul." will expand to "mul.w" in the
;; 32-bit version and "mul.d" in the 64-bit version.
(define_mode_attr d [(SI "w") (DI "d")])
;; This attribute gives the length suffix for a load or store instruction.
;; The same suffixes work for zero and sign extensions.
(define_mode_attr size [(QI "b") (HI "h") (SI "w") (DI "d")])
(define_mode_attr SIZE [(QI "B") (HI "H") (SI "W") (DI "D")])
;; This attribute gives the mode mask of a SHORT.
(define_mode_attr mask [(QI "0x00ff") (HI "0xffff")])
;; This attribute gives the size (bits) of a SHORT.
(define_mode_attr 7_or_15 [(QI "7") (HI "15")])
;; Instruction names for stores.
(define_mode_attr store [(QI "sb") (HI "sh") (SI "sw") (DI "sd")])
;; This attribute gives the format suffix for floating-point operations.
(define_mode_attr fmt [(SF "s") (DF "d")])
(define_mode_attr ifmt [(SI "w") (DI "l")])
;; This attribute gives the upper-case mode name for one unit of a
;; floating-point mode or vector mode.
(define_mode_attr UNITMODE [(SF "SF") (DF "DF") (V2SF "SF") (V4SF "SF")
(V16QI "QI") (V8HI "HI") (V4SI "SI") (V2DI "DI")
(V2DF "DF")(V8SF "SF")(V32QI "QI")(V16HI "HI")(V8SI "SI")(V4DI "DI")(V4DF "DF")])
;; As above, but in lower case.
(define_mode_attr unitmode [(SF "sf") (DF "df") (V2SF "sf") (V4SF "sf")
(V16QI "qi") (V8QI "qi") (V8HI "hi") (V4HI "hi")
(V4SI "si") (V2SI "si") (V2DI "di") (V2DF "df")
(V8SI "si") (V4DI "di") (V32QI "qi") (V16HI "hi")
(V8SF "sf") (V4DF "df")])
;; This attribute gives the integer mode that has half the size of
;; the controlling mode.
(define_mode_attr HALFMODE [(DF "SI") (DI "SI") (V2SF "SI")
(V2SI "SI") (V4HI "SI") (V8QI "SI")
(TF "DI")])
;; This attribute gives the integer mode that has the same size of a
;; floating-point mode.
(define_mode_attr IMODE [(SF "SI") (DF "DI")])
;; This code iterator allows signed and unsigned widening multiplications
;; to use the same template.
(define_code_iterator any_extend [sign_extend zero_extend])
;; This code iterator allows the two right shift instructions to be
;; generated from the same template.
(define_code_iterator any_shiftrt [ashiftrt lshiftrt])
;; This code iterator allows the three shift instructions to be generated
;; from the same template.
(define_code_iterator any_shift [ashift ashiftrt lshiftrt])
;; This code iterator allows the three bitwise instructions to be generated
;; from the same template.
(define_code_iterator any_bitwise [and ior xor])
(define_code_iterator neg_bitwise [and ior])
;; This code iterator allows unsigned and signed division to be generated
;; from the same template.
(define_code_iterator any_div [div udiv mod umod])
;; This code iterator allows addition and subtraction to be generated
;; from the same template.
(define_code_iterator addsub [plus minus])
;; This code iterator allows addition and multiplication to be generated
;; from the same template.
(define_code_iterator addmul [plus mult])
;; This code iterator allows addition subtraction and multiplication to be
;; generated from the same template
(define_code_iterator addsubmul [plus minus mult])
;; This code iterator allows all native floating-point comparisons to be
;; generated from the same template.
(define_code_iterator fcond [unordered uneq unlt unle eq lt le
ordered ltgt ne ge gt unge ungt])
;; Equality operators.
(define_code_iterator equality_op [eq ne])
;; These code iterators allow the signed and unsigned scc operations to use
;; the same template.
(define_code_iterator any_gt [gt gtu])
(define_code_iterator any_lt [lt ltu])
(define_code_iterator any_le [le leu])
(define_code_iterator any_return [return simple_return])
;; expands to an empty string when doing a signed operation and
;; "u" when doing an unsigned operation.
(define_code_attr u [(sign_extend "") (zero_extend "u")
(div "") (udiv "u")
(mod "") (umod "u")
(gt "") (gtu "u")
(ge "") (geu "u")
(lt "") (ltu "u")
(le "") (leu "u")])
;; is like except uppercase.
(define_code_attr U [(sign_extend "") (zero_extend "U")])
;; is like , but the signed form expands to "s" rather than "".
(define_code_attr su [(sign_extend "s") (zero_extend "u")])
(define_code_attr u_bool [(sign_extend "false") (zero_extend "true")])
;; expands to the name of the optab for a particular code.
(define_code_attr optab [(ashift "ashl")
(ashiftrt "ashr")
(lshiftrt "lshr")
(ior "ior")
(xor "xor")
(and "and")
(plus "add")
(minus "sub")
(mult "mul")
(div "div")
(udiv "udiv")
(mod "mod")
(umod "umod")
(return "return")
(simple_return "simple_return")])
;; expands to the name of the insn that implements a particular code.
(define_code_attr insn [(ashift "sll")
(ashiftrt "sra")
(lshiftrt "srl")
(ior "or")
(xor "xor")
(and "and")
(plus "addu")
(minus "subu")
(div "div")
(udiv "div")
(mod "mod")
(umod "mod")])
;; is the fcmp.cond.fmt condition associated with a particular code.
(define_code_attr fcond [(unordered "cun")
(uneq "cueq")
(unlt "cult")
(unle "cule")
(eq "ceq")
(lt "slt")
(le "sle")
(ordered "cor")
(ltgt "sne")
(ne "cune")
(ge "sge")
(gt "sgt")
(unge "cuge")
(ungt "cugt")])
;; The sel mnemonic to use depending on the condition test.
(define_code_attr sel [(eq "masknez") (ne "maskeqz")])
(define_code_attr selinv [(eq "maskeqz") (ne "masknez")])
;; Iterator and attributes for floating-point to fixed-point conversion
;; instructions.
(define_int_iterator LRINT [UNSPEC_FTINT UNSPEC_FTINTRM UNSPEC_FTINTRP])
(define_int_attr lrint_pattern [(UNSPEC_FTINT "lrint")
(UNSPEC_FTINTRM "lfloor")
(UNSPEC_FTINTRP "lceil")])
(define_int_attr lrint_submenmonic [(UNSPEC_FTINT "")
(UNSPEC_FTINTRM "rm")
(UNSPEC_FTINTRP "rp")])
;; Iterator and attributes for bytepick.d
(define_int_iterator bytepick_w_ashift_amount [8 16 24])
(define_int_attr bytepick_w_lshiftrt_amount [(8 "24")
(16 "16")
(24 "8")])
(define_int_iterator bytepick_d_ashift_amount [8 16 24 32 40 48 56])
(define_int_attr bytepick_d_lshiftrt_amount [(8 "56")
(16 "48")
(24 "40")
(32 "32")
(40 "24")
(48 "16")
(56 "8")])
(define_int_attr bytepick_imm [(8 "1")
(16 "2")
(24 "3")
(32 "4")
(40 "5")
(48 "6")
(56 "7")])
;;
;; ....................
;;
;; CONDITIONAL TRAPS
;;
;; ....................
;;
(define_insn "trap"
[(trap_if (const_int 1) (const_int 0))]
""
{
return "break\t0";
}
[(set_attr "type" "trap")])
;;
;; ....................
;;
;; ADDITION
;;
;; ....................
;;
(define_insn "add3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(plus:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fadd.\t%0,%1,%2"
[(set_attr "type" "fadd")
(set_attr "mode" "")])
(define_insn_and_split "*addsi3"
[(set (match_operand:SI 0 "register_operand" "=r,r,r,r,r")
(plus:SI (match_operand:SI 1 "register_operand" "r,r,r,r,r")
(match_operand:SI 2 "plus_si_operand"
"r,I,La,Lb,Le")))]
""
"@
add.w\t%0,%1,%2
addi.w\t%0,%1,%2
#
* operands[2] = GEN_INT (INTVAL (operands[2]) / 65536); \
return \"addu16i.d\t%0,%1,%2\";
#"
"CONST_INT_P (operands[2]) && !IMM12_INT (operands[2]) \
&& !ADDU16I_OPERAND (INTVAL (operands[2]))"
[(set (match_dup 0) (plus:SI (match_dup 1) (match_dup 3)))
(set (match_dup 0) (plus:SI (match_dup 0) (match_dup 4)))]
{
loongarch_split_plus_constant (&operands[2], SImode);
}
[(set_attr "alu_type" "add")
(set_attr "mode" "SI")
(set_attr "insn_count" "1,1,2,1,2")])
(define_expand "addsi3"
[(set (match_operand:SI 0 "register_operand" "=r,r,r,r,r")
(plus:SI (match_operand:SI 1 "register_operand" "r,r,r,r,r")
(match_operand:SI 2 "plus_si_operand" "r,I,La,Le,Lb")))]
"TARGET_64BIT"
{
if (CONST_INT_P (operands[2]) && !IMM12_INT (operands[2])
&& ADDU16I_OPERAND (INTVAL (operands[2])))
{
rtx t1 = gen_reg_rtx (DImode);
rtx t2 = gen_reg_rtx (DImode);
rtx t3 = gen_reg_rtx (DImode);
emit_insn (gen_extend_insn (t1, operands[1], DImode, SImode, 0));
t2 = operands[2];
emit_insn (gen_adddi3 (t3, t1, t2));
t3 = gen_lowpart (SImode, t3);
emit_move_insn (operands[0], t3);
DONE;
}
else
{
rtx t = gen_reg_rtx (DImode);
emit_insn (gen_addsi3_extended (t, operands[1], operands[2]));
t = gen_lowpart (SImode, t);
SUBREG_PROMOTED_VAR_P (t) = 1;
SUBREG_PROMOTED_SET (t, SRP_SIGNED);
emit_move_insn (operands[0], t);
DONE;
}
})
(define_insn_and_split "adddi3"
[(set (match_operand:DI 0 "register_operand" "=r,r,r,r,r,r")
(plus:DI (match_operand:DI 1 "register_operand" "r,r,r,r,r,r")
(match_operand:DI 2 "plus_di_operand"
"r,I,La,Lb,Lc,Ld")))]
"TARGET_64BIT"
"@
add.d\t%0,%1,%2
addi.d\t%0,%1,%2
#
* operands[2] = GEN_INT (INTVAL (operands[2]) / 65536); \
return \"addu16i.d\t%0,%1,%2\";
#
#"
"&& CONST_INT_P (operands[2]) && !IMM12_INT (operands[2]) \
&& !ADDU16I_OPERAND (INTVAL (operands[2]))"
[(set (match_dup 0) (plus:DI (match_dup 1) (match_dup 3)))
(set (match_dup 0) (plus:DI (match_dup 0) (match_dup 4)))]
{
loongarch_split_plus_constant (&operands[2], DImode);
}
[(set_attr "alu_type" "add")
(set_attr "mode" "DI")
(set_attr "insn_count" "1,1,2,1,2,2")])
(define_insn_and_split "addsi3_extended"
[(set (match_operand:DI 0 "register_operand" "=r,r,r,r")
(sign_extend:DI
(plus:SI (match_operand:SI 1 "register_operand" "r,r,r,r")
(match_operand:SI 2 "plus_si_extend_operand"
"r,I,La,Le"))))]
"TARGET_64BIT"
"@
add.w\t%0,%1,%2
addi.w\t%0,%1,%2
#
#"
"CONST_INT_P (operands[2]) && !IMM12_INT (operands[2])"
[(set (subreg:SI (match_dup 0) 0) (plus:SI (match_dup 1) (match_dup 3)))
(set (match_dup 0)
(sign_extend:DI (plus:SI (subreg:SI (match_dup 0) 0)
(match_dup 4))))]
{
loongarch_split_plus_constant (&operands[2], SImode);
}
[(set_attr "alu_type" "add")
(set_attr "mode" "SI")
(set_attr "insn_count" "1,1,2,2")])
;;
;; ....................
;;
;; SUBTRACTION
;;
;; ....................
;;
(define_insn "sub3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(minus:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fsub.\t%0,%1,%2"
[(set_attr "type" "fadd")
(set_attr "mode" "")])
(define_insn "sub3"
[(set (match_operand:GPR 0 "register_operand" "=r")
(minus:GPR (match_operand:GPR 1 "register_operand" "r")
(match_operand:GPR 2 "register_operand" "r")))]
""
"sub.\t%0,%z1,%2"
[(set_attr "alu_type" "sub")
(set_attr "mode" "")])
(define_insn "*subsi3_extended"
[(set (match_operand:DI 0 "register_operand" "=r")
(sign_extend:DI
(minus:SI (match_operand:SI 1 "reg_or_0_operand" "rJ")
(match_operand:SI 2 "register_operand" "r"))))]
"TARGET_64BIT"
"sub.w\t%0,%z1,%2"
[(set_attr "type" "arith")
(set_attr "mode" "SI")])
;;
;; ....................
;;
;; MULTIPLICATION
;;
;; ....................
;;
(define_insn "mul3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(mult:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fmul.\t%0,%1,%2"
[(set_attr "type" "fmul")
(set_attr "mode" "")])
(define_insn "mul3"
[(set (match_operand:GPR 0 "register_operand" "=r")
(mult:GPR (match_operand:GPR 1 "register_operand" "r")
(match_operand:GPR 2 "register_operand" "r")))]
""
"mul.\t%0,%1,%2"
[(set_attr "type" "imul")
(set_attr "mode" "")])
(define_insn "*mulsi3_extended"
[(set (match_operand:DI 0 "register_operand" "=r")
(sign_extend:DI
(mult:SI (match_operand:SI 1 "register_operand" "r")
(match_operand:SI 2 "register_operand" "r"))))]
"TARGET_64BIT"
"mul.w\t%0,%1,%2"
[(set_attr "type" "imul")
(set_attr "mode" "SI")])
;;
;; ........................
;;
;; MULTIPLICATION HIGH-PART
;;
;; ........................
;;
(define_expand "mulditi3"
[(set (match_operand:TI 0 "register_operand")
(mult:TI (any_extend:TI (match_operand:DI 1 "register_operand"))
(any_extend:TI (match_operand:DI 2 "register_operand"))))]
"TARGET_64BIT"
{
rtx low = gen_reg_rtx (DImode);
emit_insn (gen_muldi3 (low, operands[1], operands[2]));
rtx high = gen_reg_rtx (DImode);
emit_insn (gen_muldi3_highpart (high, operands[1], operands[2]));
emit_move_insn (gen_lowpart (DImode, operands[0]), low);
emit_move_insn (gen_highpart (DImode, operands[0]), high);
DONE;
})
(define_insn "muldi3_highpart"
[(set (match_operand:DI 0 "register_operand" "=r")
(truncate:DI
(lshiftrt:TI
(mult:TI (any_extend:TI
(match_operand:DI 1 "register_operand" " r"))
(any_extend:TI
(match_operand:DI 2 "register_operand" " r")))
(const_int 64))))]
"TARGET_64BIT"
"mulh.d\t%0,%1,%2"
[(set_attr "type" "imul")
(set_attr "mode" "DI")])
(define_expand "mulsidi3"
[(set (match_operand:DI 0 "register_operand")
(mult:DI (any_extend:DI
(match_operand:SI 1 "register_operand"))
(any_extend:DI
(match_operand:SI 2 "register_operand"))))]
""
{
if (!TARGET_64BIT)
{
rtx temp = gen_reg_rtx (SImode);
emit_insn (gen_mulsi3 (temp, operands[1], operands[2]));
emit_insn (gen_mulsi3_highpart (loongarch_subword (operands[0], true),
operands[1], operands[2]));
emit_insn (gen_movsi (loongarch_subword (operands[0], false), temp));
DONE;
}
})
(define_insn "mulsidi3_64bit"
[(set (match_operand:DI 0 "register_operand" "=r")
(mult:DI (any_extend:DI (match_operand:SI 1 "register_operand" "r"))
(any_extend:DI (match_operand:SI 2 "register_operand" "r"))))]
"TARGET_64BIT"
"mulw.d.w\t%0,%1,%2"
[(set_attr "type" "imul")
(set_attr "mode" "DI")])
(define_insn "mulsi3_highpart"
[(set (match_operand:SI 0 "register_operand" "=r")
(truncate:SI
(lshiftrt:DI
(mult:DI (any_extend:DI
(match_operand:SI 1 "register_operand" " r"))
(any_extend:DI
(match_operand:SI 2 "register_operand" " r")))
(const_int 32))))]
""
"mulh.w\t%0,%1,%2"
[(set_attr "type" "imul")
(set_attr "mode" "SI")])
;; Under the LoongArch architecture, the mulh.w[u] instruction performs
;; sign extension by default, so the sign extension instruction can be
;; eliminated.
(define_peephole
[(set (match_operand:SI 0 "register_operand")
(truncate:SI
(lshiftrt:DI
(mult:DI (any_extend:DI
(match_operand:SI 1 "register_operand"))
(any_extend:DI
(match_operand:SI 2 "register_operand")))
(const_int 32))))
(set (match_operand:DI 3 "register_operand")
(sign_extend:DI (match_dup 0)))]
"TARGET_64BIT && REGNO (operands[0]) == REGNO (operands[3])"
"mulh.w\t%0,%1,%2")
;;
;; ....................
;;
;; DIVISION and REMAINDER
;;
;; ....................
;;
;; Float division and modulus.
(define_expand "div3"
[(set (match_operand:ANYF 0 "register_operand")
(div:ANYF (match_operand:ANYF 1 "reg_or_1_operand")
(match_operand:ANYF 2 "register_operand")))]
""
{
if (mode == SFmode
&& TARGET_RECIP_DIV
&& optimize_insn_for_speed_p ()
&& flag_finite_math_only && !flag_trapping_math
&& flag_unsafe_math_optimizations)
{
loongarch_emit_swdivsf (operands[0], operands[1],
operands[2], SFmode);
DONE;
}
})
(define_insn "*div3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(div:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fdiv.\t%0,%1,%2"
[(set_attr "type" "fdiv")
(set_attr "mode" "")])
;; In 3A5000, the reciprocal operation is the same as the division operation.
(define_insn "*recip3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(div:ANYF (match_operand:ANYF 1 "const_1_operand" "")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"frecip.\t%0,%2"
[(set_attr "type" "frdiv")
(set_attr "mode" "")])
;; Approximate Reciprocal Instructions.
(define_insn "loongarch_frecipe_"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand" "f")]
UNSPEC_RECIPE))]
"ISA_HAS_FRECIPE"
"frecipe.\t%0,%1"
[(set_attr "type" "frecipe")
(set_attr "mode" "")
(set_attr "insn_count" "1")])
;; Integer division and modulus.
(define_expand "3"
[(set (match_operand:GPR 0 "register_operand")
(any_div:GPR (match_operand:GPR 1 "register_operand")
(match_operand:GPR 2 "register_operand")))]
""
{
if (GET_MODE (operands[0]) == SImode && TARGET_64BIT && !ISA_HAS_DIV32)
{
rtx reg1 = gen_reg_rtx (DImode);
rtx reg2 = gen_reg_rtx (DImode);
rtx rd = gen_reg_rtx (DImode);
operands[1] = gen_rtx_SIGN_EXTEND (word_mode, operands[1]);
operands[2] = gen_rtx_SIGN_EXTEND (word_mode, operands[2]);
emit_insn (gen_rtx_SET (reg1, operands[1]));
emit_insn (gen_rtx_SET (reg2, operands[2]));
emit_insn (gen_di3_fake (rd, reg1, reg2));
emit_insn (gen_rtx_SET (operands[0],
simplify_gen_subreg (SImode, rd, DImode, 0)));
DONE;
}
})
(define_insn "*3"
[(set (match_operand:DIV 0 "register_operand" "=r,&r,&r")
(any_div:DIV (match_operand:DIV 1 "register_operand" "r,r,0")
(match_operand:DIV 2 "register_operand" "r,r,r")))]
""
{
return loongarch_output_division (".\t%0,%1,%2", operands);
}
[(set_attr "type" "idiv")
(set_attr "mode" "")
(set (attr "enabled")
(if_then_else
(match_test "!!which_alternative == loongarch_check_zero_div_p()")
(const_string "yes")
(const_string "no")))])
(define_insn "si3_extended"
[(set (match_operand:DI 0 "register_operand" "=r,&r,&r")
(sign_extend
(any_div:SI (match_operand:SI 1 "register_operand" "r,r,0")
(match_operand:SI 2 "register_operand" "r,r,r"))))]
"TARGET_64BIT && ISA_HAS_DIV32"
{
return loongarch_output_division (".w\t%0,%1,%2", operands);
}
[(set_attr "type" "idiv")
(set_attr "mode" "SI")
(set (attr "enabled")
(if_then_else
(match_test "!!which_alternative == loongarch_check_zero_div_p()")
(const_string "yes")
(const_string "no")))])
(define_insn "di3_fake"
[(set (match_operand:DI 0 "register_operand" "=r,&r,&r")
(sign_extend:DI
(unspec:SI
[(subreg:SI
(any_div:DI (match_operand:DI 1 "register_operand" "r,r,0")
(match_operand:DI 2 "register_operand" "r,r,r")) 0)]
UNSPEC_FAKE_ANY_DIV)))]
"TARGET_64BIT && !ISA_HAS_DIV32"
{
return loongarch_output_division (".w\t%0,%1,%2", operands);
}
[(set_attr "type" "idiv")
(set_attr "mode" "SI")
(set (attr "enabled")
(if_then_else
(match_test "!!which_alternative == loongarch_check_zero_div_p()")
(const_string "yes")
(const_string "no")))])
;; Floating point multiply accumulate instructions.
;; a * b + c
(define_insn "fma4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(fma:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")
(match_operand:ANYF 3 "register_operand" "f")))]
""
"fmadd.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; a * b - c
(define_insn "fms4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(fma:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")
(neg:ANYF (match_operand:ANYF 3 "register_operand" "f"))))]
""
"fmsub.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; fnma is defined in GCC as (fma (neg op1) op2 op3)
;; (-op1 * op2) + op3 ==> -(op1 * op2) + op3 ==> -((op1 * op2) - op3)
;; The loongarch nmsub instructions implement -((op1 * op2) - op3)
;; This transformation means we may return the wrong signed zero
;; so we check HONOR_SIGNED_ZEROS.
;; -a * b + c
(define_insn "fnma4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(fma:ANYF (neg:ANYF (match_operand:ANYF 1 "register_operand" "f"))
(match_operand:ANYF 2 "register_operand" "f")
(match_operand:ANYF 3 "register_operand" "f")))]
"!HONOR_SIGNED_ZEROS (mode)"
"fnmsub.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; fnms is defined as: (fma (neg op1) op2 (neg op3))
;; ((-op1) * op2) - op3 ==> -(op1 * op2) - op3 ==> -((op1 * op2) + op3)
;; The loongarch nmadd instructions implement -((op1 * op2) + op3)
;; This transformation means we may return the wrong signed zero
;; so we check HONOR_SIGNED_ZEROS.
;; -a * b - c
(define_insn "fnms4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(fma:ANYF
(neg:ANYF (match_operand:ANYF 1 "register_operand" "f"))
(match_operand:ANYF 2 "register_operand" "f")
(neg:ANYF (match_operand:ANYF 3 "register_operand" "f"))))]
"!HONOR_SIGNED_ZEROS (mode)"
"fnmadd.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; -(-a * b - c), modulo signed zeros
(define_insn "*fma4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(neg:ANYF
(fma:ANYF
(neg:ANYF (match_operand:ANYF 1 "register_operand" " f"))
(match_operand:ANYF 2 "register_operand" " f")
(neg:ANYF (match_operand:ANYF 3 "register_operand" " f")))))]
"!HONOR_SIGNED_ZEROS (mode)"
"fmadd.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; -(-a * b + c), modulo signed zeros
(define_insn "*fms4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(neg:ANYF
(fma:ANYF
(neg:ANYF (match_operand:ANYF 1 "register_operand" " f"))
(match_operand:ANYF 2 "register_operand" " f")
(match_operand:ANYF 3 "register_operand" " f"))))]
"!HONOR_SIGNED_ZEROS (mode)"
"fmsub.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; -(a * b + c)
(define_insn "*fnms4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(neg:ANYF
(fma:ANYF
(match_operand:ANYF 1 "register_operand" " f")
(match_operand:ANYF 2 "register_operand" " f")
(match_operand:ANYF 3 "register_operand" " f"))))]
""
"fnmadd.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;; -(a * b - c)
(define_insn "*fnma4"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(neg:ANYF
(fma:ANYF
(match_operand:ANYF 1 "register_operand" " f")
(match_operand:ANYF 2 "register_operand" " f")
(neg:ANYF (match_operand:ANYF 3 "register_operand" " f")))))]
""
"fnmsub.\t%0,%1,%2,%3"
[(set_attr "type" "fmadd")
(set_attr "mode" "")])
;;
;; ....................
;;
;; SQUARE ROOT
;;
;; ....................
(define_expand "sqrt2"
[(set (match_operand:ANYF 0 "register_operand")
(sqrt:ANYF (match_operand:ANYF 1 "register_operand")))]
""
{
if (mode == SFmode
&& TARGET_RECIP_SQRT
&& flag_unsafe_math_optimizations
&& !optimize_insn_for_size_p ()
&& flag_finite_math_only && !flag_trapping_math)
{
loongarch_emit_swrsqrtsf (operands[0], operands[1], SFmode, 0);
DONE;
}
})
(define_insn "*sqrt2"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(sqrt:ANYF (match_operand:ANYF 1 "register_operand" "f")))]
""
"fsqrt.\t%0,%1"
[(set_attr "type" "fsqrt")
(set_attr "mode" "")
(set_attr "insn_count" "1")])
(define_expand "rsqrt2"
[(set (match_operand:ANYF 0 "register_operand")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand")]
UNSPEC_RSQRT))]
"TARGET_HARD_FLOAT"
{
if (mode == SFmode && TARGET_RECIP_RSQRT)
{
loongarch_emit_swrsqrtsf (operands[0], operands[1], SFmode, 1);
DONE;
}
})
(define_insn "*rsqrt2"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand" "f")]
UNSPEC_RSQRT))]
"TARGET_HARD_FLOAT"
"frsqrt.\t%0,%1"
[(set_attr "type" "frsqrt")
(set_attr "mode" "")])
;; Approximate Reciprocal Square Root Instructions.
(define_insn "loongarch_frsqrte_"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand" "f")]
UNSPEC_RSQRTE))]
"ISA_HAS_FRECIPE"
"frsqrte.\t%0,%1"
[(set_attr "type" "frsqrte")
(set_attr "mode" "")])
;;
;; ....................
;;
;; ABSOLUTE VALUE
;;
;; ....................
(define_insn "abs2"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(abs:ANYF (match_operand:ANYF 1 "register_operand" "f")))]
""
"fabs.\t%0,%1"
[(set_attr "type" "fabs")
(set_attr "mode" "")])
;;
;; ....................
;;
;; FLOATING POINT COPYSIGN
;;
;; ....................
(define_insn "copysign3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(copysign:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
"TARGET_HARD_FLOAT"
"fcopysign.\t%0,%1,%2"
[(set_attr "type" "fcopysign")
(set_attr "mode" "")])
(define_expand "@xorsign3"
[(match_operand:ANYF 0 "register_operand")
(match_operand:ANYF 1 "register_operand")
(match_operand:ANYF 2 "register_operand")]
"ISA_HAS_LSX"
{
machine_mode lsx_mode
= mode == SFmode ? V4SFmode : V2DFmode;
rtx tmp = gen_reg_rtx (lsx_mode);
rtx op1 = lowpart_subreg (lsx_mode, operands[1], mode);
rtx op2 = lowpart_subreg (lsx_mode, operands[2], mode);
emit_insn (gen_xorsign3 (lsx_mode, tmp, op1, op2));
emit_move_insn (operands[0],
lowpart_subreg (mode, tmp, lsx_mode));
DONE;
})
;;
;; ....................
;;
;; FLOATING POINT SCALE
;;
;; ....................
(define_insn "ldexp3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand" "f")
(match_operand: 2 "register_operand" "f")]
UNSPEC_FSCALEB))]
"TARGET_HARD_FLOAT"
"fscaleb.\t%0,%1,%2"
[(set_attr "type" "fscaleb")
(set_attr "mode" "")])
;;
;; ....................
;;
;; FLOATING POINT EXPONENT EXTRACT
;;
;; ....................
(define_insn "logb_non_negative2"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(match_operand:ANYF 1 "register_operand" "f")]
UNSPEC_FLOGB))]
"TARGET_HARD_FLOAT"
"flogb.\t%0,%1"
[(set_attr "type" "flogb")
(set_attr "mode" "")])
(define_expand "logb2"
[(set (match_operand:ANYF 0 "register_operand")
(unspec:ANYF [(abs:ANYF (match_operand:ANYF 1 "register_operand"))]
UNSPEC_FLOGB))]
"TARGET_HARD_FLOAT"
{
rtx tmp = gen_reg_rtx (mode);
emit_insn (gen_abs2 (tmp, operands[1]));
emit_insn (gen_logb_non_negative2 (operands[0], tmp));
DONE;
})
;;
;; ...................
;;
;; Count leading zeroes.
;;
;; ...................
;;
(define_insn "clz2"
[(set (match_operand:GPR 0 "register_operand" "=r")
(clz:GPR (match_operand:GPR 1 "register_operand" "r")))]
""
"clz.\t%0,%1"
[(set_attr "type" "clz")
(set_attr "mode" "")])
;;
;; ...................
;;
;; Count trailing zeroes.
;;
;; ...................
;;
(define_insn "ctz2"
[(set (match_operand:GPR 0 "register_operand" "=r")
(ctz:GPR (match_operand:GPR 1 "register_operand" "r")))]
""
"ctz.\t%0,%1"
[(set_attr "type" "clz")
(set_attr "mode" "")])
;;
;; ....................
;;
;; MIN/MAX
;;
;; ....................
(define_insn "smax3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(smax:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fmax.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
(define_insn "smin3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(smin:ANYF (match_operand:ANYF 1 "register_operand" "f")
(match_operand:ANYF 2 "register_operand" "f")))]
""
"fmin.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
(define_insn "fmax3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(use (match_operand:ANYF 1 "register_operand" "f"))
(use (match_operand:ANYF 2 "register_operand" "f"))]
UNSPEC_FMAX))]
""
"fmax.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
(define_insn "fmin3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(unspec:ANYF [(use (match_operand:ANYF 1 "register_operand" "f"))
(use (match_operand:ANYF 2 "register_operand" "f"))]
UNSPEC_FMIN))]
""
"fmin.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
(define_insn "smaxa3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(if_then_else:ANYF
(gt (abs:ANYF (match_operand:ANYF 1 "register_operand" "f"))
(abs:ANYF (match_operand:ANYF 2 "register_operand" "f")))
(match_dup 1)
(match_dup 2)))]
""
"fmaxa.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
(define_insn "smina3"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(if_then_else:ANYF
(lt (abs:ANYF (match_operand:ANYF 1 "register_operand" "f"))
(abs:ANYF (match_operand:ANYF 2 "register_operand" "f")))
(match_dup 1)
(match_dup 2)))]
""
"fmina.\t%0,%1,%2"
[(set_attr "type" "fmove")
(set_attr "mode" "")])
;;
;; ....................
;;
;; NEGATION and ONE'S COMPLEMENT
;;
;; ....................
(define_insn "neg2"
[(set (match_operand:GPR 0 "register_operand" "=r")
(neg:GPR (match_operand:GPR 1 "register_operand" "r")))]
""
"sub.\t%0,%.,%1"
[(set_attr "alu_type" "sub")
(set_attr "mode" "")])
(define_insn "*negsi2_extended"
[(set (match_operand:DI 0 "register_operand" "=r")
(sign_extend:DI (neg:SI (match_operand:SI 1 "register_operand" "r"))))]
"TARGET_64BIT"
"sub.w\t%0,%.,%1"
[(set_attr "alu_type" "sub")
(set_attr "mode" "SI")])
(define_insn "neg2"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(neg:ANYF (match_operand:ANYF 1 "register_operand" "f")))]
""
"fneg.\t%0,%1"
[(set_attr "type" "fneg")
(set_attr "mode" "")])
;;
;; ....................
;;
;; LOGICAL
;;
;; ....................
;;
(define_insn "3"
[(set (match_operand:X 0 "register_operand" "=r,r")
(any_bitwise:X (match_operand:X 1 "register_operand" "%r,r")
(match_operand:X 2 "uns_arith_operand" "r,K")))]
""
"%i2\t%0,%1,%2"
[(set_attr "type" "logical")
(set_attr "mode" "")])
(define_insn "*si3_internal"
[(set (match_operand:SI 0 "register_operand" "=r,r")
(any_bitwise:SI (match_operand:SI 1 "register_operand" "%r,r")
(match_operand:SI 2 "uns_arith_operand" " r,K")))]
"TARGET_64BIT"
"%i2\t%0,%1,%2"
[(set_attr "type" "logical")
(set_attr "mode" "SI")])
(define_insn "one_cmpl2"
[(set (match_operand:X 0 "register_operand" "=r")
(not:X (match_operand:X 1 "register_operand" "r")))]
""
"nor\t%0,%.,%1"
[(set_attr "alu_type" "not")
(set_attr "mode" "")])
(define_insn "*one_cmplsi2_internal"
[(set (match_operand:SI 0 "register_operand" "=r")
(not:SI (match_operand:SI 1 "register_operand" " r")))]
"TARGET_64BIT"
"nor\t%0,%.,%1"
[(set_attr "type" "logical")
(set_attr "mode" "SI")])
(define_insn "and3_extended"
[(set (match_operand:GPR 0 "register_operand" "=r")
(and:GPR (match_operand:GPR 1 "nonimmediate_operand" "r")
(match_operand:GPR 2 "low_bitmask_operand" "Yx")))]
""
{
int len;
len = low_bitmask_len (mode, INTVAL (operands[2]));
operands[2] = GEN_INT (len-1);
return "bstrpick.\t%0,%1,%2,0";
}
[(set_attr "move_type" "pick_ins")
(set_attr "mode" "")])
(define_insn_and_split "*bstrins__for_mask"
[(set (match_operand:GPR 0 "register_operand" "=r")
(and:GPR (match_operand:GPR 1 "register_operand" "r")
(match_operand:GPR 2 "ins_zero_bitmask_operand" "i")))]
""
"#"
""
[(set (match_dup 0) (match_dup 1))
(set (zero_extract:GPR (match_dup 0) (match_dup 2) (match_dup 3))
(const_int 0))]
{
unsigned HOST_WIDE_INT mask = ~UINTVAL (operands[2]);
int lo = ffs_hwi (mask) - 1;
int len = low_bitmask_len (mode, mask >> lo);
len = MIN (len, GET_MODE_BITSIZE (mode) - lo);
operands[2] = GEN_INT (len);
operands[3] = GEN_INT (lo);
})
(define_insn_and_split "*bstrins__for_ior_mask"
[(set (match_operand:GPR 0 "register_operand" "=r")
(ior:GPR (and:GPR (match_operand:GPR 1 "register_operand" "r")
(match_operand:GPR 2 "const_int_operand" "i"))
(and:GPR (match_operand:GPR 3 "register_operand" "r")
(match_operand:GPR 4 "const_int_operand" "i"))))]
"loongarch_pre_reload_split ()
&& loongarch_use_bstrins_for_ior_with_mask (mode, operands)"
"#"
"&& true"
[(set (match_dup 0) (match_dup 1))
(set (zero_extract:GPR (match_dup 0) (match_dup 2) (match_dup 4))
(match_dup 3))]
{
if (loongarch_use_bstrins_for_ior_with_mask (mode, operands) < 0)
{
std::swap (operands[1], operands[3]);
std::swap (operands[2], operands[4]);
}
unsigned HOST_WIDE_INT mask = ~UINTVAL (operands[2]);
int lo = ffs_hwi (mask) - 1;
int len = low_bitmask_len (mode, mask >> lo);
len = MIN (len, GET_MODE_BITSIZE (mode) - lo);
operands[2] = GEN_INT (len);
operands[4] = GEN_INT (lo);
if (lo)
{
rtx tmp = gen_reg_rtx (mode);
emit_move_insn (tmp, gen_rtx_ASHIFTRT(mode, operands[3],
GEN_INT (lo)));
operands[3] = tmp;
}
})
;; We always avoid the shift operation in bstrins__for_ior_mask
;; if possible, but the result may be sub-optimal when one of the masks
;; is (1 << N) - 1 and one of the src register is the dest register.
;; For example:
;; move t0, a0
;; move a0, a1
;; bstrins.d a0, t0, 42, 0
;; ret
;; using a shift operation would be better:
;; srai.d t0, a1, 43
;; bstrins.d a0, t0, 63, 43
;; ret
;; unfortunately we cannot figure it out in split1: before reload we cannot
;; know if the dest register is one of the src register. Fix it up in
;; peephole2.
(define_peephole2
[(set (match_operand:GPR 0 "register_operand")
(match_operand:GPR 1 "register_operand"))
(set (match_dup 1) (match_operand:GPR 2 "register_operand"))
(set (zero_extract:GPR (match_dup 1)
(match_operand:SI 3 "const_int_operand")
(const_int 0))
(match_dup 0))]
"peep2_reg_dead_p (3, operands[0])"
[(const_int 0)]
{
int len = GET_MODE_BITSIZE (mode) - INTVAL (operands[3]);
emit_insn (gen_ashr3 (operands[0], operands[2], operands[3]));
emit_insn (gen_insv (operands[1], GEN_INT (len), operands[3],
operands[0]));
DONE;
})
(define_insn "*iorhi3"
[(set (match_operand:HI 0 "register_operand" "=r,r")
(ior:HI (match_operand:HI 1 "register_operand" "%r,r")
(match_operand:HI 2 "uns_arith_operand" "r,K")))]
""
"or%i2\t%0,%1,%2"
[(set_attr "type" "logical")
(set_attr "mode" "HI")])
(define_insn "nor3"
[(set (match_operand:X 0 "register_operand" "=r")
(and:X (not:X (match_operand:X 1 "register_operand" "%r"))
(not:X (match_operand:X 2 "register_operand" "r"))))]
""
"nor\t%0,%1,%2"
[(set_attr "type" "logical")
(set_attr "mode" "")])
(define_insn "*norsi3_internal"
[(set (match_operand:SI 0 "register_operand" "=r")
(and:SI (not:SI (match_operand:SI 1 "register_operand" "%r"))
(not:SI (match_operand:SI 2 "register_operand" "r"))))]
"TARGET_64BIT"
"nor\t%0,%1,%2"
[(set_attr "type" "logical")
(set_attr "mode" "SI")])
(define_insn "n"
[(set (match_operand:X 0 "register_operand" "=r")
(neg_bitwise:X
(not:X (match_operand:X 1 "register_operand" "r"))
(match_operand:X 2 "register_operand" "r")))]
""
"n\t%0,%2,%1"
[(set_attr "type" "logical")
(set_attr "mode" "")])
(define_insn "*nsi_internal"
[(set (match_operand:SI 0 "register_operand" "=r")
(neg_bitwise:SI
(not:SI (match_operand:SI 1 "register_operand" "r"))
(match_operand:SI 2 "register_operand" "r")))]
"TARGET_64BIT"
"n\t%0,%2,%1"
[(set_attr "type" "logical")
(set_attr "mode" "SI")])
;;
;; ....................
;;
;; TRUNCATION
;;
;; ....................
(define_insn "truncdfsf2"
[(set (match_operand:SF 0 "register_operand" "=f")
(float_truncate:SF (match_operand:DF 1 "register_operand" "f")))]
"TARGET_DOUBLE_FLOAT"
"fcvt.s.d\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "cnv_mode" "D2S")
(set_attr "mode" "SF")])
;; In vector registers, popcount can be implemented directly through
;; the vector instruction [X]VPCNT. For GP registers, we can implement
;; it through the following method. Compared with loop implementation
;; of popcount, the following method has better performance.
;; This attribute used for get connection of scalar mode and corresponding
;; vector mode.
(define_mode_attr cntmap [(SI "v4si") (DI "v2di")])
(define_expand "popcount2"
[(set (match_operand:GPR 0 "register_operand")
(popcount:GPR (match_operand:GPR 1 "register_operand")))]
"ISA_HAS_LSX"
{
rtx in = operands[1];
rtx out = operands[0];
rtx vreg = mode == SImode ? gen_reg_rtx (V4SImode) :
gen_reg_rtx (V2DImode);
emit_insn (gen_lsx_vinsgr2vr_ (vreg, in, vreg, GEN_INT (1)));
emit_insn (gen_popcount2 (vreg, vreg));
emit_insn (gen_lsx_vpickve2gr_ (out, vreg, GEN_INT (0)));
DONE;
})
;;
;; ....................
;;
;; ZERO EXTENSION
;;
;; ....................
(define_expand "zero_extendsidi2"
[(set (match_operand:DI 0 "register_operand")
(zero_extend:DI (match_operand:SI 1 "nonimmediate_operand")))]
"TARGET_64BIT")
(define_insn_and_split "*zero_extendsidi2_internal"
[(set (match_operand:DI 0 "register_operand" "=r,r,r,r")
(zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m,ZC,k")))]
"TARGET_64BIT"
"@
bstrpick.d\t%0,%1,31,0
ld.wu\t%0,%1
#
ldx.wu\t%0,%1"
"&& reload_completed
&& MEM_P (operands[1])
&& (loongarch_14bit_shifted_offset_address_p (XEXP (operands[1], 0), SImode)
&& !loongarch_12bit_offset_address_p (XEXP (operands[1], 0), SImode))
&& !paradoxical_subreg_p (operands[0])"
[(set (match_dup 3) (match_dup 1))
(set (match_dup 0)
(ior:DI (zero_extend:DI
(subreg:SI (match_dup 0) 0))
(match_dup 2)))]
{
operands[1] = gen_lowpart (SImode, operands[1]);
operands[3] = gen_lowpart (SImode, operands[0]);
operands[2] = const0_rtx;
}
[(set_attr "move_type" "arith,load,load,load")
(set_attr "mode" "DI")])
(define_insn "zero_extend2"
[(set (match_operand:GPR 0 "register_operand" "=r,r,r")
(zero_extend:GPR
(match_operand:SHORT 1 "nonimmediate_operand" "r,m,k")))]
""
"@
bstrpick.w\t%0,%1,,0
ld.u\t%0,%1
ldx.u\t%0,%1"
[(set_attr "move_type" "pick_ins,load,load")
(set_attr "mode" "")])
(define_insn "zero_extendqihi2"
[(set (match_operand:HI 0 "register_operand" "=r,r,r")
(zero_extend:HI (match_operand:QI 1 "nonimmediate_operand" "r,k,m")))]
""
"@
andi\t%0,%1,0xff
ldx.bu\t%0,%1
ld.bu\t%0,%1"
[(set_attr "move_type" "andi,load,load")
(set_attr "mode" "HI")])
;; Combiner patterns to optimize truncate/zero_extend combinations.
(define_insn "*zero_extend_trunc"
[(set (match_operand:GPR 0 "register_operand" "=r")
(zero_extend:GPR
(truncate:SHORT (match_operand:DI 1 "register_operand" "r"))))]
"TARGET_64BIT"
"bstrpick.w\t%0,%1,,0"
[(set_attr "move_type" "pick_ins")
(set_attr "mode" "")])
(define_insn "*zero_extendhi_truncqi"
[(set (match_operand:HI 0 "register_operand" "=r")
(zero_extend:HI
(truncate:QI (match_operand:DI 1 "register_operand" "r"))))]
"TARGET_64BIT"
"andi\t%0,%1,0xff"
[(set_attr "alu_type" "and")
(set_attr "mode" "HI")])
;;
;; ....................
;;
;; SIGN EXTENSION
;;
;; ....................
(define_insn "extendsidi2"
[(set (match_operand:DI 0 "register_operand" "=r,r,r,r")
(sign_extend:DI
(match_operand:SI 1 "nonimmediate_operand" "r,ZC,m,k")))]
"TARGET_64BIT"
"@
slli.w\t%0,%1,0
ldptr.w\t%0,%1
ld.w\t%0,%1
ldx.w\t%0,%1"
[(set_attr "move_type" "sll0,load,load,load")
(set_attr "mode" "DI")])
(define_insn "extend2"
[(set (match_operand:GPR 0 "register_operand" "=r,r,r")
(sign_extend:GPR
(match_operand:SHORT 1 "nonimmediate_operand" "r,m,k")))]
""
"@
ext.w.\t%0,%1
ld.\t%0,%1
ldx.\t%0,%1"
[(set_attr "move_type" "signext,load,load")
(set_attr "mode" "")])
(define_insn "extendqihi2"
[(set (match_operand:HI 0 "register_operand" "=r,r,r")
(sign_extend:HI
(match_operand:QI 1 "nonimmediate_operand" "r,m,k")))]
""
"@
ext.w.b\t%0,%1
ld.b\t%0,%1
ldx.b\t%0,%1"
[(set_attr "move_type" "signext,load,load")
(set_attr "mode" "SI")])
(define_insn "extendsfdf2"
[(set (match_operand:DF 0 "register_operand" "=f")
(float_extend:DF (match_operand:SF 1 "register_operand" "f")))]
"TARGET_DOUBLE_FLOAT"
"fcvt.d.s\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "cnv_mode" "S2D")
(set_attr "mode" "DF")])
;;
;; ....................
;;
;; CONVERSIONS
;;
;; ....................
;; conversion of a floating-point value to a integer
(define_insn "fix_trunc2"
[(set (match_operand:GPR 0 "register_operand" "=f")
(fix:GPR (match_operand:ANYF 1 "register_operand" "f")))]
""
"ftintrz.. %0,%1"
[(set_attr "type" "fcvt")
(set_attr "mode" "")])
;; conversion of an integeral (or boolean) value to a floating-point value
(define_insn "floatsidf2"
[(set (match_operand:DF 0 "register_operand" "=f")
(float:DF (match_operand:SI 1 "register_operand" "f")))]
"TARGET_DOUBLE_FLOAT"
"ffint.d.w\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "mode" "DF")
(set_attr "cnv_mode" "I2D")])
(define_insn "floatdidf2"
[(set (match_operand:DF 0 "register_operand" "=f")
(float:DF (match_operand:DI 1 "register_operand" "f")))]
"TARGET_DOUBLE_FLOAT"
"ffint.d.l\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "mode" "DF")
(set_attr "cnv_mode" "I2D")])
(define_insn "floatsisf2"
[(set (match_operand:SF 0 "register_operand" "=f")
(float:SF (match_operand:SI 1 "register_operand" "f")))]
"TARGET_HARD_FLOAT"
"ffint.s.w\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "mode" "SF")
(set_attr "cnv_mode" "I2S")])
(define_insn "floatdisf2"
[(set (match_operand:SF 0 "register_operand" "=f")
(float:SF (match_operand:DI 1 "register_operand" "f")))]
"TARGET_DOUBLE_FLOAT"
"ffint.s.l\t%0,%1"
[(set_attr "type" "fcvt")
(set_attr "mode" "SF")
(set_attr "cnv_mode" "I2S")])
;; Convert a floating-point value to an unsigned integer.
(define_expand "fixuns_truncdfsi2"
[(set (match_operand:SI 0 "register_operand")
(unsigned_fix:SI (match_operand:DF 1 "register_operand")))]
"TARGET_DOUBLE_FLOAT"
{
rtx reg1 = gen_reg_rtx (DFmode);
rtx reg2 = gen_reg_rtx (DFmode);
rtx reg3 = gen_reg_rtx (SImode);
rtx_code_label *label1 = gen_label_rtx ();
rtx_code_label *label2 = gen_label_rtx ();
rtx test;
REAL_VALUE_TYPE offset;
real_2expN (&offset, 31, DFmode);
loongarch_emit_move (reg1,
const_double_from_real_value (offset, DFmode));
do_pending_stack_adjust ();
test = gen_rtx_GE (VOIDmode, operands[1], reg1);
emit_jump_insn (gen_cbranchdf4 (test, operands[1], reg1, label1));
emit_insn (gen_fix_truncdfsi2 (operands[0], operands[1]));
emit_jump_insn (gen_rtx_SET (pc_rtx,
gen_rtx_LABEL_REF (VOIDmode, label2)));
emit_barrier ();
emit_label (label1);
loongarch_emit_move (reg2, gen_rtx_MINUS (DFmode, operands[1], reg1));
loongarch_emit_move (reg3, GEN_INT (trunc_int_for_mode
(BITMASK_HIGH, SImode)));
emit_insn (gen_fix_truncdfsi2 (operands[0], reg2));
emit_insn (gen_iorsi3 (operands[0], operands[0], reg3));
emit_label (label2);
/* Allow REG_NOTES to be set on last insn (labels don't have enough
fields, and can't be used for REG_NOTES anyway). */
emit_use (stack_pointer_rtx);
DONE;
})
(define_expand "fixuns_truncdfdi2"
[(set (match_operand:DI 0 "register_operand")
(unsigned_fix:DI (match_operand:DF 1 "register_operand")))]
"TARGET_DOUBLE_FLOAT"
{
rtx reg1 = gen_reg_rtx (DFmode);
rtx reg2 = gen_reg_rtx (DFmode);
rtx reg3 = gen_reg_rtx (DImode);
rtx_code_label *label1 = gen_label_rtx ();
rtx_code_label *label2 = gen_label_rtx ();
rtx test;
REAL_VALUE_TYPE offset;
real_2expN (&offset, 63, DFmode);
loongarch_emit_move (reg1, const_double_from_real_value (offset, DFmode));
do_pending_stack_adjust ();
test = gen_rtx_GE (VOIDmode, operands[1], reg1);
emit_jump_insn (gen_cbranchdf4 (test, operands[1], reg1, label1));
emit_insn (gen_fix_truncdfdi2 (operands[0], operands[1]));
emit_jump_insn (gen_rtx_SET (pc_rtx, gen_rtx_LABEL_REF (VOIDmode, label2)));
emit_barrier ();
emit_label (label1);
loongarch_emit_move (reg2, gen_rtx_MINUS (DFmode, operands[1], reg1));
loongarch_emit_move (reg3, GEN_INT (BITMASK_HIGH));
emit_insn (gen_ashldi3 (reg3, reg3, GEN_INT (32)));
emit_insn (gen_fix_truncdfdi2 (operands[0], reg2));
emit_insn (gen_iordi3 (operands[0], operands[0], reg3));
emit_label (label2);
/* Allow REG_NOTES to be set on last insn (labels don't have enough
fields, and can't be used for REG_NOTES anyway). */
emit_use (stack_pointer_rtx);
DONE;
})
(define_expand "fixuns_truncsfsi2"
[(set (match_operand:SI 0 "register_operand")
(unsigned_fix:SI (match_operand:SF 1 "register_operand")))]
"TARGET_HARD_FLOAT"
{
rtx reg1 = gen_reg_rtx (SFmode);
rtx reg2 = gen_reg_rtx (SFmode);
rtx reg3 = gen_reg_rtx (SImode);
rtx_code_label *label1 = gen_label_rtx ();
rtx_code_label *label2 = gen_label_rtx ();
rtx test;
REAL_VALUE_TYPE offset;
real_2expN (&offset, 31, SFmode);
loongarch_emit_move (reg1, const_double_from_real_value (offset, SFmode));
do_pending_stack_adjust ();
test = gen_rtx_GE (VOIDmode, operands[1], reg1);
emit_jump_insn (gen_cbranchsf4 (test, operands[1], reg1, label1));
emit_insn (gen_fix_truncsfsi2 (operands[0], operands[1]));
emit_jump_insn (gen_rtx_SET (pc_rtx, gen_rtx_LABEL_REF (VOIDmode, label2)));
emit_barrier ();
emit_label (label1);
loongarch_emit_move (reg2, gen_rtx_MINUS (SFmode, operands[1], reg1));
loongarch_emit_move (reg3, GEN_INT (trunc_int_for_mode
(BITMASK_HIGH, SImode)));
emit_insn (gen_fix_truncsfsi2 (operands[0], reg2));
emit_insn (gen_iorsi3 (operands[0], operands[0], reg3));
emit_label (label2);
/* Allow REG_NOTES to be set on last insn (labels don't have enough
fields, and can't be used for REG_NOTES anyway). */
emit_use (stack_pointer_rtx);
DONE;
})
(define_expand "fixuns_truncsfdi2"
[(set (match_operand:DI 0 "register_operand")
(unsigned_fix:DI (match_operand:SF 1 "register_operand")))]
"TARGET_DOUBLE_FLOAT"
{
rtx reg1 = gen_reg_rtx (SFmode);
rtx reg2 = gen_reg_rtx (SFmode);
rtx reg3 = gen_reg_rtx (DImode);
rtx_code_label *label1 = gen_label_rtx ();
rtx_code_label *label2 = gen_label_rtx ();
rtx test;
REAL_VALUE_TYPE offset;
real_2expN (&offset, 63, SFmode);
loongarch_emit_move (reg1, const_double_from_real_value (offset, SFmode));
do_pending_stack_adjust ();
test = gen_rtx_GE (VOIDmode, operands[1], reg1);
emit_jump_insn (gen_cbranchsf4 (test, operands[1], reg1, label1));
emit_insn (gen_fix_truncsfdi2 (operands[0], operands[1]));
emit_jump_insn (gen_rtx_SET (pc_rtx, gen_rtx_LABEL_REF (VOIDmode, label2)));
emit_barrier ();
emit_label (label1);
loongarch_emit_move (reg2, gen_rtx_MINUS (SFmode, operands[1], reg1));
loongarch_emit_move (reg3, GEN_INT (BITMASK_HIGH));
emit_insn (gen_ashldi3 (reg3, reg3, GEN_INT (32)));
emit_insn (gen_fix_truncsfdi2 (operands[0], reg2));
emit_insn (gen_iordi3 (operands[0], operands[0], reg3));
emit_label (label2);
/* Allow REG_NOTES to be set on last insn (labels don't have enough
fields, and can't be used for REG_NOTES anyway). */
emit_use (stack_pointer_rtx);
DONE;
})
;;
;; ....................
;;
;; EXTRACT AND INSERT
;;
;; ....................
(define_expand "extzv"
[(set (match_operand:X 0 "register_operand")
(zero_extract:X (match_operand:X 1 "register_operand")
(match_operand 2 "const_int_operand")
(match_operand 3 "const_int_operand")))]
""
{
if (!loongarch_use_ins_ext_p (operands[1], INTVAL (operands[2]),
INTVAL (operands[3])))
FAIL;
})
(define_insn "*extzv"
[(set (match_operand:X 0 "register_operand" "=r")
(zero_extract:X (match_operand:X 1 "register_operand" "r")
(match_operand 2 "const_int_operand" "")
(match_operand 3 "const_int_operand" "")))]
"loongarch_use_ins_ext_p (operands[1], INTVAL (operands[2]),
INTVAL (operands[3]))"
{
operands[2] = GEN_INT (INTVAL (operands[2]) + INTVAL (operands[3]) - 1);
return "bstrpick.\t%0,%1,%2,%3";
}
[(set_attr "type" "arith")
(set_attr "mode" "")])
(define_expand "insv"
[(set (zero_extract:GPR (match_operand:GPR 0 "register_operand")
(match_operand 1 "const_int_operand")
(match_operand 2 "const_int_operand"))
(match_operand:GPR 3 "reg_or_0_operand"))]
""
{
if (!loongarch_use_ins_ext_p (operands[0], INTVAL (operands[1]),
INTVAL (operands[2])))
FAIL;
})
(define_insn "*insv"
[(set (zero_extract:GPR (match_operand:GPR 0 "register_operand" "+r")
(match_operand:SI 1 "const_int_operand" "")
(match_operand:SI 2 "const_int_operand" ""))
(match_operand:GPR 3 "reg_or_0_operand" "rJ"))]
"loongarch_use_ins_ext_p (operands[0], INTVAL (operands[1]),
INTVAL (operands[2]))"
{
operands[1] = GEN_INT (INTVAL (operands[1]) + INTVAL (operands[2]) - 1);
return "bstrins.\t%0,%z3,%1,%2";
}
[(set_attr "type" "arith")
(set_attr "mode" "")])
;;
;; ....................
;;
;; DATA MOVEMENT
;;
;; ....................
;; 64-bit integer moves
;; Unlike most other insns, the move insns can't be split with
;; different predicates, because register spilling and other parts of
;; the compiler, have memoized the insn number already.
(define_expand "movdi"
[(set (match_operand:DI 0 "")
(match_operand:DI 1 ""))]
""
{
if (loongarch_legitimize_move (DImode, operands[0], operands[1]))
DONE;
})
(define_insn_and_split "*movdi_32bit"
[(set (match_operand:DI 0 "nonimmediate_operand" "=r,r,r,w,*f,*f,*r,*m")
(match_operand:DI 1 "move_operand" "r,i,w,r,*J*r,*m,*f,*f"))]
"!TARGET_64BIT
&& (register_operand (operands[0], DImode)
|| reg_or_0_operand (operands[1], DImode))"
{ return loongarch_output_move (operands[0], operands[1]); }
"CONST_INT_P (operands[1]) && REG_P (operands[0]) && GP_REG_P (REGNO
(operands[0]))"
[(const_int 0)]
"
{
loongarch_move_integer (operands[0], operands[0], INTVAL (operands[1]));
DONE;
}
"
[(set_attr "move_type" "move,const,load,store,mgtf,fpload,mftg,fpstore")
(set_attr "mode" "DI")])
(define_insn_and_split "*movdi_64bit"
[(set (match_operand:DI 0 "nonimmediate_operand" "=r,r,r,w,*f,*f,*r,*m")
(match_operand:DI 1 "move_operand" "r,Yd,w,rJ,*r*J,*m,*f,*f"))]
"TARGET_64BIT
&& (register_operand (operands[0], DImode)
|| reg_or_0_operand (operands[1], DImode))"
{ return loongarch_output_move (operands[0], operands[1]); }
"CONST_INT_P (operands[1]) && REG_P (operands[0]) && GP_REG_P (REGNO
(operands[0]))"
[(const_int 0)]
"
{
loongarch_move_integer (operands[0], operands[0], INTVAL (operands[1]));
DONE;
}
"
[(set_attr "move_type" "move,const,load,store,mgtf,fpload,mftg,fpstore")
(set_attr "mode" "DI")])
;; Use two registers to get the global symbol address from the got table.
;; la.global rd, rt, sym
(define_insn_and_split "movdi_symbolic_off64"
[(set (match_operand:DI 0 "register_operand" "=r,r")
(match_operand:DI 1 "symbolic_off64_or_reg_operand" "Yd,r"))
(unspec:DI [(const_int 0)]
UNSPEC_LOAD_SYMBOL_OFFSET64)
(clobber (match_operand:DI 2 "register_operand" "=&r,r"))]
"TARGET_64BIT && TARGET_CMODEL_EXTREME"
{
if (which_alternative == 1)
return "#";
enum loongarch_symbol_type symbol_type;
gcc_assert (loongarch_symbolic_constant_p (operands[1], &symbol_type));
switch (symbol_type)
{
case SYMBOL_PCREL64:
return "la.local\t%0,%2,%1";
case SYMBOL_GOT_DISP:
return "la.global\t%0,%2,%1";
case SYMBOL_TLS_IE:
return "la.tls.ie\t%0,%2,%1";
case SYMBOL_TLSGD:
return "la.tls.gd\t%0,%2,%1";
case SYMBOL_TLSLDM:
return "la.tls.ld\t%0,%2,%1";
default:
gcc_unreachable ();
}
}
"&& REG_P (operands[1]) && find_reg_note (insn, REG_UNUSED, operands[2]) != 0"
[(set (match_dup 0) (match_dup 1))]
""
[(set_attr "mode" "DI")
(set_attr "insn_count" "5")])
;; The 64-bit PC-relative part of address loading.
;; Note that the psABI does not allow splitting it.
(define_insn "la_pcrel64_two_parts"
[(set (match_operand:DI 0 "register_operand" "=r")
(unspec:DI [(match_operand:DI 2 "") (pc)] UNSPEC_LA_PCREL_64_PART1))
(set (match_operand:DI 1 "register_operand" "=r")
(unspec:DI [(match_dup 2) (pc)] UNSPEC_LA_PCREL_64_PART2))]
"TARGET_ABI_LP64 && la_opt_explicit_relocs != EXPLICIT_RELOCS_NONE"
{
return "pcalau12i\t%0,%r2\n\t"
"addi.d\t%1,$r0,%L2\n\t"
"lu32i.d\t%1,%R2\n\t"
"lu52i.d\t%1,%1,%H2";
}
[(set_attr "move_type" "move")
(set_attr "mode" "DI")
(set_attr "length" "16")])
;; 32-bit Integer moves
(define_expand "movsi"
[(set (match_operand:SI 0 "")
(match_operand:SI 1 ""))]
""
{
if (loongarch_legitimize_move (SImode, operands[0], operands[1]))
DONE;
})
(define_insn_and_split "*movsi_internal"
[(set (match_operand:SI 0 "nonimmediate_operand" "=r,r,r,w,*f,f,*r,*m")
(match_operand:SI 1 "move_operand" "r,Yd,w,rJ,*r*J,m,*f,*f"))]
"(register_operand (operands[0], SImode)
|| reg_or_0_operand (operands[1], SImode))"
{ return loongarch_output_move (operands[0], operands[1]); }
"CONST_INT_P (operands[1]) && REG_P (operands[0]) && GP_REG_P (REGNO
(operands[0]))"
[(const_int 0)]
"
{
loongarch_move_integer (operands[0], operands[0], INTVAL (operands[1]));
DONE;
}
"
[(set_attr "move_type" "move,const,load,store,mgtf,fpload,mftg,fpstore")
(set_attr "mode" "SI")])
;; 16-bit Integer moves
;; Unlike most other insns, the move insns can't be split with
;; different predicates, because register spilling and other parts of
;; the compiler, have memoized the insn number already.
;; Unsigned loads are used because LOAD_EXTEND_OP returns ZERO_EXTEND.
(define_expand "movhi"
[(set (match_operand:HI 0 "")
(match_operand:HI 1 ""))]
""
{
if (loongarch_legitimize_move (HImode, operands[0], operands[1]))
DONE;
})
(define_insn_and_split "*movhi_internal"
[(set (match_operand:HI 0 "nonimmediate_operand" "=r,r,r,r,m,r,k")
(match_operand:HI 1 "move_operand" "r,Yd,I,m,rJ,k,rJ"))]
"(register_operand (operands[0], HImode)
|| reg_or_0_operand (operands[1], HImode))"
{ return loongarch_output_move (operands[0], operands[1]); }
"CONST_INT_P (operands[1]) && REG_P (operands[0]) && GP_REG_P (REGNO
(operands[0]))"
[(const_int 0)]
"
{
loongarch_move_integer (operands[0], operands[0], INTVAL (operands[1]));
DONE;
}
"
[(set_attr "move_type" "move,const,const,load,store,load,store")
(set_attr "mode" "HI")])
;; 8-bit Integer moves
;; Unlike most other insns, the move insns can't be split with
;; different predicates, because register spilling and other parts of
;; the compiler, have memoized the insn number already.
;; Unsigned loads are used because LOAD_EXTEND_OP returns ZERO_EXTEND.
(define_expand "movqi"
[(set (match_operand:QI 0 "")
(match_operand:QI 1 ""))]
""
{
if (loongarch_legitimize_move (QImode, operands[0], operands[1]))
DONE;
})
(define_insn "*movqi_internal"
[(set (match_operand:QI 0 "nonimmediate_operand" "=r,r,r,m,r,k")
(match_operand:QI 1 "move_operand" "r,I,m,rJ,k,rJ"))]
"(register_operand (operands[0], QImode)
|| reg_or_0_operand (operands[1], QImode))"
{ return loongarch_output_move (operands[0], operands[1]); }
[(set_attr "move_type" "move,const,load,store,load,store")
(set_attr "mode" "QI")])
;; 32-bit floating point moves
(define_expand "movsf"
[(set (match_operand:SF 0 "")
(match_operand:SF 1 ""))]
""
{
if (loongarch_legitimize_move (SFmode, operands[0], operands[1]))
DONE;
})
(define_insn "*movsf_hardfloat"
[(set (match_operand:SF 0 "nonimmediate_operand" "=f,f,f,m,f,k,m,k,*f,*r,*r,*r,*m")
(match_operand:SF 1 "move_operand" "f,G,m,f,k,f,G,G,*r,*f,*G*r,*m,*r"))]
"TARGET_HARD_FLOAT
&& (register_operand (operands[0], SFmode)
|| reg_or_0_operand (operands[1], SFmode))"
{ return loongarch_output_move (operands[0], operands[1]); }
[(set_attr "move_type" "fmove,mgtf,fpload,fpstore,fpload,fpstore,store,store,mgtf,mftg,move,load,store")
(set_attr "mode" "SF")])
(define_insn "*movsf_softfloat"
[(set (match_operand:SF 0 "nonimmediate_operand" "=r,r,m")
(match_operand:SF 1 "move_operand" "Gr,m,r"))]
"TARGET_SOFT_FLOAT
&& (register_operand (operands[0], SFmode)
|| reg_or_0_operand (operands[1], SFmode))"
{ return loongarch_output_move (operands[0], operands[1]); }
[(set_attr "move_type" "move,load,store")
(set_attr "mode" "SF")])
;; 64-bit floating point moves
(define_expand "movdf"
[(set (match_operand:DF 0 "")
(match_operand:DF 1 ""))]
""
{
if (loongarch_legitimize_move (DFmode, operands[0], operands[1]))
DONE;
})
(define_insn "*movdf_hardfloat"
[(set (match_operand:DF 0 "nonimmediate_operand" "=f,f,f,m,f,k,m,k,*f,*r,*r,*r,*m")
(match_operand:DF 1 "move_operand" "f,G,m,f,k,f,G,G,*r,*f,*r*G,*m,*r"))]
"TARGET_DOUBLE_FLOAT
&& (register_operand (operands[0], DFmode)
|| reg_or_0_operand (operands[1], DFmode))"
{ return loongarch_output_move (operands[0], operands[1]); }
[(set_attr "move_type" "fmove,mgtf,fpload,fpstore,fpload,fpstore,store,store,mgtf,mftg,move,load,store")
(set_attr "mode" "DF")])
(define_insn "*movdf_softfloat"
[(set (match_operand:DF 0 "nonimmediate_operand" "=r,r,m")
(match_operand:DF 1 "move_operand" "rG,m,rG"))]
"(TARGET_SOFT_FLOAT || TARGET_SINGLE_FLOAT)
&& (register_operand (operands[0], DFmode)
|| reg_or_0_operand (operands[1], DFmode))"
{ return loongarch_output_move (operands[0], operands[1]); }
[(set_attr "move_type" "move,load,store")
(set_attr "mode" "DF")])
;; Emit a doubleword move in which exactly one of the operands is
;; a floating-point register. We can't just emit two normal moves
;; because of the constraints imposed by the FPU register model;
;; see loongarch_can_change_mode_class for details. Instead, we keep
;; the FPR whole and use special patterns to refer to each word of
;; the other operand.
(define_expand "move_doubleword_fpr"
[(set (match_operand:SPLITF 0)
(match_operand:SPLITF 1))]
""
{
if (FP_REG_RTX_P (operands[0]))
{
rtx low = loongarch_subword (operands[1], 0);
rtx high = loongarch_subword (operands[1], 1);
emit_insn (gen_load_low (operands[0], low));
if (!TARGET_64BIT)
emit_insn (gen_movgr2frh (operands[0], high, operands[0]));
else
emit_insn (gen_load_high (operands[0], high, operands[0]));
}
else
{
rtx low = loongarch_subword (operands[0], 0);
rtx high = loongarch_subword (operands[0], 1);
emit_insn (gen_store_word (low, operands[1], const0_rtx));
if (!TARGET_64BIT)
emit_insn (gen_movfrh2gr (high, operands[1]));
else
emit_insn (gen_store_word (high, operands[1], const1_rtx));
}
DONE;
})
;; Clear one FCC register
(define_expand "movfcc"
[(set (match_operand:FCC 0 "")
(match_operand:FCC 1 ""))]
"TARGET_HARD_FLOAT"
{
if (memory_operand (operands[0], FCCmode)
&& memory_operand (operands[1], FCCmode))
operands[1] = force_reg (FCCmode, operands[1]);
})
(define_insn "movfcc_internal"
[(set (match_operand:FCC 0 "nonimmediate_operand"
"=z,z,*f,*f,*r,*r,*m,*f,*r,z,*r")
(match_operand:FCC 1 "reg_or_0_operand"
"J,*f,z,*f,J*r,*m,J*r,J*r,*f,*r,z"))]
"TARGET_HARD_FLOAT"
"@
fcmp.caf.s\t%0,$f0,$f0
movfr2cf\t%0,%1
movcf2fr\t%0,%1
fmov.s\t%0,%1
or\t%0,%z1,$r0
ld.b\t%0,%1
st.b\t%z1,%0
movgr2fr.w\t%0,%1
movfr2gr.s\t%0,%1
movgr2cf\t%0,%1
movcf2gr\t%0,%1"
[(set_attr "type" "move")
(set_attr "mode" "FCC")])
(define_insn "fcc_to_"
[(set (match_operand:X 0 "register_operand" "=r")
(if_then_else:X (ne (match_operand:FCC 1 "register_operand" "0")
(const_int 0))
(const_int 1)
(const_int 0)))]
"TARGET_HARD_FLOAT"
""
[(set_attr "length" "0")
(set_attr "type" "ghost")])
(define_expand "cstore4"
[(set (match_operand:SI 0 "register_operand")
(match_operator:SI 1 "loongarch_fcmp_operator"
[(match_operand:ANYF 2 "register_operand")
(match_operand:ANYF 3 "register_operand")]))]
""
{
rtx fcc = gen_reg_rtx (FCCmode);
rtx cmp = gen_rtx_fmt_ee (GET_CODE (operands[1]), FCCmode,
operands[2], operands[3]);
emit_insn (gen_rtx_SET (fcc, cmp));
if (TARGET_64BIT)
{
rtx gpr = gen_reg_rtx (DImode);
emit_insn (gen_fcc_to_di (gpr, fcc));
emit_insn (gen_rtx_SET (operands[0],
lowpart_subreg (SImode, gpr, DImode)));
}
else
emit_insn (gen_fcc_to_si (operands[0], fcc));
DONE;
})
;; Conditional move instructions.
(define_insn "*sel_using_"
[(set (match_operand:GPR 0 "register_operand" "=r,r")
(if_then_else:GPR
(equality_op:GPR2 (match_operand:GPR2 1 "register_operand" "r,r")
(const_int 0))
(match_operand:GPR 2 "reg_or_0_operand" "r,J")
(match_operand:GPR 3 "reg_or_0_operand" "J,r")))]
"register_operand (operands[2], mode)
!= register_operand (operands[3], mode)"
"@
\t%0,%2,%1
\t%0,%3,%1"
[(set_attr "type" "condmove")
(set_attr "mode" "")])
;; fsel copies the 3rd argument when the 1st is non-zero and the 2nd
;; argument if the 1st is zero. This means operand 2 and 3 are
;; inverted in the instruction.
(define_insn "*sel"
[(set (match_operand:ANYF 0 "register_operand" "=f")
(if_then_else:ANYF
(ne:FCC (match_operand:FCC 1 "register_operand" "z")
(const_int 0))
(match_operand:ANYF 2 "reg_or_0_operand" "f")
(match_operand:ANYF 3 "reg_or_0_operand" "f")))]
""
"fsel\t%0,%3,%2,%1"
[(set_attr "type" "condmove")
(set_attr "mode" "")])
;; These are the main define_expand's used to make conditional moves.
(define_expand "movcc"
[(set (match_operand:GPR 0 "register_operand")
(if_then_else:GPR (match_operator 1 "comparison_operator"
[(match_operand:GPR 2 "reg_or_0_operand")
(match_operand:GPR 3 "reg_or_0_operand")])))]
"TARGET_COND_MOVE_INT"
{
if (!INTEGRAL_MODE_P (GET_MODE (XEXP (operands[1], 0))))
FAIL;
loongarch_expand_conditional_move (operands);
DONE;
})
(define_expand "movcc"
[(set (match_operand:ANYF 0 "register_operand")
(if_then_else:ANYF (match_operator 1 "comparison_operator"
[(match_operand:ANYF 2 "reg_or_0_operand")
(match_operand:ANYF 3 "reg_or_0_operand")])))]
"TARGET_COND_MOVE_FLOAT"
{
if (!FLOAT_MODE_P (GET_MODE (XEXP (operands[1], 0))))
FAIL;
loongarch_expand_conditional_move (operands);
DONE;
})
(define_insn "lu32i_d"
[(set (match_operand:DI 0 "register_operand" "=r")
(ior:DI
(zero_extend:DI
(subreg:SI (match_operand:DI 1 "register_operand" "0") 0))
(match_operand:DI 2 "const_lu32i_operand" "u")))]
"TARGET_64BIT"
"lu32i.d\t%0,%X2>>32"
[(set_attr "type" "arith")
(set_attr "mode" "DI")])
(define_insn "lu52i_d"
[(set (match_operand:DI 0 "register_operand" "=r")
(ior:DI
(and:DI (match_operand:DI 1 "register_operand" "r")
(match_operand 2 "lu52i_mask_operand"))
(match_operand 3 "const_lu52i_operand" "v")))]
"TARGET_64BIT"
"lu52i.d\t%0,%1,%X3>>52"
[(set_attr "type" "arith")
(set_attr "mode" "DI")])
;; Instructions for adding the low 12 bits of an address to a register.
;; Operand 2 is the address: loongarch_print_operand works out which relocation
;; should be applied.
(define_insn "*low"
[(set (match_operand:P 0 "register_operand" "=r")
(lo_sum:P (match_operand:P 1 "register_operand" " r")
(match_operand:P 2 "symbolic_operand" "")))]
""
"addi.\t%0,%1,%L2"
[(set_attr "type" "arith")
(set_attr "mode" "")])
(define_insn "@tls_low"
[(set (match_operand:P 0 "register_operand" "=r")
(unspec:P [(mem:P (lo_sum:P (match_operand:P 1 "register_operand" "r")
(match_operand:P 2 "symbolic_operand" "")))]
UNSPEC_TLS_LOW))]
""
"addi.\t%0,%1,%L2"
[(set_attr "type" "arith")
(set_attr "mode" "")])
;; Instructions for loading address from GOT entry.
;; operands[1] is pc plus the high half of the address difference with the got
;; entry;
;; operands[2] is low 12 bits for low 12 bit of the address difference with the
;; got entry.
;; loongarch_print_operand works out which relocation should be applied.
(define_insn "@ld_from_got"
[(set (match_operand:P 0 "register_operand" "=r")
(unspec:P [(mem:P (lo_sum:P
(match_operand:P 1 "register_operand" "r")
(match_operand:P 2 "symbolic_operand")))]
UNSPEC_LOAD_FROM_GOT))]
""
"%Q2ld.\t%0,%1,%L2"
[(set_attr "type" "move")]
)
(define_insn "@lui_l_hi20"
[(set (match_operand:P 0 "register_operand" "=r")
(unspec:P [(match_operand:P 1 "symbolic_operand")]
UNSPEC_LUI_L_HI20))]
""
"lu12i.w\t%0,%r1"
[(set_attr "type" "move")]
)
(define_insn "@pcalau12i"
[(set (match_operand:P 0 "register_operand" "=j")
(unspec:P [(match_operand:P 1 "symbolic_operand" "")]
UNSPEC_PCALAU12I))]
""
"pcalau12i\t%0,%%pc_hi20(%1)"
[(set_attr "type" "move")])
;; @pcalau12i may be used for sibcall so it has a strict constraint. This
;; allows any general register as the operand.
(define_insn "@pcalau12i_gr"
[(set (match_operand:P 0 "register_operand" "=r")
(unspec:P [(match_operand:P 1 "symbolic_operand" "")]
UNSPEC_PCALAU12I_GR))]
""
"pcalau12i\t%0,%%pc_hi20(%1)"
[(set_attr "type" "move")])
(define_insn "@add_tls_le_relax