| ;;- Machine description for Renesas / SuperH SH. |
| ;; Copyright (C) 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, |
| ;; 2003, 2004 Free Software Foundation, Inc. |
| ;; Contributed by Steve Chamberlain (sac@cygnus.com). |
| ;; Improved by Jim Wilson (wilson@cygnus.com). |
| |
| ;; This file is part of GCC. |
| |
| ;; GCC is free software; you can redistribute it and/or modify |
| ;; it under the terms of the GNU General Public License as published by |
| ;; the Free Software Foundation; either version 2, or (at your option) |
| ;; any later version. |
| |
| ;; GCC is distributed in the hope that it will be useful, |
| ;; but WITHOUT ANY WARRANTY; without even the implied warranty of |
| ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| ;; GNU General Public License for more details. |
| |
| ;; You should have received a copy of the GNU General Public License |
| ;; along with GCC; see the file COPYING. If not, write to |
| ;; the Free Software Foundation, 59 Temple Place - Suite 330, |
| ;; Boston, MA 02111-1307, USA. |
| |
| |
| ;; ??? Should prepend a * to all pattern names which are not used. |
| ;; This will make the compiler smaller, and rebuilds after changes faster. |
| |
| ;; ??? Should be enhanced to include support for many more GNU superoptimizer |
| ;; sequences. Especially the sequences for arithmetic right shifts. |
| |
| ;; ??? Should check all DImode patterns for consistency and usefulness. |
| |
| ;; ??? The MAC.W and MAC.L instructions are not supported. There is no |
| ;; way to generate them. |
| |
| ;; ??? The cmp/str instruction is not supported. Perhaps it can be used |
| ;; for a str* inline function. |
| |
| ;; BSR is not generated by the compiler proper, but when relaxing, it |
| ;; generates .uses pseudo-ops that allow linker relaxation to create |
| ;; BSR. This is actually implemented in bfd/{coff,elf32}-sh.c |
| |
| ;; Special constraints for SH machine description: |
| ;; |
| ;; t -- T |
| ;; x -- mac |
| ;; l -- pr |
| ;; z -- r0 |
| ;; |
| ;; Special formats used for outputting SH instructions: |
| ;; |
| ;; %. -- print a .s if insn needs delay slot |
| ;; %@ -- print rte/rts if is/isn't an interrupt function |
| ;; %# -- output a nop if there is nothing to put in the delay slot |
| ;; %O -- print a constant without the # |
| ;; %R -- print the lsw reg of a double |
| ;; %S -- print the msw reg of a double |
| ;; %T -- print next word of a double REG or MEM |
| ;; |
| ;; Special predicates: |
| ;; |
| ;; arith_operand -- operand is valid source for arithmetic op |
| ;; arith_reg_operand -- operand is valid register for arithmetic op |
| ;; general_movdst_operand -- operand is valid move destination |
| ;; general_movsrc_operand -- operand is valid move source |
| ;; logical_operand -- operand is valid source for logical op |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Constants |
| ;; ------------------------------------------------------------------------- |
| |
| (define_constants [ |
| (AP_REG 145) |
| (PR_REG 146) |
| (T_REG 147) |
| (GBR_REG 144) |
| (MACH_REG 148) |
| (MACL_REG 149) |
| (FPUL_REG 150) |
| (RAP_REG 152) |
| |
| (FPSCR_REG 151) |
| |
| (PIC_REG 12) |
| (FP_REG 14) |
| (SP_REG 15) |
| |
| (PR_MEDIA_REG 18) |
| (T_MEDIA_REG 19) |
| |
| (R0_REG 0) |
| (R1_REG 1) |
| (R2_REG 2) |
| (R3_REG 3) |
| (R4_REG 4) |
| (R5_REG 5) |
| (R6_REG 6) |
| (R7_REG 7) |
| (R8_REG 8) |
| (R9_REG 9) |
| (R10_REG 10) |
| (R20_REG 20) |
| (R21_REG 21) |
| (R22_REG 22) |
| (R23_REG 23) |
| |
| (DR0_REG 64) |
| (DR2_REG 66) |
| (DR4_REG 68) |
| (FR23_REG 87) |
| |
| (TR0_REG 128) |
| (TR1_REG 129) |
| (TR2_REG 130) |
| |
| (XD0_REG 136) |
| |
| ;; These are used with unspec. |
| (UNSPEC_COMPACT_ARGS 0) |
| (UNSPEC_MOVA 1) |
| (UNSPEC_CASESI 2) |
| (UNSPEC_DATALABEL 3) |
| (UNSPEC_BBR 4) |
| (UNSPEC_SFUNC 5) |
| (UNSPEC_PIC 6) |
| (UNSPEC_GOT 7) |
| (UNSPEC_GOTOFF 8) |
| (UNSPEC_PLT 9) |
| (UNSPEC_CALLER 10) |
| (UNSPEC_GOTPLT 11) |
| (UNSPEC_ICACHE 12) |
| (UNSPEC_INIT_TRAMP 13) |
| (UNSPEC_FCOSA 14) |
| (UNSPEC_FSRRA 15) |
| (UNSPEC_FSINA 16) |
| (UNSPEC_NSB 17) |
| (UNSPEC_ALLOCO 18) |
| (UNSPEC_EH_RETURN 19) |
| (UNSPEC_TLSGD 20) |
| (UNSPEC_TLSLDM 21) |
| (UNSPEC_TLSIE 22) |
| (UNSPEC_DTPOFF 23) |
| (UNSPEC_GOTTPOFF 24) |
| (UNSPEC_TPOFF 25) |
| (UNSPEC_RA 26) |
| |
| ;; These are used with unspec_volatile. |
| (UNSPECV_BLOCKAGE 0) |
| (UNSPECV_ALIGN 1) |
| (UNSPECV_CONST2 2) |
| (UNSPECV_CONST4 4) |
| (UNSPECV_CONST8 6) |
| (UNSPECV_WINDOW_END 10) |
| (UNSPECV_CONST_END 11) |
| ]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Attributes |
| ;; ------------------------------------------------------------------------- |
| |
| ;; Target CPU. |
| |
| (define_attr "cpu" |
| "sh1,sh2,sh2e,sh3,sh3e,sh4,sh5" |
| (const (symbol_ref "sh_cpu_attr"))) |
| |
| (define_attr "endian" "big,little" |
| (const (if_then_else (symbol_ref "TARGET_LITTLE_ENDIAN") |
| (const_string "little") (const_string "big")))) |
| |
| ;; Indicate if the default fpu mode is single precision. |
| (define_attr "fpu_single" "yes,no" |
| (const (if_then_else (symbol_ref "TARGET_FPU_SINGLE") |
| (const_string "yes") (const_string "no")))) |
| |
| (define_attr "fmovd" "yes,no" |
| (const (if_then_else (symbol_ref "TARGET_FMOVD") |
| (const_string "yes") (const_string "no")))) |
| ;; pipeline model |
| (define_attr "pipe_model" "sh1,sh4,sh5media" |
| (const |
| (cond [(symbol_ref "TARGET_SHMEDIA") (const_string "sh5media") |
| (symbol_ref "TARGET_SUPERSCALAR") (const_string "sh4")] |
| (const_string "sh1")))) |
| |
| ;; cbranch conditional branch instructions |
| ;; jump unconditional jumps |
| ;; arith ordinary arithmetic |
| ;; arith3 a compound insn that behaves similarly to a sequence of |
| ;; three insns of type arith |
| ;; arith3b like above, but might end with a redirected branch |
| ;; load from memory |
| ;; load_si Likewise, SImode variant for general register. |
| ;; fload Likewise, but load to fp register. |
| ;; store to memory |
| ;; move general purpose register to register |
| ;; mt_group other sh4 mt instructions |
| ;; fmove register to register, floating point |
| ;; smpy word precision integer multiply |
| ;; dmpy longword or doublelongword precision integer multiply |
| ;; return rts |
| ;; pload load of pr reg, which can't be put into delay slot of rts |
| ;; prset copy register to pr reg, ditto |
| ;; pstore store of pr reg, which can't be put into delay slot of jsr |
| ;; prget copy pr to register, ditto |
| ;; pcload pc relative load of constant value |
| ;; pcfload Likewise, but load to fp register. |
| ;; pcload_si Likewise, SImode variant for general register. |
| ;; rte return from exception |
| ;; sfunc special function call with known used registers |
| ;; call function call |
| ;; fp floating point |
| ;; fdiv floating point divide (or square root) |
| ;; gp_fpul move from general purpose register to fpul |
| ;; fpul_gp move from fpul to general purpose register |
| ;; mac_gp move from mac[lh] to general purpose register |
| ;; dfp_arith, dfp_cmp,dfp_conv |
| ;; ftrc_s fix_truncsfsi2_i4 |
| ;; dfdiv double precision floating point divide (or square root) |
| ;; cwb ic_invalidate_line_i |
| ;; tls_load load TLS related address |
| ;; arith_media SHmedia arithmetic, logical, and shift instructions |
| ;; cbranch_media SHmedia conditional branch instructions |
| ;; cmp_media SHmedia compare instructions |
| ;; dfdiv_media SHmedia double precision divide and square root |
| ;; dfmul_media SHmedia double precision multiply instruction |
| ;; dfparith_media SHmedia double precision floating point arithmetic |
| ;; dfpconv_media SHmedia double precision floating point conversions |
| ;; dmpy_media SHmedia longword multiply |
| ;; fcmp_media SHmedia floating point compare instructions |
| ;; fdiv_media SHmedia single precision divide and square root |
| ;; fload_media SHmedia floating point register load instructions |
| ;; fmove_media SHmedia floating point register moves (inc. fabs and fneg) |
| ;; fparith_media SHmedia single precision floating point arithmetic |
| ;; fpconv_media SHmedia single precision floating point conversions |
| ;; fstore_media SHmedia floating point register store instructions |
| ;; gettr_media SHmedia gettr instruction |
| ;; invalidate_line_media SHmedia invalidate_line sequence |
| ;; jump_media SHmedia unconditional branch instructions |
| ;; load_media SHmedia general register load instructions |
| ;; pt_media SHmedia pt instruction (expanded by assembler) |
| ;; ptabs_media SHmedia ptabs instruction |
| ;; store_media SHmedia general register store instructions |
| ;; mcmp_media SHmedia multimedia compare, absolute, saturating ops |
| ;; mac_media SHmedia mac-style fixed point operations |
| ;; d2mpy_media SHmedia: two 32 bit integer multiplies |
| ;; atrans SHmedia approximate transcendental functions |
| ;; ustore_media SHmedia unaligned stores |
| ;; nil no-op move, will be deleted. |
| |
| (define_attr "type" |
| "mt_group,cbranch,jump,jump_ind,arith,arith3,arith3b,dyn_shift,load,load_si,fload,store,move,fmove,smpy,dmpy,return,pload,prset,pstore,prget,pcload,pcload_si,pcfload,rte,sfunc,call,fp,fdiv,ftrc_s,dfp_arith,dfp_cmp,dfp_conv,dfdiv,gp_fpul,fpul_gp,mac_gp,mem_fpscr,gp_fpscr,cwb,tls_load,arith_media,cbranch_media,cmp_media,dfdiv_media,dfmul_media,dfparith_media,dfpconv_media,dmpy_media,fcmp_media,fdiv_media,fload_media,fmove_media,fparith_media,fpconv_media,fstore_media,gettr_media,invalidate_line_media,jump_media,load_media,pt_media,ptabs_media,store_media,mcmp_media,mac_media,d2mpy_media,atrans_media,ustore_media,nil,other" |
| (const_string "other")) |
| |
| ;; We define a new attribute namely "insn_class".We use |
| ;; this for the DFA based pipeline description. |
| ;; |
| ;; mt_group SH4 "mt" group instructions. |
| ;; |
| ;; ex_group SH4 "ex" group instructions. |
| ;; |
| ;; ls_group SH4 "ls" group instructions. |
| ;; |
| |
| (define_attr "insn_class" |
| "mt_group,ex_group,ls_group,br_group,fe_group,co_group,none" |
| (cond [(eq_attr "type" "move,mt_group") (const_string "mt_group") |
| (eq_attr "type" "arith,dyn_shift") (const_string "ex_group") |
| (eq_attr "type" "fmove,load,pcload,load_si,pcload_si,fload,pcfload,store,gp_fpul,fpul_gp") (const_string "ls_group") |
| (eq_attr "type" "cbranch,jump") (const_string "br_group") |
| (eq_attr "type" "fp,fdiv,ftrc_s,dfp_arith,dfp_conv,dfdiv") |
| (const_string "fe_group") |
| (eq_attr "type" "jump_ind,smpy,dmpy,mac_gp,return,pload,prset,pstore,prget,rte,sfunc,call,dfp_cmp,mem_fpscr,gp_fpscr,cwb") (const_string "co_group")] |
| (const_string "none"))) |
| ;; nil are zero instructions, and arith3 / arith3b are multiple instructions, |
| ;; so these do not belong in an insn group, although they are modeled |
| ;; with their own define_insn_reservations. |
| |
| ;; Indicate what precision must be selected in fpscr for this insn, if any. |
| |
| (define_attr "fp_mode" "single,double,none" (const_string "none")) |
| |
| ;; Indicate if the fpu mode is set by this instruction |
| ;; "unknown" must have the value as "none" in fp_mode, and means |
| ;; that the instruction/abi has left the processor in an unknown |
| ;; state. |
| ;; "none" means that nothing has changed and no mode is set. |
| ;; This attribute is only used for the Renesas ABI. |
| (define_attr "fp_set" "single,double,unknown,none" (const_string "none")) |
| |
| ; If a conditional branch destination is within -252..258 bytes away |
| ; from the instruction it can be 2 bytes long. Something in the |
| ; range -4090..4100 bytes can be 6 bytes long. All other conditional |
| ; branches are initially assumed to be 16 bytes long. |
| ; In machine_dependent_reorg, we split all branches that are longer than |
| ; 2 bytes. |
| |
| ;; The maximum range used for SImode constant pool entries is 1018. A final |
| ;; instruction can add 8 bytes while only being 4 bytes in size, thus we |
| ;; can have a total of 1022 bytes in the pool. Add 4 bytes for a branch |
| ;; instruction around the pool table, 2 bytes of alignment before the table, |
| ;; and 30 bytes of alignment after the table. That gives a maximum total |
| ;; pool size of 1058 bytes. |
| ;; Worst case code/pool content size ratio is 1:2 (using asms). |
| ;; Thus, in the worst case, there is one instruction in front of a maximum |
| ;; sized pool, and then there are 1052 bytes of pool for every 508 bytes of |
| ;; code. For the last n bytes of code, there are 2n + 36 bytes of pool. |
| ;; If we have a forward branch, the initial table will be put after the |
| ;; unconditional branch. |
| ;; |
| ;; ??? We could do much better by keeping track of the actual pcloads within |
| ;; the branch range and in the pcload range in front of the branch range. |
| |
| ;; ??? This looks ugly because genattrtab won't allow if_then_else or cond |
| ;; inside an le. |
| (define_attr "short_cbranch_p" "no,yes" |
| (cond [(ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 252)) (const_int 506)) |
| (const_string "yes") |
| (ne (symbol_ref "NEXT_INSN (PREV_INSN (insn)) != insn") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 252)) (const_int 508)) |
| (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "med_branch_p" "no,yes" |
| (cond [(leu (plus (minus (match_dup 0) (pc)) (const_int 990)) |
| (const_int 1988)) |
| (const_string "yes") |
| (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 4092)) |
| (const_int 8186)) |
| (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "med_cbranch_p" "no,yes" |
| (cond [(leu (plus (minus (match_dup 0) (pc)) (const_int 988)) |
| (const_int 1986)) |
| (const_string "yes") |
| (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 4090)) |
| (const_int 8184)) |
| (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "braf_branch_p" "no,yes" |
| (cond [(ne (symbol_ref "! TARGET_SH2") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 10330)) |
| (const_int 20660)) |
| (const_string "yes") |
| (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 32764)) |
| (const_int 65530)) |
| (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "braf_cbranch_p" "no,yes" |
| (cond [(ne (symbol_ref "! TARGET_SH2") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 10328)) |
| (const_int 20658)) |
| (const_string "yes") |
| (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) |
| (const_string "no") |
| (leu (plus (minus (match_dup 0) (pc)) (const_int 32762)) |
| (const_int 65528)) |
| (const_string "yes") |
| ] (const_string "no"))) |
| |
| ; An unconditional jump in the range -4092..4098 can be 2 bytes long. |
| ; For wider ranges, we need a combination of a code and a data part. |
| ; If we can get a scratch register for a long range jump, the code |
| ; part can be 4 bytes long; otherwise, it must be 8 bytes long. |
| ; If the jump is in the range -32764..32770, the data part can be 2 bytes |
| ; long; otherwise, it must be 6 bytes long. |
| |
| ; All other instructions are two bytes long by default. |
| |
| ;; ??? This should use something like *branch_p (minus (match_dup 0) (pc)), |
| ;; but getattrtab doesn't understand this. |
| (define_attr "length" "" |
| (cond [(eq_attr "type" "cbranch") |
| (cond [(eq_attr "short_cbranch_p" "yes") |
| (const_int 2) |
| (eq_attr "med_cbranch_p" "yes") |
| (const_int 6) |
| (eq_attr "braf_cbranch_p" "yes") |
| (const_int 12) |
| ;; ??? using pc is not computed transitively. |
| (ne (match_dup 0) (match_dup 0)) |
| (const_int 14) |
| (ne (symbol_ref ("flag_pic")) (const_int 0)) |
| (const_int 24) |
| ] (const_int 16)) |
| (eq_attr "type" "jump") |
| (cond [(eq_attr "med_branch_p" "yes") |
| (const_int 2) |
| (and (eq (symbol_ref "GET_CODE (prev_nonnote_insn (insn))") |
| (symbol_ref "INSN")) |
| (eq (symbol_ref "INSN_CODE (prev_nonnote_insn (insn))") |
| (symbol_ref "code_for_indirect_jump_scratch"))) |
| (if_then_else (eq_attr "braf_branch_p" "yes") |
| (const_int 6) |
| (const_int 10)) |
| (eq_attr "braf_branch_p" "yes") |
| (const_int 10) |
| ;; ??? using pc is not computed transitively. |
| (ne (match_dup 0) (match_dup 0)) |
| (const_int 12) |
| (ne (symbol_ref ("flag_pic")) (const_int 0)) |
| (const_int 22) |
| ] (const_int 14)) |
| (eq_attr "type" "pt_media") |
| (if_then_else (ne (symbol_ref "TARGET_SHMEDIA64") (const_int 0)) |
| (const_int 20) (const_int 12)) |
| ] (if_then_else (ne (symbol_ref "TARGET_SHMEDIA") (const_int 0)) |
| (const_int 4) |
| (const_int 2)))) |
| |
| ;; (define_function_unit {name} {num-units} {n-users} {test} |
| ;; {ready-delay} {issue-delay} [{conflict-list}]) |
| |
| ;; Load and store instructions save a cycle if they are aligned on a |
| ;; four byte boundary. Using a function unit for stores encourages |
| ;; gcc to separate load and store instructions by one instruction, |
| ;; which makes it more likely that the linker will be able to word |
| ;; align them when relaxing. |
| |
| ;; Loads have a latency of two. |
| ;; However, call insns can have a delay slot, so that we want one more |
| ;; insn to be scheduled between the load of the function address and the call. |
| ;; This is equivalent to a latency of three. |
| ;; We cannot use a conflict list for this, because we need to distinguish |
| ;; between the actual call address and the function arguments. |
| ;; ADJUST_COST can only properly handle reductions of the cost, so we |
| ;; use a latency of three here. |
| ;; We only do this for SImode loads of general registers, to make the work |
| ;; for ADJUST_COST easier. |
| (define_function_unit "memory" 1 0 |
| (and (eq_attr "pipe_model" "sh1") |
| (eq_attr "type" "load_si,pcload_si")) |
| 3 2) |
| (define_function_unit "memory" 1 0 |
| (and (eq_attr "pipe_model" "sh1") |
| (eq_attr "type" "load,pcload,pload,store,pstore")) |
| 2 2) |
| |
| (define_function_unit "int" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "arith3,arith3b")) 3 3) |
| |
| (define_function_unit "int" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "dyn_shift")) 2 2) |
| |
| (define_function_unit "int" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "!arith3,arith3b,dyn_shift")) 1 1) |
| |
| ;; ??? These are approximations. |
| (define_function_unit "mpy" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "smpy")) 2 2) |
| (define_function_unit "mpy" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "dmpy")) 3 3) |
| |
| (define_function_unit "fp" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "fp,fmove")) 2 1) |
| (define_function_unit "fp" 1 0 |
| (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "fdiv")) 13 12) |
| |
| |
| ;; SH-5 SHmedia scheduling |
| ;; When executing SHmedia code, the SH-5 is a fairly straightforward |
| ;; single-issue machine. It has four pipelines, the branch unit (br), |
| ;; the integer and multimedia unit (imu), the load/store unit (lsu), and |
| ;; the floating point unit (fpu). |
| ;; Here model the instructions with a latency greater than one cycle. |
| |
| ;; Every instruction on SH-5 occupies the issue resource for at least one |
| ;; cycle. |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "!pt_media,ptabs_media,invalidate_line_media,dmpy_media,load_media,fload_media,fcmp_media,fmove_media,fparith_media,dfparith_media,fpconv_media,dfpconv_media,dfmul_media,store_media,fstore_media,mcmp_media,mac_media,d2mpy_media,atrans_media,ustore_media")) 1 1) |
| |
| ;; Specify the various types of instruction which have latency > 1 |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "mcmp_media")) 2 1) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "dmpy_media,load_media,fcmp_media,mac_media")) 3 1) |
| ;; but see sh_adjust_cost for mac_media exception. |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "fload_media,fmove_media")) 4 1) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "d2mpy_media")) 4 2) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "pt_media,ptabs_media")) 5 1) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "fparith_media,dfparith_media,fpconv_media,dfpconv_media")) 6 1) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") |
| (eq_attr "type" "invalidate_line_media")) 7 7) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "dfmul_media")) 9 4) |
| |
| (define_function_unit "sh5issue" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "atrans_media")) 10 5) |
| |
| ;; Floating-point divide and square-root occupy an additional resource, |
| ;; which is not internally pipelined. However, other instructions |
| ;; can continue to issue. |
| (define_function_unit "sh5fds" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "fdiv_media")) 19 19) |
| |
| (define_function_unit "sh5fds" 1 0 |
| (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "dfdiv_media")) 35 35) |
| |
| ; Definitions for filling branch delay slots. |
| |
| (define_attr "needs_delay_slot" "yes,no" (const_string "no")) |
| |
| ;; ??? This should be (nil) instead of (const_int 0) |
| (define_attr "hit_stack" "yes,no" |
| (cond [(eq (symbol_ref "find_regno_note (insn, REG_INC, SP_REG)") |
| (const_int 0)) |
| (const_string "no")] |
| (const_string "yes"))) |
| |
| (define_attr "interrupt_function" "no,yes" |
| (const (symbol_ref "current_function_interrupt"))) |
| |
| (define_attr "in_delay_slot" "yes,no" |
| (cond [(eq_attr "type" "cbranch") (const_string "no") |
| (eq_attr "type" "pcload,pcload_si") (const_string "no") |
| (eq_attr "needs_delay_slot" "yes") (const_string "no") |
| (eq_attr "length" "2") (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "cond_delay_slot" "yes,no" |
| (cond [(eq_attr "in_delay_slot" "yes") (const_string "yes") |
| ] (const_string "no"))) |
| |
| (define_attr "is_sfunc" "" |
| (if_then_else (eq_attr "type" "sfunc") (const_int 1) (const_int 0))) |
| |
| (define_attr "is_mac_media" "" |
| (if_then_else (eq_attr "type" "mac_media") (const_int 1) (const_int 0))) |
| |
| (define_attr "branch_zero" "yes,no" |
| (cond [(eq_attr "type" "!cbranch") (const_string "no") |
| (ne (symbol_ref "(next_active_insn (insn)\ |
| == (prev_active_insn\ |
| (XEXP (SET_SRC (PATTERN (insn)), 1))))\ |
| && get_attr_length (next_active_insn (insn)) == 2") |
| (const_int 0)) |
| (const_string "yes")] |
| (const_string "no"))) |
| |
| ;; SH4 Double-precision computation with double-precision result - |
| ;; the two halves are ready at different times. |
| (define_attr "dfp_comp" "yes,no" |
| (cond [(eq_attr "type" "dfp_arith,dfp_conv,dfdiv") (const_string "yes")] |
| (const_string "no"))) |
| |
| ;; Insns for which the latency of a preceding fp insn is decreased by one. |
| (define_attr "late_fp_use" "yes,no" (const_string "no")) |
| ;; And feeding insns for which this relevant. |
| (define_attr "any_fp_comp" "yes,no" |
| (cond [(eq_attr "type" "fp,fdiv,ftrc_s,dfp_arith,dfp_conv,dfdiv") |
| (const_string "yes")] |
| (const_string "no"))) |
| |
| (define_attr "any_int_load" "yes,no" |
| (cond [(eq_attr "type" "load,load_si,pcload,pcload_si") |
| (const_string "yes")] |
| (const_string "no"))) |
| |
| (define_delay |
| (eq_attr "needs_delay_slot" "yes") |
| [(eq_attr "in_delay_slot" "yes") (nil) (nil)]) |
| |
| ;; On the SH and SH2, the rte instruction reads the return pc from the stack, |
| ;; and thus we can't put a pop instruction in its delay slot. |
| ;; ??? On the SH3, the rte instruction does not use the stack, so a pop |
| ;; instruction can go in the delay slot. |
| |
| ;; Since a normal return (rts) implicitly uses the PR register, |
| ;; we can't allow PR register loads in an rts delay slot. |
| |
| (define_delay |
| (eq_attr "type" "return") |
| [(and (eq_attr "in_delay_slot" "yes") |
| (ior (and (eq_attr "interrupt_function" "no") |
| (eq_attr "type" "!pload,prset")) |
| (and (eq_attr "interrupt_function" "yes") |
| (ior |
| (ne (symbol_ref "TARGET_SH3") (const_int 0)) |
| (eq_attr "hit_stack" "no"))))) (nil) (nil)]) |
| |
| ;; Since a call implicitly uses the PR register, we can't allow |
| ;; a PR register store in a jsr delay slot. |
| |
| (define_delay |
| (ior (eq_attr "type" "call") (eq_attr "type" "sfunc")) |
| [(and (eq_attr "in_delay_slot" "yes") |
| (eq_attr "type" "!pstore,prget")) (nil) (nil)]) |
| |
| ;; Say that we have annulled true branches, since this gives smaller and |
| ;; faster code when branches are predicted as not taken. |
| |
| ;; ??? The non-annulled condition should really be "in_delay_slot", |
| ;; but insns that can be filled in non-annulled get priority over insns |
| ;; that can only be filled in anulled. |
| |
| (define_delay |
| (and (eq_attr "type" "cbranch") |
| (ne (symbol_ref "TARGET_SH2") (const_int 0))) |
| ;; SH2e has a hardware bug that pretty much prohibits the use of |
| ;; annuled delay slots. |
| [(eq_attr "cond_delay_slot" "yes") (and (eq_attr "cond_delay_slot" "yes") |
| (not (eq_attr "cpu" "sh2e"))) (nil)]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; SImode signed integer comparisons |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "" |
| [(set (reg:SI T_REG) |
| (eq:SI (and:SI (match_operand:SI 0 "arith_reg_operand" "z,r") |
| (match_operand:SI 1 "arith_operand" "K08,r")) |
| (const_int 0)))] |
| "TARGET_SH1" |
| "tst %1,%0" |
| [(set_attr "type" "mt_group")]) |
| |
| ;; ??? Perhaps should only accept reg/constant if the register is reg 0. |
| ;; That would still allow reload to create cmpi instructions, but would |
| ;; perhaps allow forcing the constant into a register when that is better. |
| ;; Probably should use r0 for mem/imm compares, but force constant into a |
| ;; register for pseudo/imm compares. |
| |
| (define_insn "cmpeqsi_t" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:SI 0 "arith_reg_operand" "r,z,r") |
| (match_operand:SI 1 "arith_operand" "N,rI08,r")))] |
| "TARGET_SH1" |
| "@ |
| tst %0,%0 |
| cmp/eq %1,%0 |
| cmp/eq %1,%0" |
| [(set_attr "type" "mt_group")]) |
| |
| (define_insn "cmpgtsi_t" |
| [(set (reg:SI T_REG) |
| (gt:SI (match_operand:SI 0 "arith_reg_operand" "r,r") |
| (match_operand:SI 1 "arith_reg_or_0_operand" "r,N")))] |
| "TARGET_SH1" |
| "@ |
| cmp/gt %1,%0 |
| cmp/pl %0" |
| [(set_attr "type" "mt_group")]) |
| |
| (define_insn "cmpgesi_t" |
| [(set (reg:SI T_REG) |
| (ge:SI (match_operand:SI 0 "arith_reg_operand" "r,r") |
| (match_operand:SI 1 "arith_reg_or_0_operand" "r,N")))] |
| "TARGET_SH1" |
| "@ |
| cmp/ge %1,%0 |
| cmp/pz %0" |
| [(set_attr "type" "mt_group")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; SImode unsigned integer comparisons |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "cmpgeusi_t" |
| [(set (reg:SI T_REG) |
| (geu:SI (match_operand:SI 0 "arith_reg_operand" "r") |
| (match_operand:SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "cmp/hs %1,%0" |
| [(set_attr "type" "mt_group")]) |
| |
| (define_insn "cmpgtusi_t" |
| [(set (reg:SI T_REG) |
| (gtu:SI (match_operand:SI 0 "arith_reg_operand" "r") |
| (match_operand:SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "cmp/hi %1,%0" |
| [(set_attr "type" "mt_group")]) |
| |
| ;; We save the compare operands in the cmpxx patterns and use them when |
| ;; we generate the branch. |
| |
| (define_expand "cmpsi" |
| [(set (reg:SI T_REG) |
| (compare (match_operand:SI 0 "cmpsi_operand" "") |
| (match_operand:SI 1 "arith_operand" "")))] |
| "TARGET_SH1" |
| " |
| { |
| if (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == T_REG |
| && GET_CODE (operands[1]) != CONST_INT) |
| operands[0] = copy_to_mode_reg (SImode, operands[0]); |
| sh_compare_op0 = operands[0]; |
| sh_compare_op1 = operands[1]; |
| DONE; |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; DImode signed integer comparisons |
| ;; ------------------------------------------------------------------------- |
| |
| ;; ??? Could get better scheduling by splitting the initial test from the |
| ;; rest of the insn after reload. However, the gain would hardly justify |
| ;; the sh.md size increase necessary to do that. |
| |
| (define_insn "" |
| [(set (reg:SI T_REG) |
| (eq:SI (and:DI (match_operand:DI 0 "arith_reg_operand" "r") |
| (match_operand:DI 1 "arith_operand" "r")) |
| (const_int 0)))] |
| "TARGET_SH1" |
| "* return output_branchy_insn (EQ, \"tst\\t%S1,%S0\;bf\\t%l9\;tst\\t%R1,%R0\", |
| insn, operands);" |
| [(set_attr "length" "6") |
| (set_attr "type" "arith3b")]) |
| |
| (define_insn "cmpeqdi_t" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:DI 0 "arith_reg_operand" "r,r") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "N,r")))] |
| "TARGET_SH1" |
| "@ |
| tst %S0,%S0\;bf %,Ldi%=\;tst %R0,%R0\\n%,Ldi%=: |
| cmp/eq %S1,%S0\;bf %,Ldi%=\;cmp/eq %R1,%R0\\n%,Ldi%=:" |
| [(set_attr "length" "6") |
| (set_attr "type" "arith3b")]) |
| |
| (define_split |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:DI 0 "arith_reg_operand" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "")))] |
| ;; If we applied this split when not optimizing, it would only be |
| ;; applied during the machine-dependent reorg, when no new basic blocks |
| ;; may be created. |
| "TARGET_SH1 && reload_completed && optimize" |
| [(set (reg:SI T_REG) (eq:SI (match_dup 2) (match_dup 3))) |
| (set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_dup 6)) |
| (pc))) |
| (set (reg:SI T_REG) (eq:SI (match_dup 4) (match_dup 5))) |
| (match_dup 6)] |
| " |
| { |
| operands[2] |
| = gen_rtx_REG (SImode, |
| true_regnum (operands[0]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); |
| operands[3] |
| = (operands[1] == const0_rtx |
| ? const0_rtx |
| : gen_rtx_REG (SImode, |
| true_regnum (operands[1]) |
| + (TARGET_LITTLE_ENDIAN ? 1 : 0))); |
| operands[4] = gen_lowpart (SImode, operands[0]); |
| operands[5] = gen_lowpart (SImode, operands[1]); |
| operands[6] = gen_label_rtx (); |
| }") |
| |
| (define_insn "cmpgtdi_t" |
| [(set (reg:SI T_REG) |
| (gt:SI (match_operand:DI 0 "arith_reg_operand" "r,r") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "r,N")))] |
| "TARGET_SH2" |
| "@ |
| cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/gt\\t%S1,%S0\;cmp/hi\\t%R1,%R0\\n%,Ldi%=: |
| tst\\t%S0,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/pl\\t%S0\;cmp/hi\\t%S0,%R0\\n%,Ldi%=:" |
| [(set_attr "length" "8") |
| (set_attr "type" "arith3")]) |
| |
| (define_insn "cmpgedi_t" |
| [(set (reg:SI T_REG) |
| (ge:SI (match_operand:DI 0 "arith_reg_operand" "r,r") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "r,N")))] |
| "TARGET_SH2" |
| "@ |
| cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/ge\\t%S1,%S0\;cmp/hs\\t%R1,%R0\\n%,Ldi%=: |
| cmp/pz\\t%S0" |
| [(set_attr "length" "8,2") |
| (set_attr "type" "arith3,mt_group")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; DImode unsigned integer comparisons |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "cmpgeudi_t" |
| [(set (reg:SI T_REG) |
| (geu:SI (match_operand:DI 0 "arith_reg_operand" "r") |
| (match_operand:DI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH2" |
| "cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/hs\\t%S1,%S0\;cmp/hs\\t%R1,%R0\\n%,Ldi%=:" |
| [(set_attr "length" "8") |
| (set_attr "type" "arith3")]) |
| |
| (define_insn "cmpgtudi_t" |
| [(set (reg:SI T_REG) |
| (gtu:SI (match_operand:DI 0 "arith_reg_operand" "r") |
| (match_operand:DI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH2" |
| "cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/hi\\t%S1,%S0\;cmp/hi\\t%R1,%R0\\n%,Ldi%=:" |
| [(set_attr "length" "8") |
| (set_attr "type" "arith3")]) |
| |
| (define_insn "cmpeqdi_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (eq:DI (match_operand:DI 1 "register_operand" "%r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "Nr")))] |
| "TARGET_SHMEDIA" |
| "cmpeq %1, %N2, %0" |
| [(set_attr "type" "cmp_media")]) |
| |
| (define_insn "cmpgtdi_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (gt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "Nr") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN")))] |
| "TARGET_SHMEDIA" |
| "cmpgt %N1, %N2, %0" |
| [(set_attr "type" "cmp_media")]) |
| |
| (define_insn "cmpgtudi_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (gtu:DI (match_operand:DI 1 "arith_reg_or_0_operand" "Nr") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN")))] |
| "TARGET_SHMEDIA" |
| "cmpgtu %N1, %N2, %0" |
| [(set_attr "type" "cmp_media")]) |
| |
| ;; We save the compare operands in the cmpxx patterns and use them when |
| ;; we generate the branch. |
| |
| (define_expand "cmpdi" |
| [(set (reg:SI T_REG) |
| (compare (match_operand:DI 0 "arith_operand" "") |
| (match_operand:DI 1 "arith_operand" "")))] |
| "TARGET_SH2 || TARGET_SHMEDIA" |
| " |
| { |
| sh_compare_op0 = operands[0]; |
| sh_compare_op1 = operands[1]; |
| DONE; |
| }") |
| ;; ------------------------------------------------------------------------- |
| ;; Conditional move instructions |
| ;; ------------------------------------------------------------------------- |
| |
| ;; The insn names may seem reversed, but note that cmveq performs the move |
| ;; if op1 == 0, and cmvne does it if op1 != 0. |
| |
| (define_insn "movdicc_false" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (if_then_else:DI (eq (match_operand:DI 1 "arith_reg_operand" "r") |
| (const_int 0)) |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN") |
| (match_operand:DI 3 "arith_reg_operand" "0")))] |
| "TARGET_SHMEDIA" |
| "cmveq %1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "movdicc_true" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (if_then_else:DI (ne (match_operand:DI 1 "arith_reg_operand" "r") |
| (const_int 0)) |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN") |
| (match_operand:DI 3 "arith_reg_operand" "0")))] |
| "TARGET_SHMEDIA" |
| "cmvne %1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "movdicc" |
| [(set (match_operand:DI 0 "register_operand" "") |
| (if_then_else:DI (match_operand 1 "comparison_operator" "") |
| (match_operand:DI 2 "register_operand" "") |
| (match_operand:DI 3 "register_operand" "")))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| if ((GET_CODE (operands[1]) == EQ || GET_CODE (operands[1]) == NE) |
| && GET_MODE (sh_compare_op0) == DImode |
| && sh_compare_op1 == const0_rtx) |
| operands[1] = gen_rtx (GET_CODE (operands[1]), VOIDmode, |
| sh_compare_op0, sh_compare_op1); |
| else |
| { |
| rtx tmp; |
| |
| if (no_new_pseudos) |
| FAIL; |
| |
| tmp = gen_reg_rtx (DImode); |
| |
| switch (GET_CODE (operands[1])) |
| { |
| case EQ: |
| emit_insn (gen_seq (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case NE: |
| emit_insn (gen_seq (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case GT: |
| emit_insn (gen_sgt (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case LT: |
| emit_insn (gen_slt (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case GE: |
| emit_insn (gen_slt (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case LE: |
| emit_insn (gen_sgt (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case GTU: |
| emit_insn (gen_sgtu (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case LTU: |
| emit_insn (gen_sltu (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case GEU: |
| emit_insn (gen_sltu (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case LEU: |
| emit_insn (gen_sgtu (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case UNORDERED: |
| emit_insn (gen_sunordered (tmp)); |
| operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case ORDERED: |
| emit_insn (gen_sunordered (tmp)); |
| operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); |
| break; |
| |
| case UNEQ: |
| case UNGE: |
| case UNGT: |
| case UNLE: |
| case UNLT: |
| case LTGT: |
| FAIL; |
| |
| default: |
| abort (); |
| } |
| } |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Addition instructions |
| ;; ------------------------------------------------------------------------- |
| |
| (define_expand "adddi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (plus:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "arith_operand" "")))] |
| "" |
| " |
| { |
| if (TARGET_SH1) |
| { |
| if (no_new_pseudos && ! arith_reg_operand (operands[2], DImode)) |
| FAIL; |
| operands[2] = force_reg (DImode, operands[2]); |
| emit_insn (gen_adddi3_compact (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*adddi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (plus:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") |
| (match_operand:DI 2 "arith_operand" "r,I10")))] |
| "TARGET_SHMEDIA" |
| "@ |
| add %1, %2, %0 |
| addi %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "adddi3z_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (zero_extend:DI |
| (plus:SI (match_operand:SI 1 "extend_reg_operand" "r") |
| (match_operand:SI 2 "extend_reg_or_0_operand" "rN"))))] |
| "TARGET_SHMEDIA" |
| "addz.l %1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "adddi3_compact" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=&r") |
| (plus:DI (match_operand:DI 1 "arith_reg_operand" "%0") |
| (match_operand:DI 2 "arith_reg_operand" "r"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "#" |
| [(set_attr "length" "6")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (plus:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "arith_reg_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed" |
| [(const_int 0)] |
| " |
| { |
| rtx high0, high2, low0 = gen_lowpart (SImode, operands[0]); |
| high0 = gen_rtx_REG (SImode, |
| true_regnum (operands[0]) |
| + (TARGET_LITTLE_ENDIAN ? 1 : 0)); |
| high2 = gen_rtx_REG (SImode, |
| true_regnum (operands[2]) |
| + (TARGET_LITTLE_ENDIAN ? 1 : 0)); |
| emit_insn (gen_clrt ()); |
| emit_insn (gen_addc (low0, low0, gen_lowpart (SImode, operands[2]))); |
| emit_insn (gen_addc1 (high0, high0, high2)); |
| DONE; |
| }") |
| |
| (define_insn "addc" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (plus:SI (plus:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "arith_reg_operand" "r")) |
| (reg:SI T_REG))) |
| (set (reg:SI T_REG) |
| (ltu:SI (plus:SI (match_dup 1) (match_dup 2)) (match_dup 1)))] |
| "TARGET_SH1" |
| "addc %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "addc1" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (plus:SI (plus:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "arith_reg_operand" "r")) |
| (reg:SI T_REG))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "addc %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_expand "addsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (plus:SI (match_operand:SI 1 "arith_operand" "") |
| (match_operand:SI 2 "arith_operand" "")))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| operands[1] = force_reg (SImode, operands[1]); |
| }") |
| |
| (define_insn "addsi3_media" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (plus:SI (match_operand:SI 1 "extend_reg_operand" "%r,r") |
| (match_operand:SI 2 "arith_operand" "r,I10")))] |
| "TARGET_SHMEDIA" |
| "@ |
| add.l %1, %2, %0 |
| addi.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "*addsi3_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (plus:SI (match_operand:SI 1 "arith_operand" "%0") |
| (match_operand:SI 2 "arith_operand" "rI08")))] |
| "TARGET_SH1" |
| "add %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Subtraction instructions |
| ;; ------------------------------------------------------------------------- |
| |
| (define_expand "subdi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (minus:DI (match_operand:DI 1 "arith_reg_or_0_operand" "") |
| (match_operand:DI 2 "arith_reg_operand" "")))] |
| "" |
| " |
| { |
| if (TARGET_SH1) |
| { |
| operands[1] = force_reg (DImode, operands[1]); |
| emit_insn (gen_subdi3_compact (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*subdi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (minus:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rN") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "sub %N1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "subdi3_compact" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=&r") |
| (minus:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (match_operand:DI 2 "arith_reg_operand" "r"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "#" |
| [(set_attr "length" "6")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (minus:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "arith_reg_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed" |
| [(const_int 0)] |
| " |
| { |
| rtx high0, high2, low0 = gen_lowpart (SImode, operands[0]); |
| high0 = gen_rtx_REG (SImode, |
| true_regnum (operands[0]) |
| + (TARGET_LITTLE_ENDIAN ? 1 : 0)); |
| high2 = gen_rtx_REG (SImode, |
| true_regnum (operands[2]) |
| + (TARGET_LITTLE_ENDIAN ? 1 : 0)); |
| emit_insn (gen_clrt ()); |
| emit_insn (gen_subc (low0, low0, gen_lowpart (SImode, operands[2]))); |
| emit_insn (gen_subc1 (high0, high0, high2)); |
| DONE; |
| }") |
| |
| (define_insn "subc" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (minus:SI (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "arith_reg_operand" "r")) |
| (reg:SI T_REG))) |
| (set (reg:SI T_REG) |
| (gtu:SI (minus:SI (minus:SI (match_dup 1) (match_dup 2)) |
| (reg:SI T_REG)) |
| (match_dup 1)))] |
| "TARGET_SH1" |
| "subc %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "subc1" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (minus:SI (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "arith_reg_operand" "r")) |
| (reg:SI T_REG))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "subc %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "*subsi3_internal" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "sub %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "*subsi3_media" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (minus:SI (match_operand:SI 1 "extend_reg_or_0_operand" "rN") |
| (match_operand:SI 2 "extend_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "sub.l %N1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| ;; Convert `constant - reg' to `neg rX; add rX, #const' since this |
| ;; will sometimes save one instruction. Otherwise we might get |
| ;; `mov #const, rY; sub rY,rX; mov rX, rY' if the source and dest regs |
| ;; are the same. |
| |
| (define_expand "subsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (minus:SI (match_operand:SI 1 "arith_operand" "") |
| (match_operand:SI 2 "arith_reg_operand" "")))] |
| "" |
| " |
| { |
| if (TARGET_SH1 && GET_CODE (operands[1]) == CONST_INT) |
| { |
| emit_insn (gen_negsi2 (operands[0], operands[2])); |
| emit_insn (gen_addsi3 (operands[0], operands[0], operands[1])); |
| DONE; |
| } |
| if (TARGET_SHMEDIA) |
| { |
| if (no_new_pseudos && ! arith_reg_or_0_operand (operands[1], SImode)) |
| FAIL; |
| if (operands[1] != const0_rtx) |
| operands[1] = force_reg (SImode, operands[1]); |
| } |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Division instructions |
| ;; ------------------------------------------------------------------------- |
| |
| ;; We take advantage of the library routines which don't clobber as many |
| ;; registers as a normal function call would. |
| |
| ;; The INSN_REFERENCES_ARE_DELAYED in sh.h is problematic because it |
| ;; also has an effect on the register that holds the address of the sfunc. |
| ;; To make this work, we have an extra dummy insn that shows the use |
| ;; of this register for reorg. |
| |
| (define_insn "use_sfunc_addr" |
| [(set (reg:SI PR_REG) |
| (unspec:SI [(match_operand:SI 0 "register_operand" "r")] UNSPEC_SFUNC))] |
| "TARGET_SH1 && check_use_sfunc_addr (insn, operands[0])" |
| "" |
| [(set_attr "length" "0")]) |
| |
| ;; We must use a pseudo-reg forced to reg 0 in the SET_DEST rather than |
| ;; hard register 0. If we used hard register 0, then the next instruction |
| ;; would be a move from hard register 0 to a pseudo-reg. If the pseudo-reg |
| ;; gets allocated to a stack slot that needs its address reloaded, then |
| ;; there is nothing to prevent reload from using r0 to reload the address. |
| ;; This reload would clobber the value in r0 we are trying to store. |
| ;; If we let reload allocate r0, then this problem can never happen. |
| |
| (define_insn "udivsi3_i1" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R4_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "TARGET_SH1 && ! TARGET_SH4" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| ; Since shmedia-nofpu code could be linked against shcompact code, and |
| ; the udivsi3 libcall has the same name, we must consider all registers |
| ; clobbered that are in the union of the registers clobbered by the |
| ; shmedia and the shcompact implementation. Note, if the shcompact |
| ; implementation actually used shcompact code, we'd need to clobber |
| ; also r23 and fr23. |
| (define_insn "udivsi3_i1_media" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_MEDIA_REG)) |
| (clobber (reg:SI PR_MEDIA_REG)) |
| (clobber (reg:SI R20_REG)) |
| (clobber (reg:SI R21_REG)) |
| (clobber (reg:SI R22_REG)) |
| (clobber (reg:DI TR0_REG)) |
| (clobber (reg:DI TR1_REG)) |
| (clobber (reg:DI TR2_REG)) |
| (use (match_operand:DI 1 "target_operand" "b"))] |
| "TARGET_SHMEDIA && ! TARGET_SHMEDIA_FPU" |
| "blink %1, r18" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "udivsi3_i4_media" |
| [(set (match_dup 3) |
| (zero_extend:DI (match_operand:SI 1 "register_operand" ""))) |
| (set (match_dup 4) |
| (zero_extend:DI (match_operand:SI 2 "register_operand" ""))) |
| (set (match_dup 5) (float:DF (match_dup 3))) |
| (set (match_dup 6) (float:DF (match_dup 4))) |
| (set (match_dup 7) (div:DF (match_dup 5) (match_dup 6))) |
| (set (match_dup 8) (fix:DI (match_dup 7))) |
| (set (match_operand:SI 0 "register_operand" "") |
| (truncate:SI (match_dup 8)))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| operands[3] = gen_reg_rtx (DImode); |
| operands[4] = gen_reg_rtx (DImode); |
| operands[5] = gen_reg_rtx (DFmode); |
| operands[6] = gen_reg_rtx (DFmode); |
| operands[7] = gen_reg_rtx (DFmode); |
| operands[8] = gen_reg_rtx (DImode); |
| }") |
| |
| (define_insn "udivsi3_i4" |
| [(set (match_operand:SI 0 "register_operand" "=y") |
| (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:DF DR0_REG)) |
| (clobber (reg:DF DR2_REG)) |
| (clobber (reg:DF DR4_REG)) |
| (clobber (reg:SI R0_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R4_REG)) |
| (clobber (reg:SI R5_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "TARGET_SH4 && ! TARGET_FPU_SINGLE" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "fp_mode" "double") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "udivsi3_i4_single" |
| [(set (match_operand:SI 0 "register_operand" "=y") |
| (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:DF DR0_REG)) |
| (clobber (reg:DF DR2_REG)) |
| (clobber (reg:DF DR4_REG)) |
| (clobber (reg:SI R0_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R4_REG)) |
| (clobber (reg:SI R5_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "(TARGET_HARD_SH4 || TARGET_SHCOMPACT) && TARGET_FPU_SINGLE" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "udivsi3" |
| [(set (match_dup 3) (symbol_ref:SI "__udivsi3")) |
| (set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) |
| (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) |
| (parallel [(set (match_operand:SI 0 "register_operand" "") |
| (udiv:SI (reg:SI R4_REG) |
| (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R4_REG)) |
| (use (match_dup 3))])] |
| "" |
| " |
| { |
| rtx first, last; |
| |
| operands[3] = gen_reg_rtx (Pmode); |
| /* Emit the move of the address to a pseudo outside of the libcall. */ |
| if (TARGET_HARD_SH4 && TARGET_SH2E) |
| { |
| emit_move_insn (operands[3], function_symbol (\"__udivsi3_i4\")); |
| if (TARGET_FPU_SINGLE) |
| last = gen_udivsi3_i4_single (operands[0], operands[3]); |
| else |
| last = gen_udivsi3_i4 (operands[0], operands[3]); |
| } |
| else if (TARGET_SHMEDIA_FPU) |
| { |
| operands[1] = force_reg (SImode, operands[1]); |
| operands[2] = force_reg (SImode, operands[2]); |
| emit_insn (gen_udivsi3_i4_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| else if (TARGET_SH5) |
| { |
| emit_move_insn (operands[3], |
| function_symbol (TARGET_FPU_ANY |
| ? \"__udivsi3_i4\" |
| : \"__udivsi3\")); |
| |
| if (TARGET_SHMEDIA) |
| last = gen_udivsi3_i1_media (operands[0], |
| Pmode == DImode |
| ? operands[3] |
| : gen_rtx_SUBREG (DImode, operands[3], |
| 0)); |
| else if (TARGET_FPU_ANY) |
| last = gen_udivsi3_i4_single (operands[0], operands[3]); |
| else |
| last = gen_udivsi3_i1 (operands[0], operands[3]); |
| } |
| else |
| { |
| emit_move_insn (operands[3], function_symbol (\"__udivsi3\")); |
| last = gen_udivsi3_i1 (operands[0], operands[3]); |
| } |
| first = emit_move_insn (gen_rtx_REG (SImode, 4), operands[1]); |
| emit_move_insn (gen_rtx_REG (SImode, 5), operands[2]); |
| last = emit_insn (last); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_insn "divsi3_i1" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R3_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "TARGET_SH1 && ! TARGET_SH4" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| ; Since shmedia-nofpu code could be linked against shcompact code, and |
| ; the sdivsi3 libcall has the same name, we must consider all registers |
| ; clobbered that are in the union of the registers clobbered by the |
| ; shmedia and the shcompact implementation. Note, if the shcompact |
| ; implementation actually used shcompact code, we'd need to clobber |
| ; also r22, r23 and fr23. |
| (define_insn "divsi3_i1_media" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI T_MEDIA_REG)) |
| (clobber (reg:SI PR_MEDIA_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R3_REG)) |
| (clobber (reg:SI R20_REG)) |
| (clobber (reg:SI R21_REG)) |
| (clobber (reg:DI TR0_REG)) |
| (clobber (reg:DI TR1_REG)) |
| (clobber (reg:DI TR2_REG)) |
| (use (match_operand:DI 1 "target_operand" "b"))] |
| "TARGET_SHMEDIA && ! TARGET_SHMEDIA_FPU" |
| "blink %1, r18" |
| [(set_attr "type" "sfunc")]) |
| |
| (define_expand "divsi3_i4_media" |
| [(set (match_dup 3) (float:DF (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_dup 4) (float:DF (match_operand:SI 2 "register_operand" "r"))) |
| (set (match_dup 5) (div:DF (match_dup 3) (match_dup 4))) |
| (set (match_operand:SI 0 "register_operand" "=r") |
| (fix:SI (match_dup 5)))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| operands[3] = gen_reg_rtx (DFmode); |
| operands[4] = gen_reg_rtx (DFmode); |
| operands[5] = gen_reg_rtx (DFmode); |
| }") |
| |
| (define_insn "divsi3_i4" |
| [(set (match_operand:SI 0 "register_operand" "=y") |
| (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:DF DR0_REG)) |
| (clobber (reg:DF DR2_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "TARGET_SH4 && ! TARGET_FPU_SINGLE" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "fp_mode" "double") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "divsi3_i4_single" |
| [(set (match_operand:SI 0 "register_operand" "=y") |
| (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:DF DR0_REG)) |
| (clobber (reg:DF DR2_REG)) |
| (clobber (reg:SI R2_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "(TARGET_HARD_SH4 || TARGET_SHCOMPACT) && TARGET_FPU_SINGLE" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "divsi3" |
| [(set (match_dup 3) (symbol_ref:SI "__sdivsi3")) |
| (set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) |
| (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) |
| (parallel [(set (match_operand:SI 0 "register_operand" "") |
| (div:SI (reg:SI R4_REG) |
| (reg:SI R5_REG))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R3_REG)) |
| (use (match_dup 3))])] |
| "" |
| " |
| { |
| rtx first, last; |
| |
| operands[3] = gen_reg_rtx (Pmode); |
| /* Emit the move of the address to a pseudo outside of the libcall. */ |
| if (TARGET_HARD_SH4 && TARGET_SH2E) |
| { |
| emit_move_insn (operands[3], function_symbol (\"__sdivsi3_i4\")); |
| if (TARGET_FPU_SINGLE) |
| last = gen_divsi3_i4_single (operands[0], operands[3]); |
| else |
| last = gen_divsi3_i4 (operands[0], operands[3]); |
| } |
| else if (TARGET_SHMEDIA_FPU) |
| { |
| operands[1] = force_reg (SImode, operands[1]); |
| operands[2] = force_reg (SImode, operands[2]); |
| emit_insn (gen_divsi3_i4_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| else if (TARGET_SH5) |
| { |
| emit_move_insn (operands[3], |
| function_symbol (TARGET_FPU_ANY |
| ? \"__sdivsi3_i4\" |
| : \"__sdivsi3\")); |
| |
| if (TARGET_SHMEDIA) |
| last = gen_divsi3_i1_media (operands[0], |
| Pmode == DImode |
| ? operands[3] |
| : gen_rtx_SUBREG (DImode, operands[3], |
| 0)); |
| else if (TARGET_FPU_ANY) |
| last = gen_divsi3_i4_single (operands[0], operands[3]); |
| else |
| last = gen_divsi3_i1 (operands[0], operands[3]); |
| } |
| else |
| { |
| emit_move_insn (operands[3], function_symbol (\"__sdivsi3\")); |
| last = gen_divsi3_i1 (operands[0], operands[3]); |
| } |
| first = emit_move_insn (gen_rtx_REG (SImode, 4), operands[1]); |
| emit_move_insn (gen_rtx_REG (SImode, 5), operands[2]); |
| last = emit_insn (last); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| DONE; |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Multiplication instructions |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "umulhisi3_i" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (zero_extend:SI |
| (match_operand:HI 0 "arith_reg_operand" "r")) |
| (zero_extend:SI |
| (match_operand:HI 1 "arith_reg_operand" "r"))))] |
| "TARGET_SH1" |
| "mulu.w %1,%0" |
| [(set_attr "type" "smpy")]) |
| |
| (define_insn "mulhisi3_i" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (sign_extend:SI |
| (match_operand:HI 0 "arith_reg_operand" "r")) |
| (sign_extend:SI |
| (match_operand:HI 1 "arith_reg_operand" "r"))))] |
| "TARGET_SH1" |
| "muls.w %1,%0" |
| [(set_attr "type" "smpy")]) |
| |
| (define_expand "mulhisi3" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (sign_extend:SI |
| (match_operand:HI 1 "arith_reg_operand" "")) |
| (sign_extend:SI |
| (match_operand:HI 2 "arith_reg_operand" "")))) |
| (set (match_operand:SI 0 "arith_reg_operand" "") |
| (reg:SI MACL_REG))] |
| "TARGET_SH1" |
| " |
| { |
| rtx first, last; |
| |
| first = emit_insn (gen_mulhisi3_i (operands[1], operands[2])); |
| last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACL_REG)); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| /* expand_binop can't find a suitable code in umul_widen_optab to |
| make a REG_EQUAL note from, so make one here. |
| See also smulsi3_highpart. |
| ??? Alternatively, we could put this at the calling site of expand_binop, |
| i.e. expand_expr. */ |
| REG_NOTES (last) |
| = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), |
| REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_expand "umulhisi3" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (zero_extend:SI |
| (match_operand:HI 1 "arith_reg_operand" "")) |
| (zero_extend:SI |
| (match_operand:HI 2 "arith_reg_operand" "")))) |
| (set (match_operand:SI 0 "arith_reg_operand" "") |
| (reg:SI MACL_REG))] |
| "TARGET_SH1" |
| " |
| { |
| rtx first, last; |
| |
| first = emit_insn (gen_umulhisi3_i (operands[1], operands[2])); |
| last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACL_REG)); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| /* expand_binop can't find a suitable code in umul_widen_optab to |
| make a REG_EQUAL note from, so make one here. |
| See also smulsi3_highpart. |
| ??? Alternatively, we could put this at the calling site of expand_binop, |
| i.e. expand_expr. */ |
| REG_NOTES (last) |
| = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), |
| REG_NOTES (last)); |
| DONE; |
| }") |
| |
| ;; mulsi3 on the SH2 can be done in one instruction, on the SH1 we generate |
| ;; a call to a routine which clobbers known registers. |
| |
| (define_insn "" |
| [(set (match_operand:SI 1 "register_operand" "=z") |
| (mult:SI (reg:SI R4_REG) (reg:SI R5_REG))) |
| (clobber (reg:SI MACL_REG)) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R3_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R1_REG)) |
| (use (match_operand:SI 0 "arith_reg_operand" "r"))] |
| "TARGET_SH1" |
| "jsr @%0%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "mulsi3_call" |
| [(set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) |
| (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) |
| (parallel[(set (match_operand:SI 0 "register_operand" "") |
| (mult:SI (reg:SI R4_REG) |
| (reg:SI R5_REG))) |
| (clobber (reg:SI MACL_REG)) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R3_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R1_REG)) |
| (use (match_operand:SI 3 "register_operand" ""))])] |
| "TARGET_SH1" |
| "") |
| |
| (define_insn "mul_l" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (match_operand:SI 0 "arith_reg_operand" "r") |
| (match_operand:SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH2" |
| "mul.l %1,%0" |
| [(set_attr "type" "dmpy")]) |
| |
| (define_expand "mulsi3" |
| [(set (reg:SI MACL_REG) |
| (mult:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "arith_reg_operand" ""))) |
| (set (match_operand:SI 0 "arith_reg_operand" "") |
| (reg:SI MACL_REG))] |
| "TARGET_SH1" |
| " |
| { |
| rtx first, last; |
| |
| if (!TARGET_SH2) |
| { |
| /* The address must be set outside the libcall, |
| since it goes into a pseudo. */ |
| rtx sym = function_symbol (\"__mulsi3\"); |
| rtx addr = force_reg (SImode, sym); |
| rtx insns = gen_mulsi3_call (operands[0], operands[1], |
| operands[2], addr); |
| first = insns; |
| last = emit_insn (insns); |
| } |
| else |
| { |
| rtx macl = gen_rtx_REG (SImode, MACL_REG); |
| |
| first = emit_insn (gen_mul_l (operands[1], operands[2])); |
| /* consec_sets_giv can only recognize the first insn that sets a |
| giv as the giv insn. So we must tag this also with a REG_EQUAL |
| note. */ |
| last = emit_insn (gen_movsi_i ((operands[0]), macl)); |
| } |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_insn "mulsidi3_i" |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (sign_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) |
| (const_int 32)))) |
| (set (reg:SI MACL_REG) |
| (mult:SI (match_dup 0) |
| (match_dup 1)))] |
| "TARGET_SH2" |
| "dmuls.l %1,%0" |
| [(set_attr "type" "dmpy")]) |
| |
| (define_expand "mulsidi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "r"))))] |
| "TARGET_SH2 || TARGET_SHMEDIA" |
| " |
| { |
| if (TARGET_SH2) |
| { |
| emit_insn (gen_mulsidi3_compact (operands[0], operands[1], |
| operands[2])); |
| DONE; |
| } |
| }") |
| |
| (define_insn "mulsidi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI (sign_extend:DI (match_operand:SI 1 "extend_reg_operand" "%r")) |
| (sign_extend:DI (match_operand:SI 2 "extend_reg_operand" "r"))))] |
| "TARGET_SHMEDIA" |
| "muls.l %1, %2, %0" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_insn "mulsidi3_compact" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI |
| (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "r")))) |
| (clobber (reg:SI MACH_REG)) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| "#") |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (mult:DI |
| (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) |
| (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "")))) |
| (clobber (reg:SI MACH_REG)) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| [(const_int 0)] |
| " |
| { |
| rtx low_dst = gen_lowpart (SImode, operands[0]); |
| rtx high_dst = gen_highpart (SImode, operands[0]); |
| |
| emit_insn (gen_mulsidi3_i (operands[1], operands[2])); |
| |
| emit_move_insn (low_dst, gen_rtx_REG (SImode, MACL_REG)); |
| emit_move_insn (high_dst, gen_rtx_REG (SImode, MACH_REG)); |
| /* We need something to tag the possible REG_EQUAL notes on to. */ |
| emit_move_insn (operands[0], operands[0]); |
| DONE; |
| }") |
| |
| (define_insn "umulsidi3_i" |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (zero_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) |
| (const_int 32)))) |
| (set (reg:SI MACL_REG) |
| (mult:SI (match_dup 0) |
| (match_dup 1)))] |
| "TARGET_SH2" |
| "dmulu.l %1,%0" |
| [(set_attr "type" "dmpy")]) |
| |
| (define_expand "umulsidi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "r"))))] |
| "TARGET_SH2 || TARGET_SHMEDIA" |
| " |
| { |
| if (TARGET_SH2) |
| { |
| emit_insn (gen_umulsidi3_compact (operands[0], operands[1], |
| operands[2])); |
| DONE; |
| } |
| }") |
| |
| (define_insn "umulsidi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI (zero_extend:DI (match_operand:SI 1 "extend_reg_operand" "%r")) |
| (zero_extend:DI (match_operand:SI 2 "extend_reg_operand" "r"))))] |
| "TARGET_SHMEDIA" |
| "mulu.l %1, %2, %0" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_insn "umulsidi3_compact" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mult:DI |
| (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "r")))) |
| (clobber (reg:SI MACH_REG)) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| "#") |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) |
| (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "")))) |
| (clobber (reg:SI MACH_REG)) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| [(const_int 0)] |
| " |
| { |
| rtx low_dst = gen_lowpart (SImode, operands[0]); |
| rtx high_dst = gen_highpart (SImode, operands[0]); |
| |
| emit_insn (gen_umulsidi3_i (operands[1], operands[2])); |
| |
| emit_move_insn (low_dst, gen_rtx_REG (SImode, MACL_REG)); |
| emit_move_insn (high_dst, gen_rtx_REG (SImode, MACH_REG)); |
| /* We need something to tag the possible REG_EQUAL notes on to. */ |
| emit_move_insn (operands[0], operands[0]); |
| DONE; |
| }") |
| |
| (define_insn "smulsi3_highpart_i" |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (sign_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) |
| (const_int 32)))) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| "dmuls.l %1,%0" |
| [(set_attr "type" "dmpy")]) |
| |
| (define_expand "smulsi3_highpart" |
| [(parallel |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) |
| (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" ""))) |
| (const_int 32)))) |
| (clobber (reg:SI MACL_REG))]) |
| (set (match_operand:SI 0 "arith_reg_operand" "") |
| (reg:SI MACH_REG))] |
| "TARGET_SH2" |
| " |
| { |
| rtx first, last; |
| |
| first = emit_insn (gen_smulsi3_highpart_i (operands[1], operands[2])); |
| last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACH_REG)); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| /* expand_binop can't find a suitable code in mul_highpart_optab to |
| make a REG_EQUAL note from, so make one here. |
| See also {,u}mulhisi. |
| ??? Alternatively, we could put this at the calling site of expand_binop, |
| i.e. expand_mult_highpart. */ |
| REG_NOTES (last) |
| = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), |
| REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_insn "umulsi3_highpart_i" |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (zero_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) |
| (const_int 32)))) |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SH2" |
| "dmulu.l %1,%0" |
| [(set_attr "type" "dmpy")]) |
| |
| (define_expand "umulsi3_highpart" |
| [(parallel |
| [(set (reg:SI MACH_REG) |
| (truncate:SI |
| (lshiftrt:DI |
| (mult:DI |
| (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) |
| (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" ""))) |
| (const_int 32)))) |
| (clobber (reg:SI MACL_REG))]) |
| (set (match_operand:SI 0 "arith_reg_operand" "") |
| (reg:SI MACH_REG))] |
| "TARGET_SH2" |
| " |
| { |
| rtx first, last; |
| |
| first = emit_insn (gen_umulsi3_highpart_i (operands[1], operands[2])); |
| last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACH_REG)); |
| /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop |
| invariant code motion can move it. */ |
| REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); |
| REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); |
| DONE; |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Logical operations |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "*andsi3_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,z") |
| (and:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") |
| (match_operand:SI 2 "logical_operand" "r,K08")))] |
| "TARGET_SH1" |
| "and %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| ;; If the constant is 255, then emit an extu.b instruction instead of an |
| ;; and, since that will give better code. |
| |
| (define_expand "andsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (and:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "logical_operand" "")))] |
| "TARGET_SH1" |
| " |
| { |
| if (GET_CODE (operands[2]) == CONST_INT && INTVAL (operands[2]) == 255) |
| { |
| emit_insn (gen_zero_extendqisi2 (operands[0], |
| gen_lowpart (QImode, operands[1]))); |
| DONE; |
| } |
| }") |
| |
| (define_insn_and_split "anddi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r,r") |
| (and:DI (match_operand:DI 1 "arith_reg_operand" "%r,r,r") |
| (match_operand:DI 2 "and_operand" "r,I10,J16")))] |
| "TARGET_SHMEDIA" |
| "@ |
| and %1, %2, %0 |
| andi %1, %2, %0 |
| #" |
| "reload_completed |
| && ! logical_operand (operands[2], DImode)" |
| [(const_int 0)] |
| " |
| { |
| if (INTVAL (operands[2]) == (unsigned) 0xffffffff) |
| emit_insn (gen_mshflo_l_di (operands[0], operands[1], CONST0_RTX (DImode))); |
| else |
| emit_insn (gen_mshfhi_l_di (operands[0], CONST0_RTX (DImode), operands[1])); |
| DONE; |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "andcdi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (and:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (not:DI (match_operand:DI 2 "arith_reg_operand" "r"))))] |
| "TARGET_SHMEDIA" |
| "andc %1,%2,%0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "iorsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,z") |
| (ior:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") |
| (match_operand:SI 2 "logical_operand" "r,K08")))] |
| "TARGET_SH1" |
| "or %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "iordi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (ior:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") |
| (match_operand:DI 2 "logical_operand" "r,I10")))] |
| "TARGET_SHMEDIA" |
| "@ |
| or %1, %2, %0 |
| ori %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "xorsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=z,r") |
| (xor:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") |
| (match_operand:SI 2 "logical_operand" "K08,r")))] |
| "TARGET_SH1" |
| "xor %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "xordi3" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (xor:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") |
| (match_operand:DI 2 "shmedia_6bit_operand" "r,I06")))] |
| "TARGET_SHMEDIA" |
| "@ |
| xor %1, %2, %0 |
| xori %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| ;; Combiner bridge pattern for 2 * sign extend -> logical op -> truncate. |
| ;; converts 2 * sign extend -> logical op into logical op -> sign extend |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (sign_extend:DI (match_operator 4 "binary_logical_operator" |
| [(match_operand 1 "any_register_operand" "") |
| (match_operand 2 "any_register_operand" "")])))] |
| "TARGET_SHMEDIA" |
| [(set (match_dup 5) (match_dup 4)) |
| (set (match_dup 0) (sign_extend:DI (match_dup 5)))] |
| " |
| { |
| enum machine_mode inmode = GET_MODE (operands[1]); |
| int offset = 0; |
| |
| if (GET_CODE (operands[0]) == SUBREG) |
| { |
| offset = SUBREG_BYTE (operands[0]); |
| operands[0] = SUBREG_REG (operands[0]); |
| } |
| if (GET_CODE (operands[0]) != REG) |
| abort (); |
| if (! TARGET_LITTLE_ENDIAN) |
| offset += 8 - GET_MODE_SIZE (inmode); |
| operands[5] = gen_rtx_SUBREG (inmode, operands[0], offset); |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Shifts and rotates |
| ;; ------------------------------------------------------------------------- |
| |
| (define_expand "rotldi3" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (rotate:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (match_operand:HI 2 "mextr_bit_offset" "i")))] |
| "TARGET_SHMEDIA" |
| "if (! mextr_bit_offset (operands[2], HImode)) FAIL;") |
| |
| (define_insn "rotldi3_mextr" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (rotate:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (match_operand:HI 2 "mextr_bit_offset" "i")))] |
| "TARGET_SHMEDIA" |
| "* |
| { |
| static char templ[16]; |
| |
| sprintf (templ, \"mextr%d\\t%%1,%%1,%%0\", |
| 8 - (int) (INTVAL (operands[2]) >> 3)); |
| return templ; |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "rotrdi3" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (rotatert:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (match_operand:HI 2 "mextr_bit_offset" "i")))] |
| "TARGET_SHMEDIA" |
| "if (! mextr_bit_offset (operands[2], HImode)) FAIL;") |
| |
| (define_insn "rotrdi3_mextr" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (rotatert:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (match_operand:HI 2 "mextr_bit_offset" "i")))] |
| "TARGET_SHMEDIA" |
| "* |
| { |
| static char templ[16]; |
| |
| sprintf (templ, \"mextr%d\\t%%1,%%1,%%0\", (int) INTVAL (operands[2]) >> 3); |
| return templ; |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "rotlsi3_1" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (rotate:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (const_int 1))) |
| (set (reg:SI T_REG) |
| (lshiftrt:SI (match_dup 1) (const_int 31)))] |
| "TARGET_SH1" |
| "rotl %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "rotlsi3_31" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (rotate:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (const_int 31))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "rotr %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "rotlsi3_16" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (rotate:SI (match_operand:SI 1 "arith_reg_operand" "r") |
| (const_int 16)))] |
| "TARGET_SH1" |
| "swap.w %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_expand "rotlsi3" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (rotate:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "immediate_operand" "")))] |
| "TARGET_SH1" |
| " |
| { |
| static const char rot_tab[] = { |
| 000, 000, 000, 000, 000, 000, 010, 001, |
| 001, 001, 011, 013, 003, 003, 003, 003, |
| 003, 003, 003, 003, 003, 013, 012, 002, |
| 002, 002, 010, 000, 000, 000, 000, 000, |
| }; |
| |
| int count, choice; |
| |
| if (GET_CODE (operands[2]) != CONST_INT) |
| FAIL; |
| count = INTVAL (operands[2]); |
| choice = rot_tab[count]; |
| if (choice & 010 && SH_DYNAMIC_SHIFT_COST <= 1) |
| FAIL; |
| choice &= 7; |
| switch (choice) |
| { |
| case 0: |
| emit_move_insn (operands[0], operands[1]); |
| count -= (count & 16) * 2; |
| break; |
| case 3: |
| emit_insn (gen_rotlsi3_16 (operands[0], operands[1])); |
| count -= 16; |
| break; |
| case 1: |
| case 2: |
| { |
| rtx parts[2]; |
| parts[0] = gen_reg_rtx (SImode); |
| parts[1] = gen_reg_rtx (SImode); |
| emit_insn (gen_rotlsi3_16 (parts[2-choice], operands[1])); |
| emit_move_insn (parts[choice-1], operands[1]); |
| emit_insn (gen_ashlsi3 (parts[0], parts[0], GEN_INT (8))); |
| emit_insn (gen_lshrsi3 (parts[1], parts[1], GEN_INT (8))); |
| emit_insn (gen_iorsi3 (operands[0], parts[0], parts[1])); |
| count = (count & ~16) - 8; |
| } |
| } |
| |
| for (; count > 0; count--) |
| emit_insn (gen_rotlsi3_1 (operands[0], operands[0])); |
| for (; count < 0; count++) |
| emit_insn (gen_rotlsi3_31 (operands[0], operands[0])); |
| |
| DONE; |
| }") |
| |
| (define_insn "*rotlhi3_8" |
| [(set (match_operand:HI 0 "arith_reg_operand" "=r") |
| (rotate:HI (match_operand:HI 1 "arith_reg_operand" "r") |
| (const_int 8)))] |
| "TARGET_SH1" |
| "swap.b %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_expand "rotlhi3" |
| [(set (match_operand:HI 0 "arith_reg_operand" "") |
| (rotate:HI (match_operand:HI 1 "arith_reg_operand" "") |
| (match_operand:HI 2 "immediate_operand" "")))] |
| "TARGET_SH1" |
| " |
| { |
| if (GET_CODE (operands[2]) != CONST_INT || INTVAL (operands[2]) != 8) |
| FAIL; |
| }") |
| |
| ;; |
| ;; shift left |
| |
| ;; This pattern is used by init_expmed for computing the costs of shift |
| ;; insns. |
| |
| (define_insn_and_split "ashlsi3_std" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r,r,r") |
| (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0,0,0,0") |
| (match_operand:SI 2 "nonmemory_operand" "r,M,P27,?ri"))) |
| (clobber (match_scratch:SI 3 "=X,X,X,&r"))] |
| "TARGET_SH3 |
| || (TARGET_SH1 && GET_CODE (operands[2]) == CONST_INT |
| && CONST_OK_FOR_P27 (INTVAL (operands[2])))" |
| "@ |
| shld %2,%0 |
| add %0,%0 |
| shll%O2 %0 |
| #" |
| "TARGET_SH3 |
| && reload_completed |
| && GET_CODE (operands[2]) == CONST_INT |
| && ! CONST_OK_FOR_P27 (INTVAL (operands[2]))" |
| [(set (match_dup 3) (match_dup 2)) |
| (parallel |
| [(set (match_dup 0) (ashift:SI (match_dup 1) (match_dup 3))) |
| (clobber (match_dup 4))])] |
| "operands[4] = gen_rtx_SCRATCH (SImode);" |
| [(set_attr "length" "*,*,*,4") |
| (set_attr "type" "dyn_shift,arith,arith,arith")]) |
| |
| (define_insn "ashlhi3_k" |
| [(set (match_operand:HI 0 "arith_reg_operand" "=r,r") |
| (ashift:HI (match_operand:HI 1 "arith_reg_operand" "0,0") |
| (match_operand:HI 2 "const_int_operand" "M,P27")))] |
| "TARGET_SH1 && CONST_OK_FOR_P27 (INTVAL (operands[2]))" |
| "@ |
| add %0,%0 |
| shll%O2 %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "ashlsi3_n" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && ! sh_dynamicalize_shift_p (operands[2])" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) |
| (const_string "2") |
| (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 3)) |
| (const_string "6")] |
| (const_string "8"))) |
| (set_attr "type" "arith")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (ashift:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "const_int_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| gen_shifty_op (ASHIFT, operands); |
| DONE; |
| }") |
| |
| (define_insn "ashlsi3_media" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (ashift:SI (match_operand:SI 1 "extend_reg_operand" "r,r") |
| (match_operand:SI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shlld.l %1, %2, %0 |
| shlli.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "ashlsi3" |
| [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (ashift:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "nonmemory_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_ashlsi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (GET_CODE (operands[2]) == CONST_INT |
| && sh_dynamicalize_shift_p (operands[2])) |
| operands[2] = force_reg (SImode, operands[2]); |
| if (TARGET_SH3) |
| { |
| emit_insn (gen_ashlsi3_std (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (! immediate_operand (operands[2], GET_MODE (operands[2]))) |
| FAIL; |
| }") |
| |
| (define_insn "ashlhi3" |
| [(set (match_operand:HI 0 "arith_reg_operand" "=r") |
| (ashift:HI (match_operand:HI 1 "arith_reg_operand" "0") |
| (match_operand:HI 2 "const_int_operand" "n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) |
| (const_string "2") |
| (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) |
| (const_string "4")] |
| (const_string "6"))) |
| (set_attr "type" "arith")]) |
| |
| (define_split |
| [(set (match_operand:HI 0 "arith_reg_operand" "") |
| (ashift:HI (match_operand:HI 1 "arith_reg_operand" "") |
| (match_operand:HI 2 "const_int_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| gen_shifty_hi_op (ASHIFT, operands); |
| DONE; |
| }") |
| |
| ; |
| ; arithmetic shift right |
| ; |
| |
| (define_insn "ashrsi3_k" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "M"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && INTVAL (operands[2]) == 1" |
| "shar %0" |
| [(set_attr "type" "arith")]) |
| |
| ;; We can't do HImode right shifts correctly unless we start out with an |
| ;; explicit zero / sign extension; doing that would result in worse overall |
| ;; code, so just let the machine independent code widen the mode. |
| ;; That's why we don't have ashrhi3_k / lshrhi3_k / lshrhi3_m / lshrhi3 . |
| |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "ashrsi2_16" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "r") |
| (const_int 16)))] |
| "TARGET_SH1" |
| "#" |
| [(set_attr "length" "4")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (const_int 16)))] |
| "TARGET_SH1" |
| [(set (match_dup 0) (rotate:SI (match_dup 1) (const_int 16))) |
| (set (match_dup 0) (sign_extend:SI (match_dup 2)))] |
| "operands[2] = gen_lowpart (HImode, operands[0]);") |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "ashrsi2_31" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (const_int 31))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "#" |
| [(set_attr "length" "4")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (const_int 31))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| [(const_int 0)] |
| " |
| { |
| emit_insn (gen_ashlsi_c (operands[0], operands[1])); |
| emit_insn (gen_subc1 (operands[0], operands[0], operands[0])); |
| DONE; |
| }") |
| |
| (define_insn "ashlsi_c" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 1))) |
| (set (reg:SI T_REG) |
| (lt:SI (match_dup 1) (const_int 0)))] |
| "TARGET_SH1" |
| "shll %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "ashrsi3_d" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (neg:SI (match_operand:SI 2 "arith_reg_operand" "r"))))] |
| "TARGET_SH3" |
| "shad %2,%0" |
| [(set_attr "type" "dyn_shift")]) |
| |
| (define_insn "ashrsi3_n" |
| [(set (reg:SI R4_REG) |
| (ashiftrt:SI (reg:SI R4_REG) |
| (match_operand:SI 0 "const_int_operand" "i"))) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI PR_REG)) |
| (use (match_operand:SI 1 "arith_reg_operand" "r"))] |
| "TARGET_SH1" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "ashrsi3_media" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (ashiftrt:SI (match_operand:SI 1 "extend_reg_operand" "r,r") |
| (match_operand:SI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shard.l %1, %2, %0 |
| shari.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "ashrsi3" |
| [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "nonmemory_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_ashrsi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (expand_ashiftrt (operands)) |
| DONE; |
| else |
| FAIL; |
| }") |
| |
| ;; logical shift right |
| |
| (define_insn "lshrsi3_d" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (neg:SI (match_operand:SI 2 "arith_reg_operand" "r"))))] |
| "TARGET_SH3" |
| "shld %2,%0" |
| [(set_attr "type" "dyn_shift")]) |
| |
| ;; Only the single bit shift clobbers the T bit. |
| |
| (define_insn "lshrsi3_m" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "M"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && CONST_OK_FOR_M (INTVAL (operands[2]))" |
| "shlr %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "lshrsi3_k" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "P27")))] |
| "TARGET_SH1 && CONST_OK_FOR_P27 (INTVAL (operands[2])) |
| && ! CONST_OK_FOR_M (INTVAL (operands[2]))" |
| "shlr%O2 %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "lshrsi3_n" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && ! sh_dynamicalize_shift_p (operands[2])" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) |
| (const_string "2") |
| (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 3)) |
| (const_string "6")] |
| (const_string "8"))) |
| (set_attr "type" "arith")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "const_int_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| gen_shifty_op (LSHIFTRT, operands); |
| DONE; |
| }") |
| |
| (define_insn "lshrsi3_media" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (lshiftrt:SI (match_operand:SI 1 "extend_reg_operand" "r,r") |
| (match_operand:SI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shlrd.l %1, %2, %0 |
| shlri.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "lshrsi3" |
| [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "nonmemory_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_lshrsi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (GET_CODE (operands[2]) == CONST_INT |
| && sh_dynamicalize_shift_p (operands[2])) |
| operands[2] = force_reg (SImode, operands[2]); |
| if (TARGET_SH3 && arith_reg_operand (operands[2], GET_MODE (operands[2]))) |
| { |
| rtx count = copy_to_mode_reg (SImode, operands[2]); |
| emit_insn (gen_negsi2 (count, count)); |
| emit_insn (gen_lshrsi3_d (operands[0], operands[1], count)); |
| DONE; |
| } |
| if (! immediate_operand (operands[2], GET_MODE (operands[2]))) |
| FAIL; |
| }") |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "ashldi3_k" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (const_int 1))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "shll %R0\;rotcl %S0" |
| [(set_attr "length" "4") |
| (set_attr "type" "arith")]) |
| |
| (define_insn "ashldi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (ashift:DI (match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shlld %1, %2, %0 |
| shlli %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "ashldi3" |
| [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (ashift:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "immediate_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_ashldi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (GET_CODE (operands[2]) != CONST_INT |
| || INTVAL (operands[2]) != 1) |
| FAIL; |
| }") |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "lshrdi3_k" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (const_int 1))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "shlr %S0\;rotcr %R0" |
| [(set_attr "length" "4") |
| (set_attr "type" "arith")]) |
| |
| (define_insn "lshrdi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shlrd %1, %2, %0 |
| shlri %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "lshrdi3" |
| [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "immediate_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_lshrdi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (GET_CODE (operands[2]) != CONST_INT |
| || INTVAL (operands[2]) != 1) |
| FAIL; |
| }") |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "ashrdi3_k" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (const_int 1))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "shar %S0\;rotcr %R0" |
| [(set_attr "length" "4") |
| (set_attr "type" "arith")]) |
| |
| (define_insn "ashrdi3_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "nonmemory_operand" "r,n")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shard %1, %2, %0 |
| shari %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "ashrdi3" |
| [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (match_operand:DI 2 "immediate_operand" ""))) |
| (clobber (reg:SI T_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_ashrdi3_media (operands[0], operands[1], operands[2])); |
| DONE; |
| } |
| if (GET_CODE (operands[2]) != CONST_INT |
| || INTVAL (operands[2]) != 1) |
| FAIL; |
| }") |
| |
| ;; combined left/right shift |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "") |
| (match_operand:SI 2 "const_int_operand" "")) |
| (match_operand:SI 3 "const_int_operand" "")))] |
| "TARGET_SH1 && reload_completed && (unsigned)INTVAL (operands[2]) < 32" |
| [(use (reg:SI R0_REG))] |
| "if (gen_shl_and (operands[0], operands[2], operands[3], operands[1])) FAIL; |
| DONE;") |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "") |
| (match_operand:SI 2 "const_int_operand" "")) |
| (match_operand:SI 3 "const_int_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && reload_completed && (unsigned)INTVAL (operands[2]) < 32" |
| [(use (reg:SI R0_REG))] |
| "if (gen_shl_and (operands[0], operands[2], operands[3], operands[1])) FAIL; |
| DONE;") |
| |
| (define_insn "" |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n")) |
| (match_operand:SI 3 "const_int_operand" "n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && shl_and_kind (operands[2], operands[3], 0) == 1" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shl_and_length (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 3)) |
| (const_string "6") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 4)) |
| (const_string "8") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 5)) |
| (const_string "10") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 6)) |
| (const_string "12") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 7)) |
| (const_string "14") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 8)) |
| (const_string "16")] |
| (const_string "18"))) |
| (set_attr "type" "arith")]) |
| |
| (define_insn "" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n")) |
| (match_operand:SI 3 "const_int_operand" "n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && shl_and_kind (operands[2], operands[3], 0) == 2" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shl_and_length (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 3)) |
| (const_string "6") |
| (eq (symbol_ref "shl_and_length (insn)") (const_int 4)) |
| (const_string "8")] |
| (const_string "10"))) |
| (set_attr "type" "arith")]) |
| |
| ;; shift left / and combination with a scratch register: The combine pass |
| ;; does not accept the individual instructions, even though they are |
| ;; cheap. But it needs a precise description so that it is usable after |
| ;; reload. |
| (define_insn "and_shl_scratch" |
| [(set (match_operand:SI 0 "register_operand" "=r,&r") |
| (lshiftrt:SI |
| (ashift:SI |
| (and:SI |
| (lshiftrt:SI (match_operand:SI 1 "register_operand" "r,0") |
| (match_operand:SI 2 "const_int_operand" "N,n")) |
| (match_operand:SI 3 "" "0,r")) |
| (match_operand:SI 4 "const_int_operand" "n,n")) |
| (match_operand:SI 5 "const_int_operand" "n,n"))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shl_and_scr_length (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 3)) |
| (const_string "6") |
| (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 4)) |
| (const_string "8") |
| (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 5)) |
| (const_string "10")] |
| (const_string "12"))) |
| (set_attr "type" "arith")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (lshiftrt:SI |
| (ashift:SI |
| (and:SI |
| (lshiftrt:SI (match_operand:SI 1 "register_operand" "") |
| (match_operand:SI 2 "const_int_operand" "")) |
| (match_operand:SI 3 "register_operand" "")) |
| (match_operand:SI 4 "const_int_operand" "")) |
| (match_operand:SI 5 "const_int_operand" ""))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| rtx and_source = operands[rtx_equal_p (operands[0], operands[1]) ? 3 : 1]; |
| |
| if (INTVAL (operands[2])) |
| { |
| gen_shifty_op (LSHIFTRT, operands); |
| } |
| emit_insn (gen_andsi3 (operands[0], operands[0], and_source)); |
| operands[2] = operands[4]; |
| gen_shifty_op (ASHIFT, operands); |
| if (INTVAL (operands[5])) |
| { |
| operands[2] = operands[5]; |
| gen_shifty_op (LSHIFTRT, operands); |
| } |
| DONE; |
| }") |
| |
| ;; signed left/right shift combination. |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (sign_extract:SI |
| (ashift:SI (match_operand:SI 1 "register_operand" "") |
| (match_operand:SI 2 "const_int_operand" "")) |
| (match_operand:SI 3 "const_int_operand" "") |
| (const_int 0))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1" |
| [(use (reg:SI R0_REG))] |
| "if (gen_shl_sext (operands[0], operands[2], operands[3], operands[1])) FAIL; |
| DONE;") |
| |
| (define_insn "shl_sext_ext" |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (sign_extract:SI |
| (ashift:SI (match_operand:SI 1 "register_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n")) |
| (match_operand:SI 3 "const_int_operand" "n") |
| (const_int 0))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && (unsigned)shl_sext_kind (operands[2], operands[3], 0) - 1 < 5" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shl_sext_length (insn)") (const_int 1)) |
| (const_string "2") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 2)) |
| (const_string "4") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 3)) |
| (const_string "6") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 4)) |
| (const_string "8") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 5)) |
| (const_string "10") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 6)) |
| (const_string "12") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 7)) |
| (const_string "14") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 8)) |
| (const_string "16")] |
| (const_string "18"))) |
| (set_attr "type" "arith")]) |
| |
| (define_insn "shl_sext_sub" |
| [(set (match_operand:SI 0 "register_operand" "=z") |
| (sign_extract:SI |
| (ashift:SI (match_operand:SI 1 "register_operand" "0") |
| (match_operand:SI 2 "const_int_operand" "n")) |
| (match_operand:SI 3 "const_int_operand" "n") |
| (const_int 0))) |
| (clobber (reg:SI T_REG))] |
| "TARGET_SH1 && (shl_sext_kind (operands[2], operands[3], 0) & ~1) == 6" |
| "#" |
| [(set (attr "length") |
| (cond [(eq (symbol_ref "shl_sext_length (insn)") (const_int 3)) |
| (const_string "6") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 4)) |
| (const_string "8") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 5)) |
| (const_string "10") |
| (eq (symbol_ref "shl_sext_length (insn)") (const_int 6)) |
| (const_string "12")] |
| (const_string "14"))) |
| (set_attr "type" "arith")]) |
| |
| ;; These patterns are found in expansions of DImode shifts by 16, and |
| ;; allow the xtrct instruction to be generated from C source. |
| |
| (define_insn "xtrct_left" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ior:SI (ashift:SI (match_operand:SI 1 "arith_reg_operand" "r") |
| (const_int 16)) |
| (lshiftrt:SI (match_operand:SI 2 "arith_reg_operand" "0") |
| (const_int 16))))] |
| "TARGET_SH1" |
| "xtrct %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "xtrct_right" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (ior:SI (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") |
| (const_int 16)) |
| (ashift:SI (match_operand:SI 2 "arith_reg_operand" "r") |
| (const_int 16))))] |
| "TARGET_SH1" |
| "xtrct %2,%0" |
| [(set_attr "type" "arith")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Unary arithmetic |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "negc" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (neg:SI (plus:SI (reg:SI T_REG) |
| (match_operand:SI 1 "arith_reg_operand" "r")))) |
| (set (reg:SI T_REG) |
| (ne:SI (ior:SI (reg:SI T_REG) (match_dup 1)) |
| (const_int 0)))] |
| "TARGET_SH1" |
| "negc %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "*negdi_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (neg:DI (match_operand:DI 1 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "sub r63, %1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "negdi2" |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (neg:DI (match_operand:DI 1 "arith_reg_operand" "")))] |
| "" |
| " |
| { |
| if (TARGET_SH1) |
| { |
| int low_word = (TARGET_LITTLE_ENDIAN ? 0 : 1); |
| int high_word = (TARGET_LITTLE_ENDIAN ? 1 : 0); |
| |
| rtx low_src = operand_subword (operands[1], low_word, 0, DImode); |
| rtx high_src = operand_subword (operands[1], high_word, 0, DImode); |
| |
| rtx low_dst = operand_subword (operands[0], low_word, 1, DImode); |
| rtx high_dst = operand_subword (operands[0], high_word, 1, DImode); |
| |
| emit_insn (gen_clrt ()); |
| emit_insn (gen_negc (low_dst, low_src)); |
| emit_insn (gen_negc (high_dst, high_src)); |
| DONE; |
| } |
| }") |
| |
| (define_insn "negsi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (neg:SI (match_operand:SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "neg %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "one_cmplsi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (not:SI (match_operand:SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "not %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_expand "one_cmpldi2" |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (xor:DI (match_operand:DI 1 "arith_reg_operand" "") |
| (const_int -1)))] |
| "TARGET_SHMEDIA" "") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Zero extension instructions |
| ;; ------------------------------------------------------------------------- |
| |
| (define_insn "zero_extendsidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (zero_extend:DI (match_operand:SI 1 "extend_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "addz.l %1, r63, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "zero_extendhidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r,r") |
| (zero_extend:DI (match_operand:HI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.uw %m1, %0" |
| [(set_attr "type" "*,load_media")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "register_operand" "") |
| (zero_extend:DI (match_operand:HI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 48))) |
| (set (match_dup 0) (lshiftrt:DI (match_dup 0) (const_int 48)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| ;; ??? when a truncated input to a zero_extend is reloaded, reload will |
| ;; reload the entire truncate expression. |
| (define_insn_and_split "*loaddi_trunc" |
| [(set (match_operand 0 "int_gpr_dest" "=r") |
| (truncate (match_operand:DI 1 "memory_operand" "m")))] |
| "TARGET_SHMEDIA && reload_completed" |
| "#" |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (match_dup 1))] |
| "operands[0] = gen_rtx_REG (DImode, true_regnum (operands[0]));") |
| |
| (define_insn "zero_extendqidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r,r") |
| (zero_extend:DI (match_operand:QI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| andi %1, 255, %0 |
| ld%M1.ub %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_expand "zero_extendhisi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (zero_extend:SI (match_operand:HI 1 "general_extend_operand" "")))] |
| "" |
| " |
| { |
| if (! TARGET_SHMEDIA && ! arith_reg_operand (operands[1], HImode)) |
| operands[1] = copy_to_mode_reg (HImode, operands[1]); |
| }") |
| |
| (define_insn "*zero_extendhisi2_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (zero_extend:SI (match_operand:HI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "extu.w %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "*zero_extendhisi2_media" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (zero_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.uw %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (zero_extend:SI (match_operand:HI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 16))) |
| (set (match_dup 0) (lshiftrt:SI (match_dup 0) (const_int 16)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| (define_expand "zero_extendqisi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (zero_extend:SI (match_operand:QI 1 "general_extend_operand" "")))] |
| "" |
| " |
| { |
| if (! TARGET_SHMEDIA && ! arith_reg_operand (operands[1], QImode)) |
| operands[1] = copy_to_mode_reg (QImode, operands[1]); |
| }") |
| |
| (define_insn "*zero_extendqisi2_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (zero_extend:SI (match_operand:QI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "extu.b %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "*zero_extendqisi2_media" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (zero_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| andi %1, 255, %0 |
| ld%M1.ub %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_insn "zero_extendqihi2" |
| [(set (match_operand:HI 0 "arith_reg_operand" "=r") |
| (zero_extend:HI (match_operand:QI 1 "arith_reg_operand" "r")))] |
| "TARGET_SH1" |
| "extu.b %1,%0" |
| [(set_attr "type" "arith")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Sign extension instructions |
| ;; ------------------------------------------------------------------------- |
| |
| ;; ??? This should be a define expand. |
| ;; ??? Or perhaps it should be dropped? |
| |
| ;; convert_move generates good code for SH[1-4]. |
| (define_insn "extendsidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r,r") |
| (sign_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| add.l %1, r63, %0 |
| ld%M1.l %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_insn "extendhidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r,r") |
| (sign_extend:DI (match_operand:HI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.w %m1, %0" |
| [(set_attr "type" "*,load_media")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "register_operand" "") |
| (sign_extend:DI (match_operand:HI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 48))) |
| (set (match_dup 0) (ashiftrt:DI (match_dup 0) (const_int 48)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| (define_insn "extendqidi2" |
| [(set (match_operand:DI 0 "register_operand" "=r,r") |
| (sign_extend:DI (match_operand:QI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.b %m1, %0" |
| [(set_attr "type" "*,load_media")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "register_operand" "") |
| (sign_extend:DI (match_operand:QI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 56))) |
| (set (match_dup 0) (ashiftrt:DI (match_dup 0) (const_int 56)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| (define_expand "extendhisi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (sign_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] |
| "" |
| "") |
| |
| (define_insn "*extendhisi2_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (sign_extend:SI (match_operand:HI 1 "general_movsrc_operand" "r,m")))] |
| "TARGET_SH1" |
| "@ |
| exts.w %1,%0 |
| mov.w %1,%0" |
| [(set_attr "type" "arith,load")]) |
| |
| (define_insn "*extendhisi2_media" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (sign_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.w %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (sign_extend:SI (match_operand:HI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 16))) |
| (set (match_dup 0) (ashiftrt:SI (match_dup 0) (const_int 16)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| (define_expand "extendqisi2" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (sign_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] |
| "" |
| "") |
| |
| (define_insn "*extendqisi2_compact" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") |
| (sign_extend:SI (match_operand:QI 1 "general_movsrc_operand" "r,m")))] |
| "TARGET_SH1" |
| "@ |
| exts.b %1,%0 |
| mov.b %1,%0" |
| [(set_attr "type" "arith,load")]) |
| |
| (define_insn "*extendqisi2_media" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (sign_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] |
| "TARGET_SHMEDIA" |
| "@ |
| # |
| ld%M1.b %m1, %0" |
| [(set_attr "type" "arith_media,load_media")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (sign_extend:SI (match_operand:QI 1 "extend_reg_operand" "")))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 24))) |
| (set (match_dup 0) (ashiftrt:SI (match_dup 0) (const_int 24)))] |
| " |
| { |
| if (GET_CODE (operands[1]) == TRUNCATE) |
| operands[1] = XEXP (operands[1], 0); |
| }") |
| |
| (define_insn "extendqihi2" |
| [(set (match_operand:HI 0 "arith_reg_operand" "=r,r") |
| (sign_extend:HI (match_operand:QI 1 "general_movsrc_operand" "r,m")))] |
| "TARGET_SH1" |
| "@ |
| exts.b %1,%0 |
| mov.b %1,%0" |
| [(set_attr "type" "arith,load")]) |
| |
| /* It would seem useful to combine the truncXi patterns into the movXi |
| patterns, but unary operators are ignored when matching constraints, |
| so we need separate patterns. */ |
| (define_insn "truncdisi2" |
| [(set (match_operand:SI 0 "general_movdst_operand" "=r,m,m,f,r,f") |
| (truncate:SI (match_operand:DI 1 "register_operand" "r,r,f,r,f,f")))] |
| "TARGET_SHMEDIA" |
| "@ |
| add.l %1, r63, %0 |
| st%M0.l %m0, %1 |
| fst%M0.s %m0, %T1 |
| fmov.ls %1, %0 |
| fmov.sl %T1, %0 |
| fmov.s %T1, %0" |
| [(set_attr "type" "arith_media,store_media,fstore_media,fload_media,fpconv_media,fmove_media")]) |
| |
| |
| (define_insn "truncdihi2" |
| [(set (match_operand:HI 0 "general_movdst_operand" "=?r,m") |
| (truncate:HI (match_operand:DI 1 "register_operand" "r,r")))] |
| "TARGET_SHMEDIA" |
| "@ |
| shlli\\t%1,48,%0\;shlri\\t%0,48,%0 |
| st%M0.w %m0, %1" |
| [(set_attr "type" "arith_media,store_media") |
| (set_attr "length" "8,4")]) |
| |
| ; N.B. This should agree with LOAD_EXTEND_OP and movqi. |
| ; Because we use zero extension, we can't provide signed QImode compares |
| ; using a simple compare or conditional banch insn. |
| (define_insn "truncdiqi2" |
| [(set (match_operand:QI 0 "general_movdst_operand" "=r,m") |
| (truncate:QI (match_operand:DI 1 "register_operand" "r,r")))] |
| "TARGET_SHMEDIA" |
| "@ |
| andi %1, 255, %0 |
| st%M0.b %m0, %1" |
| [(set_attr "type" "arith_media,store")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Move instructions |
| ;; ------------------------------------------------------------------------- |
| |
| ;; define push and pop so it is easy for sh.c |
| ;; We can't use push and pop on SHcompact because the stack must always |
| ;; be 8-byte aligned. |
| |
| (define_expand "push" |
| [(set (mem:SI (pre_dec:SI (reg:SI SP_REG))) |
| (match_operand:SI 0 "register_operand" "r,l,x"))] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_expand "pop" |
| [(set (match_operand:SI 0 "register_operand" "=r,l,x") |
| (mem:SI (post_inc:SI (reg:SI SP_REG))))] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_expand "push_e" |
| [(parallel [(set (mem:SF (pre_dec:SI (reg:SI SP_REG))) |
| (match_operand:SF 0 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (scratch:SI))])] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_insn "push_fpul" |
| [(set (mem:SF (pre_dec:SI (reg:SI SP_REG))) (reg:SF FPUL_REG))] |
| "TARGET_SH2E && ! TARGET_SH5" |
| "sts.l fpul,@-r15" |
| [(set_attr "type" "store") |
| (set_attr "late_fp_use" "yes") |
| (set_attr "hit_stack" "yes")]) |
| |
| ;; DFmode pushes for sh4 require a lot of what is defined for movdf_i4, |
| ;; so use that. |
| (define_expand "push_4" |
| [(parallel [(set (mem:DF (pre_dec:SI (reg:SI SP_REG))) |
| (match_operand:DF 0 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (scratch:SI))])] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_expand "pop_e" |
| [(parallel [(set (match_operand:SF 0 "" "") |
| (mem:SF (post_inc:SI (reg:SI SP_REG)))) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (scratch:SI))])] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_insn "pop_fpul" |
| [(set (reg:SF FPUL_REG) (mem:SF (post_inc:SI (reg:SI SP_REG))))] |
| "TARGET_SH2E && ! TARGET_SH5" |
| "lds.l @r15+,fpul" |
| [(set_attr "type" "load") |
| (set_attr "hit_stack" "yes")]) |
| |
| (define_expand "pop_4" |
| [(parallel [(set (match_operand:DF 0 "" "") |
| (mem:DF (post_inc:SI (reg:SI SP_REG)))) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (scratch:SI))])] |
| "TARGET_SH1 && ! TARGET_SH5" |
| "") |
| |
| (define_expand "push_fpscr" |
| [(const_int 0)] |
| "TARGET_SH2E" |
| " |
| { |
| rtx insn = emit_insn (gen_fpu_switch (gen_rtx (MEM, PSImode, |
| gen_rtx (PRE_DEC, Pmode, |
| stack_pointer_rtx)), |
| get_fpscr_rtx ())); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); |
| DONE; |
| }") |
| |
| (define_expand "pop_fpscr" |
| [(const_int 0)] |
| "TARGET_SH2E" |
| " |
| { |
| rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), |
| gen_rtx (MEM, PSImode, |
| gen_rtx (POST_INC, Pmode, |
| stack_pointer_rtx)))); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); |
| DONE; |
| }") |
| |
| ;; These two patterns can happen as the result of optimization, when |
| ;; comparisons get simplified to a move of zero or 1 into the T reg. |
| ;; They don't disappear completely, because the T reg is a fixed hard reg. |
| |
| (define_insn "clrt" |
| [(set (reg:SI T_REG) (const_int 0))] |
| "TARGET_SH1" |
| "clrt") |
| |
| (define_insn "sett" |
| [(set (reg:SI T_REG) (const_int 1))] |
| "TARGET_SH1" |
| "sett") |
| |
| ;; t/r must come after r/r, lest reload will try to reload stuff like |
| ;; (set (subreg:SI (mem:QI (plus:SI (reg:SI SP_REG) (const_int 12)) 0) 0) |
| ;; (made from (set (subreg:SI (reg:QI ###) 0) ) into T. |
| (define_insn "movsi_i" |
| [(set (match_operand:SI 0 "general_movdst_operand" |
| "=r,r,t,r,r,r,r,m,<,<,x,l,x,l,r") |
| (match_operand:SI 1 "general_movsrc_operand" |
| "Q,rI08,r,mr,x,l,t,r,x,l,r,r,>,>,i"))] |
| "TARGET_SH1 |
| && ! TARGET_SH2E |
| && (register_operand (operands[0], SImode) |
| || register_operand (operands[1], SImode))" |
| "@ |
| mov.l %1,%0 |
| mov %1,%0 |
| cmp/pl %1 |
| mov.l %1,%0 |
| sts %1,%0 |
| sts %1,%0 |
| movt %0 |
| mov.l %1,%0 |
| sts.l %1,%0 |
| sts.l %1,%0 |
| lds %1,%0 |
| lds %1,%0 |
| lds.l %1,%0 |
| lds.l %1,%0 |
| fake %1,%0" |
| [(set_attr "type" "pcload_si,move,mt_group,load_si,mac_gp,prget,move,store,store,pstore,move,prset,load,pload,pcload_si") |
| (set_attr "length" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*")]) |
| |
| ;; t/r must come after r/r, lest reload will try to reload stuff like |
| ;; (subreg:SI (reg:SF FR14_REG) 0) into T (compiling stdlib/strtod.c -m3e -O2) |
| ;; ??? This allows moves from macl to fpul to be recognized, but these moves |
| ;; will require a reload. |
| ;; ??? We can't include f/f because we need the proper FPSCR setting when |
| ;; TARGET_FMOVD is in effect, and mode switching is done before reload. |
| (define_insn "movsi_ie" |
| [(set (match_operand:SI 0 "general_movdst_operand" |
| "=r,r,t,r,r,r,r,m,<,<,x,l,x,l,y,<,r,y,r,*f,y,*f,y") |
| (match_operand:SI 1 "general_movsrc_operand" |
| "Q,rI08,r,mr,x,l,t,r,x,l,r,r,>,>,>,y,i,r,y,y,*f,*f,y"))] |
| "TARGET_SH2E |
| && (register_operand (operands[0], SImode) |
| || register_operand (operands[1], SImode))" |
| "@ |
| mov.l %1,%0 |
| mov %1,%0 |
| cmp/pl %1 |
| mov.l %1,%0 |
| sts %1,%0 |
| sts %1,%0 |
| movt %0 |
| mov.l %1,%0 |
| sts.l %1,%0 |
| sts.l %1,%0 |
| lds %1,%0 |
| lds %1,%0 |
| lds.l %1,%0 |
| lds.l %1,%0 |
| lds.l %1,%0 |
| sts.l %1,%0 |
| fake %1,%0 |
| lds %1,%0 |
| sts %1,%0 |
| fsts fpul,%0 |
| flds %1,fpul |
| fmov %1,%0 |
| ! move optimized away" |
| [(set_attr "type" "pcload_si,move,*,load_si,mac_gp,prget,move,store,store,pstore,move,prset,load,pload,load,store,pcload_si,gp_fpul,fpul_gp,fmove,fmove,fmove,nil") |
| (set_attr "late_fp_use" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,yes,*,*,yes,*,*,*,*") |
| (set_attr "length" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,0")]) |
| |
| (define_insn "movsi_i_lowpart" |
| [(set (strict_low_part (match_operand:SI 0 "general_movdst_operand" "+r,r,r,r,r,r,m,r")) |
| (match_operand:SI 1 "general_movsrc_operand" "Q,rI08,mr,x,l,t,r,i"))] |
| "TARGET_SH1 |
| && (register_operand (operands[0], SImode) |
| || register_operand (operands[1], SImode))" |
| "@ |
| mov.l %1,%0 |
| mov %1,%0 |
| mov.l %1,%0 |
| sts %1,%0 |
| sts %1,%0 |
| movt %0 |
| mov.l %1,%0 |
| fake %1,%0" |
| [(set_attr "type" "pcload,move,load,move,prget,move,store,pcload")]) |
| |
| (define_insn_and_split "load_ra" |
| [(set (match_operand:SI 0 "general_movdst_operand" "") |
| (unspec:SI [(match_operand 1 "register_operand" "")] UNSPEC_RA))] |
| "TARGET_SH1" |
| "#" |
| "&& ! rtx_equal_function_value_matters" |
| [(set (match_dup 0) (match_dup 1))] |
| " |
| { |
| if (TARGET_SHCOMPACT && current_function_has_nonlocal_label) |
| operands[1] = gen_rtx_MEM (SImode, return_address_pointer_rtx); |
| }") |
| |
| (define_insn "*movsi_media" |
| [(set (match_operand:SI 0 "general_movdst_operand" |
| "=r,r,r,r,m,f,m,f,r,f,*b,r,b") |
| (match_operand:SI 1 "general_movsrc_operand" |
| "r,I16C16,nCpg,m,rZ,m,f,rZ,f,f,r,*b,Csy"))] |
| "TARGET_SHMEDIA_FPU |
| && (register_operand (operands[0], SImode) |
| || sh_register_operand (operands[1], SImode))" |
| "@ |
| add.l %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.l %m1, %0 |
| st%M0.l %m0, %N1 |
| fld%M1.s %m1, %0 |
| fst%M0.s %m0, %1 |
| fmov.ls %N1, %0 |
| fmov.sl %1, %0 |
| fmov.s %1, %0 |
| ptabs %1, %0 |
| gettr %1, %0 |
| pt %1, %0" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,fload_media,fstore_media,fload_media,fpconv_media,fmove_media,ptabs_media,gettr_media,pt_media") |
| (set_attr "length" "4,4,8,4,4,4,4,4,4,4,4,4,12")]) |
| |
| (define_insn "*movsi_media_nofpu" |
| [(set (match_operand:SI 0 "general_movdst_operand" |
| "=r,r,r,r,m,*b,r,b") |
| (match_operand:SI 1 "general_movsrc_operand" |
| "r,I16C16,nCpg,m,rZ,r,*b,Csy"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], SImode) |
| || sh_register_operand (operands[1], SImode))" |
| "@ |
| add.l %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.l %m1, %0 |
| st%M0.l %m0, %N1 |
| ptabs %1, %0 |
| gettr %1, %0 |
| pt %1, %0" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,ptabs_media,gettr_media,pt_media") |
| (set_attr "length" "4,4,8,4,4,4,4,12")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_operand:SI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && MOVI_SHORI_BASE_OPERAND_P (operands[1])" |
| [(set (subreg:DI (match_dup 0) 0) (match_dup 2))] |
| " |
| { |
| operands[2] = shallow_copy_rtx (operands[1]); |
| PUT_MODE (operands[2], DImode); |
| }") |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (match_operand:SI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && ((GET_CODE (operands[1]) == CONST_INT |
| && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))) |
| || GET_CODE (operands[1]) == CONST_DOUBLE)" |
| [(set (subreg:DI (match_dup 0) 0) (match_dup 1))]) |
| |
| (define_expand "movsi" |
| [(set (match_operand:SI 0 "general_movdst_operand" "") |
| (match_operand:SI 1 "general_movsrc_operand" ""))] |
| "" |
| "{ if (prepare_move_operands (operands, SImode)) DONE; }") |
| |
| (define_expand "ic_invalidate_line" |
| [(parallel [(unspec_volatile [(match_operand:SI 0 "register_operand" "+r") |
| (match_dup 1)] UNSPEC_ICACHE) |
| (clobber (scratch:SI))])] |
| "TARGET_HARD_SH4 || TARGET_SH5" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_insn (gen_ic_invalidate_line_media (operands[0])); |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT) |
| { |
| operands[1] = function_symbol (\"__ic_invalidate\"); |
| operands[1] = force_reg (Pmode, operands[1]); |
| emit_insn (gen_ic_invalidate_line_compact (operands[0], operands[1])); |
| DONE; |
| } |
| operands[0] = force_reg (Pmode, operands[0]); |
| operands[1] = force_reg (Pmode, GEN_INT (trunc_int_for_mode (0xf0000008, |
| Pmode))); |
| }") |
| |
| ;; The address %0 is assumed to be 4-aligned at least. Thus, by ORing |
| ;; 0xf0000008, we get the low-oder bits *1*00 (binary), which fits |
| ;; the requirement *1*00 for associative address writes. The alignment of |
| ;; %0 implies that its least significant bit is cleared, |
| ;; thus we clear the V bit of a matching entry if there is one. |
| (define_insn "ic_invalidate_line_i" |
| [(unspec_volatile [(match_operand:SI 0 "register_operand" "r") |
| (match_operand:SI 1 "register_operand" "r")] |
| UNSPEC_ICACHE) |
| (clobber (match_scratch:SI 2 "=&r"))] |
| "TARGET_HARD_SH4" |
| "ocbwb\\t@%0\;extu.w\\t%0,%2\;or\\t%1,%2\;mov.l\\t%0,@%2" |
| [(set_attr "length" "8") |
| (set_attr "type" "cwb")]) |
| |
| ;; ??? could make arg 0 an offsettable memory operand to allow to save |
| ;; an add in the code that calculates the address. |
| (define_insn "ic_invalidate_line_media" |
| [(unspec_volatile [(match_operand 0 "register_operand" "r")] |
| UNSPEC_ICACHE)] |
| "TARGET_SHMEDIA" |
| "ocbwb %0,0\;synco\;icbi %0, 0\;synci" |
| [(set_attr "length" "16") |
| (set_attr "type" "invalidate_line_media")]) |
| |
| (define_insn "ic_invalidate_line_compact" |
| [(unspec_volatile [(match_operand:SI 0 "register_operand" "z") |
| (match_operand:SI 1 "register_operand" "r")] |
| UNSPEC_ICACHE) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "initialize_trampoline" |
| [(match_operand:SI 0 "" "") |
| (match_operand:SI 1 "" "") |
| (match_operand:SI 2 "" "")] |
| "TARGET_SHCOMPACT" |
| " |
| { |
| rtx sfun, tramp; |
| |
| tramp = force_reg (Pmode, operands[0]); |
| sfun = force_reg (Pmode, function_symbol (\"__init_trampoline\")); |
| emit_move_insn (gen_rtx_REG (SImode, R2_REG), operands[1]); |
| emit_move_insn (gen_rtx_REG (SImode, R3_REG), operands[2]); |
| |
| emit_insn (gen_initialize_trampoline_compact (tramp, sfun)); |
| DONE; |
| }") |
| |
| (define_insn "initialize_trampoline_compact" |
| [(unspec_volatile [(match_operand:SI 0 "register_operand" "z") |
| (match_operand:SI 1 "register_operand" "r") |
| (reg:SI R2_REG) (reg:SI R3_REG)] |
| UNSPEC_INIT_TRAMP) |
| |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT" |
| "jsr @%1%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "movqi_i" |
| [(set (match_operand:QI 0 "general_movdst_operand" "=r,r,m,r,r,l") |
| (match_operand:QI 1 "general_movsrc_operand" "ri,m,r,t,l,r"))] |
| "TARGET_SH1 |
| && (arith_reg_operand (operands[0], QImode) |
| || arith_reg_operand (operands[1], QImode))" |
| "@ |
| mov %1,%0 |
| mov.b %1,%0 |
| mov.b %1,%0 |
| movt %0 |
| sts %1,%0 |
| lds %1,%0" |
| [(set_attr "type" "move,load,store,move,move,move")]) |
| |
| (define_insn "*movqi_media" |
| [(set (match_operand:QI 0 "general_movdst_operand" "=r,r,r,m") |
| (match_operand:QI 1 "general_movsrc_operand" "r,I16C16,m,rZ"))] |
| "TARGET_SHMEDIA |
| && (arith_reg_operand (operands[0], QImode) |
| || arith_reg_or_0_operand (operands[1], QImode))" |
| "@ |
| add.l %1, r63, %0 |
| movi %1, %0 |
| ld%M1.ub %m1, %0 |
| st%M0.b %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,load_media,store_media")]) |
| |
| (define_expand "movqi" |
| [(set (match_operand:QI 0 "general_operand" "") |
| (match_operand:QI 1 "general_operand" ""))] |
| "" |
| "{ if (prepare_move_operands (operands, QImode)) DONE; }") |
| |
| (define_expand "reload_inqi" |
| [(set (match_operand:SI 2 "" "=&r") |
| (match_operand:QI 1 "inqhi_operand" "")) |
| (set (match_operand:QI 0 "arith_reg_operand" "=r") |
| (truncate:QI (match_dup 3)))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| rtx inner = XEXP (operands[1], 0); |
| int regno = REGNO (inner); |
| |
| regno += HARD_REGNO_NREGS (regno, GET_MODE (inner)) - 1; |
| operands[1] = gen_rtx_REG (SImode, regno); |
| operands[3] = gen_rtx_REG (DImode, REGNO (operands[2])); |
| }") |
| |
| /* When storing r0, we have to avoid reg+reg addressing. */ |
| (define_insn "movhi_i" |
| [(set (match_operand:HI 0 "general_movdst_operand" "=r,r,r,r,m,r,l,r") |
| (match_operand:HI 1 "general_movsrc_operand" "Q,rI08,m,t,r,l,r,i"))] |
| "TARGET_SH1 |
| && (arith_reg_operand (operands[0], HImode) |
| || arith_reg_operand (operands[1], HImode)) |
| && (GET_CODE (operands[0]) != MEM |
| || GET_CODE (XEXP (operands[0], 0)) != PLUS |
| || GET_CODE (XEXP (XEXP (operands[0], 0), 1)) != REG |
| || ! refers_to_regno_p (R0_REG, R0_REG + 1, operands[1], (rtx *)0))" |
| "@ |
| mov.w %1,%0 |
| mov %1,%0 |
| mov.w %1,%0 |
| movt %0 |
| mov.w %1,%0 |
| sts %1,%0 |
| lds %1,%0 |
| fake %1,%0" |
| [(set_attr "type" "pcload,move,load,move,store,move,move,pcload")]) |
| |
| (define_insn "*movhi_media" |
| [(set (match_operand:HI 0 "general_movdst_operand" "=r,r,r,r,m") |
| (match_operand:HI 1 "general_movsrc_operand" "r,I16C16,n,m,rZ"))] |
| "TARGET_SHMEDIA |
| && (arith_reg_operand (operands[0], HImode) |
| || arith_reg_or_0_operand (operands[1], HImode))" |
| "@ |
| add.l %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.w %m1, %0 |
| st%M0.w %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media")]) |
| |
| (define_split |
| [(set (match_operand:HI 0 "register_operand" "") |
| (match_operand:HI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))" |
| [(set (subreg:DI (match_dup 0) 0) (match_dup 1))]) |
| |
| (define_expand "movhi" |
| [(set (match_operand:HI 0 "general_movdst_operand" "") |
| (match_operand:HI 1 "general_movsrc_operand" ""))] |
| "" |
| "{ if (prepare_move_operands (operands, HImode)) DONE; }") |
| |
| (define_expand "reload_inhi" |
| [(set (match_operand:SI 2 "" "=&r") |
| (match_operand:HI 1 "inqhi_operand" "")) |
| (set (match_operand:HI 0 "arith_reg_operand" "=r") |
| (truncate:HI (match_dup 3)))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| rtx inner = XEXP (operands[1], 0); |
| int regno = REGNO (inner); |
| |
| regno += HARD_REGNO_NREGS (regno, GET_MODE (inner)) - 1; |
| operands[1] = gen_rtx_REG (SImode, regno); |
| operands[3] = gen_rtx_REG (DImode, REGNO (operands[2])); |
| }") |
| |
| ;; x/r can be created by inlining/cse, e.g. for execute/961213-1.c |
| ;; compiled with -m2 -ml -O3 -funroll-loops |
| (define_insn "*movdi_i" |
| [(set (match_operand:DI 0 "general_movdst_operand" "=r,r,r,m,r,r,r,*!x") |
| (match_operand:DI 1 "general_movsrc_operand" "Q,r,m,r,I08,i,x,r"))] |
| "TARGET_SH1 |
| && (arith_reg_operand (operands[0], DImode) |
| || arith_reg_operand (operands[1], DImode))" |
| "* return output_movedouble (insn, operands, DImode);" |
| [(set_attr "length" "4") |
| (set_attr "type" "pcload,move,load,store,move,pcload,move,move")]) |
| |
| ;; If the output is a register and the input is memory or a register, we have |
| ;; to be careful and see which word needs to be loaded first. |
| |
| (define_split |
| [(set (match_operand:DI 0 "general_movdst_operand" "") |
| (match_operand:DI 1 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && reload_completed" |
| [(set (match_dup 2) (match_dup 3)) |
| (set (match_dup 4) (match_dup 5))] |
| " |
| { |
| int regno; |
| |
| if ((GET_CODE (operands[0]) == MEM |
| && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC) |
| || (GET_CODE (operands[1]) == MEM |
| && GET_CODE (XEXP (operands[1], 0)) == POST_INC)) |
| FAIL; |
| |
| if (GET_CODE (operands[0]) == REG) |
| regno = REGNO (operands[0]); |
| else if (GET_CODE (operands[0]) == SUBREG) |
| regno = subreg_regno (operands[0]); |
| else if (GET_CODE (operands[0]) == MEM) |
| regno = -1; |
| else |
| abort (); |
| |
| if (regno == -1 |
| || ! refers_to_regno_p (regno, regno + 1, operands[1], 0)) |
| { |
| operands[2] = operand_subword (operands[0], 0, 0, DImode); |
| operands[3] = operand_subword (operands[1], 0, 0, DImode); |
| operands[4] = operand_subword (operands[0], 1, 0, DImode); |
| operands[5] = operand_subword (operands[1], 1, 0, DImode); |
| } |
| else |
| { |
| operands[2] = operand_subword (operands[0], 1, 0, DImode); |
| operands[3] = operand_subword (operands[1], 1, 0, DImode); |
| operands[4] = operand_subword (operands[0], 0, 0, DImode); |
| operands[5] = operand_subword (operands[1], 0, 0, DImode); |
| } |
| |
| if (operands[2] == 0 || operands[3] == 0 |
| || operands[4] == 0 || operands[5] == 0) |
| FAIL; |
| }") |
| |
| (define_insn "*movdi_media" |
| [(set (match_operand:DI 0 "general_movdst_operand" |
| "=r,r,r,rl,m,f,m,f,r,f,*b,r,b") |
| (match_operand:DI 1 "general_movsrc_operand" |
| "r,I16C16,nCpgF,m,rlZ,m,f,rZ,f,f,r,*b,Csy"))] |
| "TARGET_SHMEDIA_FPU |
| && (register_operand (operands[0], DImode) |
| || sh_register_operand (operands[1], DImode))" |
| "@ |
| add %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1 |
| fld%M1.d %m1, %0 |
| fst%M0.d %m0, %1 |
| fmov.qd %N1, %0 |
| fmov.dq %1, %0 |
| fmov.d %1, %0 |
| ptabs %1, %0 |
| gettr %1, %0 |
| pt %1, %0" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,fload_media,fstore_media,fload_media,dfpconv_media,fmove_media,ptabs_media,gettr_media,pt_media") |
| (set_attr "length" "4,4,16,4,4,4,4,4,4,4,4,4,*")]) |
| |
| (define_insn "*movdi_media_nofpu" |
| [(set (match_operand:DI 0 "general_movdst_operand" "=r,r,r,rl,m,*b,r,b") |
| (match_operand:DI 1 "general_movsrc_operand" "r,I16C16,nCpgF,m,rlZ,r,*b,Csy"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], DImode) |
| || sh_register_operand (operands[1], DImode))" |
| "@ |
| add %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1 |
| ptabs %1, %0 |
| gettr %1, %0 |
| pt %1, %0" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,ptabs_media,gettr_media,pt_media") |
| (set_attr "length" "4,4,16,4,4,4,4,*")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (match_operand:DI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && MOVI_SHORI_BASE_OPERAND_P (operands[1])" |
| [(set (match_dup 0) (match_dup 1))] |
| " |
| { |
| rtx insn; |
| |
| if (TARGET_SHMEDIA64) |
| insn = emit_insn (gen_movdi_const (operands[0], operands[1])); |
| else |
| insn = emit_insn (gen_movdi_const_32bit (operands[0], operands[1])); |
| |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, operands[1], |
| REG_NOTES (insn)); |
| |
| DONE; |
| }") |
| |
| (define_expand "movdi_const" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (const:DI (sign_extend:DI |
| (truncate:HI |
| (ashiftrt:DI |
| (match_operand:DI 1 "immediate_operand" "s") |
| (const_int 48)))))) |
| (set (match_dup 0) |
| (ior:DI (ashift:DI (match_dup 0) (const_int 16)) |
| (zero_extend:DI |
| (truncate:HI |
| (const:DI |
| (sign_extend:DI |
| (truncate:HI |
| (ashiftrt:SI |
| (match_dup 1) |
| (const_int 32))))))))) |
| (set (match_dup 0) |
| (ior:DI (ashift:DI (match_dup 0) (const_int 16)) |
| (zero_extend:DI |
| (truncate:HI |
| (const:DI |
| (sign_extend:DI |
| (truncate:HI |
| (ashiftrt:SI |
| (match_dup 1) |
| (const_int 16))))))))) |
| (set (match_dup 0) |
| (ior:DI (ashift:DI (match_dup 0) (const_int 16)) |
| (zero_extend:DI |
| (truncate:HI |
| (const:DI |
| (sign_extend:DI |
| (truncate:HI |
| (match_dup 1))))))))] |
| "TARGET_SHMEDIA64 && reload_completed |
| && MOVI_SHORI_BASE_OPERAND_P (operands[1])" |
| " |
| { |
| sh_mark_label (operands[1], 4); |
| }") |
| |
| (define_expand "movdi_const_32bit" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (const:DI (sign_extend:DI |
| (truncate:HI |
| (ashiftrt:DI |
| (match_operand:DI 1 "immediate_operand" "s") |
| (const_int 16)))))) |
| (set (match_dup 0) |
| (ior:DI (ashift:DI (match_dup 0) (const_int 16)) |
| (zero_extend:DI |
| (truncate:HI |
| (const:DI |
| (sign_extend:DI |
| (truncate:HI |
| (match_dup 1))))))))] |
| "TARGET_SHMEDIA32 && reload_completed |
| && MOVI_SHORI_BASE_OPERAND_P (operands[1])" |
| " |
| { |
| sh_mark_label (operands[1], 2); |
| }") |
| |
| (define_expand "movdi_const_16bit" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (const:DI (sign_extend:DI |
| (truncate:HI |
| (match_operand:DI 1 "immediate_operand" "s")))))] |
| "TARGET_SHMEDIA && flag_pic && reload_completed |
| && GET_CODE (operands[1]) == SYMBOL_REF" |
| "") |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (match_operand:DI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && GET_CODE (operands[1]) == CONST_INT |
| && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))" |
| [(set (match_dup 0) (match_dup 2)) |
| (match_dup 1)] |
| " |
| { |
| unsigned HOST_WIDE_INT val = INTVAL (operands[1]); |
| unsigned HOST_WIDE_INT low = val; |
| unsigned HOST_WIDE_INT high = val; |
| unsigned HOST_WIDE_INT sign; |
| unsigned HOST_WIDE_INT val2 = val ^ (val-1); |
| |
| /* Sign-extend the 16 least-significant bits. */ |
| low &= 0xffff; |
| low ^= 0x8000; |
| low -= 0x8000; |
| |
| /* Arithmetic shift right the word by 16 bits. */ |
| high >>= 16; |
| sign = 1; |
| sign <<= (HOST_BITS_PER_WIDE_INT - 16 - 1); |
| high ^= sign; |
| high -= sign; |
| do |
| { |
| /* If we can't generate the constant with a two-insn movi / shori |
| sequence, try some other strategies. */ |
| if (! CONST_OK_FOR_I16 (high)) |
| { |
| /* Try constant load / left shift. We know VAL != 0. */ |
| val2 = val ^ (val-1); |
| if (val2 > 0x1ffff) |
| { |
| int trailing_zeroes = exact_log2 ((val2 >> 16) + 1) + 15; |
| |
| if (CONST_OK_FOR_I16 (val >> trailing_zeroes) |
| || (! CONST_OK_FOR_I16 (high >> 16) |
| && CONST_OK_FOR_I16 (val >> (trailing_zeroes + 16)))) |
| { |
| val2 = (HOST_WIDE_INT) val >> trailing_zeroes; |
| operands[1] = gen_ashldi3_media (operands[0], operands[0], |
| GEN_INT (trailing_zeroes)); |
| break; |
| } |
| } |
| /* Try constant load / right shift. */ |
| val2 = (val >> 15) + 1; |
| if (val2 == (val2 & -val2)) |
| { |
| int shift = 49 - exact_log2 (val2); |
| |
| val2 = trunc_int_for_mode (val << shift, DImode); |
| if (CONST_OK_FOR_I16 (val2)) |
| { |
| operands[1] = gen_lshrdi3_media (operands[0], operands[0], |
| GEN_INT (shift)); |
| break; |
| } |
| } |
| /* Try mperm.w . */ |
| val2 = val & 0xffff; |
| if ((val >> 16 & 0xffff) == val2 |
| && (val >> 32 & 0xffff) == val2 |
| && (val >> 48 & 0xffff) == val2) |
| { |
| val2 = (HOST_WIDE_INT) val >> 48; |
| operands[1] = gen_rtx_REG (V4HImode, true_regnum (operands[0])); |
| operands[1] = gen_mperm_w0 (operands[1], operands[1]); |
| break; |
| } |
| /* Try movi / mshflo.l */ |
| val2 = (HOST_WIDE_INT) val >> 32; |
| if (val2 == trunc_int_for_mode (val, SImode)) |
| { |
| operands[1] = gen_mshflo_l_di (operands[0], operands[0], |
| operands[0]); |
| break; |
| } |
| /* Try movi / mshflo.l w/ r63. */ |
| val2 = val + ((HOST_WIDE_INT) -1 << 32); |
| if ((HOST_WIDE_INT) val2 < 0 && CONST_OK_FOR_I16 (val2)) |
| { |
| operands[1] = gen_mshflo_l_di (operands[0], operands[0], |
| GEN_INT (0)); |
| break; |
| } |
| } |
| val2 = high; |
| operands[1] = gen_shori_media (operands[0], operands[0], GEN_INT (low)); |
| } |
| while (0); |
| operands[2] = GEN_INT (val2); |
| }") |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (match_operand:DI 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && GET_CODE (operands[1]) == CONST_DOUBLE" |
| [(set (match_dup 0) (match_dup 2)) |
| (set (match_dup 0) |
| (ior:DI (ashift:DI (match_dup 0) (const_int 16)) |
| (zero_extend:DI (truncate:HI (match_dup 1)))))] |
| " |
| { |
| unsigned HOST_WIDE_INT low = CONST_DOUBLE_LOW (operands[1]); |
| unsigned HOST_WIDE_INT high = CONST_DOUBLE_HIGH (operands[1]); |
| unsigned HOST_WIDE_INT val = low; |
| unsigned HOST_WIDE_INT sign; |
| |
| /* Sign-extend the 16 least-significant bits. */ |
| val &= 0xffff; |
| val ^= 0x8000; |
| val -= 0x8000; |
| operands[1] = GEN_INT (val); |
| |
| /* Arithmetic shift right the double-word by 16 bits. */ |
| low >>= 16; |
| low |= (high & 0xffff) << (HOST_BITS_PER_WIDE_INT - 16); |
| high >>= 16; |
| sign = 1; |
| sign <<= (HOST_BITS_PER_WIDE_INT - 16 - 1); |
| high ^= sign; |
| high -= sign; |
| |
| /* This will only be true if high is a sign-extension of low, i.e., |
| it must be either 0 or (unsigned)-1, and be zero iff the |
| most-significant bit of low is set. */ |
| if (high + (low >> (HOST_BITS_PER_WIDE_INT - 1)) == 0) |
| operands[2] = GEN_INT (low); |
| else |
| operands[2] = immed_double_const (low, high, DImode); |
| }") |
| |
| (define_insn "shori_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") |
| (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0,0") |
| (const_int 16)) |
| (zero_extend:DI |
| (truncate:HI |
| (match_operand:DI 2 "immediate_operand" "I16C16,nF")))))] |
| "TARGET_SHMEDIA" |
| "@ |
| shori %u2, %0 |
| #" |
| [(set_attr "type" "arith_media,*")]) |
| |
| (define_expand "movdi" |
| [(set (match_operand:DI 0 "general_movdst_operand" "") |
| (match_operand:DI 1 "general_movsrc_operand" ""))] |
| "" |
| "{ if (prepare_move_operands (operands, DImode)) DONE; }") |
| |
| (define_insn "movdf_media" |
| [(set (match_operand:DF 0 "general_movdst_operand" "=f,f,r,r,r,f,m,r,m") |
| (match_operand:DF 1 "general_movsrc_operand" "f,rZ,f,r,F,m,f,m,rZ"))] |
| "TARGET_SHMEDIA_FPU |
| && (register_operand (operands[0], DFmode) |
| || sh_register_operand (operands[1], DFmode))" |
| "@ |
| fmov.d %1, %0 |
| fmov.qd %N1, %0 |
| fmov.dq %1, %0 |
| add %1, r63, %0 |
| # |
| fld%M1.d %m1, %0 |
| fst%M0.d %m0, %1 |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1" |
| [(set_attr "type" "fmove_media,fload_media,dfpconv_media,arith_media,*,fload_media,fstore_media,load_media,store_media")]) |
| |
| (define_insn "movdf_media_nofpu" |
| [(set (match_operand:DF 0 "general_movdst_operand" "=r,r,r,m") |
| (match_operand:DF 1 "general_movsrc_operand" "r,F,m,rZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], DFmode) |
| || sh_register_operand (operands[1], DFmode))" |
| "@ |
| add %1, r63, %0 |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1" |
| [(set_attr "type" "arith_media,*,load_media,store_media")]) |
| |
| (define_split |
| [(set (match_operand:DF 0 "arith_reg_operand" "") |
| (match_operand:DF 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed" |
| [(set (match_dup 3) (match_dup 2))] |
| " |
| { |
| int endian = WORDS_BIG_ENDIAN ? 1 : 0; |
| long values[2]; |
| REAL_VALUE_TYPE value; |
| |
| REAL_VALUE_FROM_CONST_DOUBLE (value, operands[1]); |
| REAL_VALUE_TO_TARGET_DOUBLE (value, values); |
| |
| if (HOST_BITS_PER_WIDE_INT >= 64) |
| operands[2] = immed_double_const ((unsigned long) values[endian] |
| | ((HOST_WIDE_INT) values[1 - endian] |
| << 32), 0, DImode); |
| else if (HOST_BITS_PER_WIDE_INT == 32) |
| operands[2] = immed_double_const (values[endian], values[1 - endian], |
| DImode); |
| else |
| abort (); |
| |
| operands[3] = gen_rtx_REG (DImode, true_regnum (operands[0])); |
| }") |
| |
| ;; ??? This should be a define expand. |
| |
| (define_insn "movdf_k" |
| [(set (match_operand:DF 0 "general_movdst_operand" "=r,r,r,m") |
| (match_operand:DF 1 "general_movsrc_operand" "r,FQ,m,r"))] |
| "TARGET_SH1 |
| && (! TARGET_SH4 || reload_completed |
| /* ??? We provide some insn so that direct_{load,store}[DFmode] get set */ |
| || (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == 3) |
| || (GET_CODE (operands[1]) == REG && REGNO (operands[1]) == 3)) |
| && (arith_reg_operand (operands[0], DFmode) |
| || arith_reg_operand (operands[1], DFmode))" |
| "* return output_movedouble (insn, operands, DFmode);" |
| [(set_attr "length" "4") |
| (set_attr "type" "move,pcload,load,store")]) |
| |
| ;; All alternatives of movdf_i4 are split for ! TARGET_FMOVD. |
| ;; However, the d/F/c/z alternative cannot be split directly; it is converted |
| ;; with special code in machine_dependent_reorg into a load of the R0_REG and |
| ;; the d/m/c/X alternative, which is split later into single-precision |
| ;; instructions. And when not optimizing, no splits are done before fixing |
| ;; up pcloads, so we need usable length information for that. |
| (define_insn "movdf_i4" |
| [(set (match_operand:DF 0 "general_movdst_operand" "=d,r,d,d,m,r,r,m,!??r,!???d") |
| (match_operand:DF 1 "general_movsrc_operand" "d,r,F,m,d,FQ,m,r,d,r")) |
| (use (match_operand:PSI 2 "fpscr_operand" "c,c,c,c,c,c,c,c,c,c")) |
| (clobber (match_scratch:SI 3 "=X,X,&z,X,X,X,X,X,X,X"))] |
| "TARGET_SH4 |
| && (arith_reg_operand (operands[0], DFmode) |
| || arith_reg_operand (operands[1], DFmode))" |
| "@ |
| fmov %1,%0 |
| # |
| # |
| fmov.d %1,%0 |
| fmov.d %1,%0 |
| # |
| # |
| # |
| # |
| #" |
| [(set_attr_alternative "length" |
| [(if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 4)) |
| (const_int 4) |
| (if_then_else (eq_attr "fmovd" "yes") (const_int 4) (const_int 6)) |
| (if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 6)) |
| (if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 6)) |
| (const_int 4) |
| (const_int 8) (const_int 8) ;; these need only 8 bytes for @(r0,rn) |
| ;; We can't use 4-byte push/pop on SHcompact, so we have to |
| ;; increment or decrement r15 explicitly. |
| (if_then_else |
| (ne (symbol_ref "TARGET_SHCOMPACT") (const_int 0)) |
| (const_int 10) (const_int 8)) |
| (if_then_else |
| (ne (symbol_ref "TARGET_SHCOMPACT") (const_int 0)) |
| (const_int 10) (const_int 8))]) |
| (set_attr "type" "fmove,move,pcfload,fload,store,pcload,load,store,load,fload") |
| (set_attr "late_fp_use" "*,*,*,*,yes,*,*,*,*,*") |
| (set (attr "fp_mode") (if_then_else (eq_attr "fmovd" "yes") |
| (const_string "double") |
| (const_string "none")))]) |
| |
| ;; Moving DFmode between fp/general registers through memory |
| ;; (the top of the stack) is faster than moving through fpul even for |
| ;; little endian. Because the type of an instruction is important for its |
| ;; scheduling, it is beneficial to split these operations, rather than |
| ;; emitting them in one single chunk, even if this will expose a stack |
| ;; use that will prevent scheduling of other stack accesses beyond this |
| ;; instruction. |
| (define_split |
| [(set (match_operand:DF 0 "register_operand" "") |
| (match_operand:DF 1 "register_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 "=X"))] |
| "TARGET_SH4 && reload_completed |
| && (true_regnum (operands[0]) < 16) != (true_regnum (operands[1]) < 16)" |
| [(const_int 0)] |
| " |
| { |
| rtx insn, tos; |
| |
| if (TARGET_SH5 && true_regnum (operands[1]) < 16) |
| { |
| emit_move_insn (stack_pointer_rtx, |
| plus_constant (stack_pointer_rtx, -8)); |
| tos = gen_rtx_MEM (DFmode, stack_pointer_rtx); |
| } |
| else |
| tos = gen_rtx (MEM, DFmode, gen_rtx (PRE_DEC, Pmode, stack_pointer_rtx)); |
| insn = emit_insn (gen_movdf_i4 (tos, operands[1], operands[2])); |
| if (! (TARGET_SH5 && true_regnum (operands[1]) < 16)) |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); |
| if (TARGET_SH5 && true_regnum (operands[0]) < 16) |
| tos = gen_rtx_MEM (DFmode, stack_pointer_rtx); |
| else |
| tos = gen_rtx (MEM, DFmode, gen_rtx (POST_INC, Pmode, stack_pointer_rtx)); |
| insn = emit_insn (gen_movdf_i4 (operands[0], tos, operands[2])); |
| if (TARGET_SH5 && true_regnum (operands[0]) < 16) |
| emit_move_insn (stack_pointer_rtx, plus_constant (stack_pointer_rtx, 8)); |
| else |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); |
| DONE; |
| }") |
| |
| ;; local-alloc sometimes allocates scratch registers even when not required, |
| ;; so we must be prepared to handle these. |
| |
| ;; Remove the use and clobber from a movdf_i4 so that we can use movdf_k. |
| (define_split |
| [(set (match_operand:DF 0 "general_movdst_operand" "") |
| (match_operand:DF 1 "general_movsrc_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH4 |
| && reload_completed |
| && true_regnum (operands[0]) < 16 |
| && true_regnum (operands[1]) < 16" |
| [(set (match_dup 0) (match_dup 1))] |
| " |
| { |
| /* If this was a reg <-> mem operation with base + index reg addressing, |
| we have to handle this in a special way. */ |
| rtx mem = operands[0]; |
| int store_p = 1; |
| if (! memory_operand (mem, DFmode)) |
| { |
| mem = operands[1]; |
| store_p = 0; |
| } |
| if (GET_CODE (mem) == SUBREG && SUBREG_BYTE (mem) == 0) |
| mem = SUBREG_REG (mem); |
| if (GET_CODE (mem) == MEM) |
| { |
| rtx addr = XEXP (mem, 0); |
| if (GET_CODE (addr) == PLUS |
| && GET_CODE (XEXP (addr, 0)) == REG |
| && GET_CODE (XEXP (addr, 1)) == REG) |
| { |
| int offset; |
| rtx reg0 = gen_rtx (REG, Pmode, 0); |
| rtx regop = operands[store_p], word0 ,word1; |
| |
| if (GET_CODE (regop) == SUBREG) |
| alter_subreg (®op); |
| if (REGNO (XEXP (addr, 0)) == REGNO (XEXP (addr, 1))) |
| offset = 2; |
| else |
| offset = 4; |
| mem = copy_rtx (mem); |
| PUT_MODE (mem, SImode); |
| word0 = gen_rtx (SUBREG, SImode, regop, 0); |
| alter_subreg (&word0); |
| word1 = gen_rtx (SUBREG, SImode, regop, 4); |
| alter_subreg (&word1); |
| if (store_p || ! refers_to_regno_p (REGNO (word0), |
| REGNO (word0) + 1, addr, 0)) |
| { |
| emit_insn (store_p |
| ? gen_movsi_ie (mem, word0) |
| : gen_movsi_ie (word0, mem)); |
| emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (offset))); |
| mem = copy_rtx (mem); |
| emit_insn (store_p |
| ? gen_movsi_ie (mem, word1) |
| : gen_movsi_ie (word1, mem)); |
| emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (-offset))); |
| } |
| else |
| { |
| emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (offset))); |
| emit_insn (gen_movsi_ie (word1, mem)); |
| emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (-offset))); |
| mem = copy_rtx (mem); |
| emit_insn (gen_movsi_ie (word0, mem)); |
| } |
| DONE; |
| } |
| } |
| }") |
| |
| ;; Split away the clobber of r0 after machine_dependent_reorg has fixed pcloads. |
| (define_split |
| [(set (match_operand:DF 0 "register_operand" "") |
| (match_operand:DF 1 "memory_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (reg:SI R0_REG))] |
| "TARGET_SH4 && reload_completed" |
| [(parallel [(set (match_dup 0) (match_dup 1)) |
| (use (match_dup 2)) |
| (clobber (scratch:SI))])] |
| "") |
| |
| (define_expand "reload_indf" |
| [(parallel [(set (match_operand:DF 0 "register_operand" "=f") |
| (match_operand:DF 1 "immediate_operand" "FQ")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (match_operand:SI 2 "register_operand" "=&z"))])] |
| "TARGET_SH1" |
| "") |
| |
| (define_expand "reload_outdf" |
| [(parallel [(set (match_operand:DF 0 "register_operand" "=r,f") |
| (match_operand:DF 1 "register_operand" "af,r")) |
| (clobber (match_operand:SI 2 "register_operand" "=&y,y"))])] |
| "TARGET_SH1" |
| "") |
| |
| ;; Simplify no-op moves. |
| (define_split |
| [(set (match_operand:SF 0 "register_operand" "") |
| (match_operand:SF 1 "register_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH2E && reload_completed |
| && true_regnum (operands[0]) == true_regnum (operands[1])" |
| [(set (match_dup 0) (match_dup 0))] |
| "") |
| |
| ;; fmovd substitute post-reload splits |
| (define_split |
| [(set (match_operand:DF 0 "register_operand" "") |
| (match_operand:DF 1 "register_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH4 && ! TARGET_FMOVD && reload_completed |
| && FP_OR_XD_REGISTER_P (true_regnum (operands[0])) |
| && FP_OR_XD_REGISTER_P (true_regnum (operands[1]))" |
| [(const_int 0)] |
| " |
| { |
| int dst = true_regnum (operands[0]), src = true_regnum (operands[1]); |
| emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, dst), |
| gen_rtx (REG, SFmode, src), operands[2])); |
| emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, dst + 1), |
| gen_rtx (REG, SFmode, src + 1), operands[2])); |
| DONE; |
| }") |
| |
| (define_split |
| [(set (match_operand:DF 0 "register_operand" "") |
| (mem:DF (match_operand:SI 1 "register_operand" ""))) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH4 && ! TARGET_FMOVD && reload_completed |
| && FP_OR_XD_REGISTER_P (true_regnum (operands[0])) |
| && find_regno_note (insn, REG_DEAD, true_regnum (operands[1]))" |
| [(const_int 0)] |
| " |
| { |
| int regno = true_regnum (operands[0]); |
| rtx insn; |
| rtx mem2 = gen_rtx (MEM, SFmode, gen_rtx (POST_INC, Pmode, operands[1])); |
| |
| insn = emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, |
| regno + !! TARGET_LITTLE_ENDIAN), |
| mem2, operands[2])); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[1], NULL_RTX); |
| insn = emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, |
| regno + ! TARGET_LITTLE_ENDIAN), |
| gen_rtx (MEM, SFmode, operands[1]), |
| operands[2])); |
| DONE; |
| }") |
| |
| (define_split |
| [(set (match_operand:DF 0 "register_operand" "") |
| (match_operand:DF 1 "memory_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH4 && ! TARGET_FMOVD && reload_completed |
| && FP_OR_XD_REGISTER_P (true_regnum (operands[0]))" |
| [(const_int 0)] |
| " |
| { |
| int regno = true_regnum (operands[0]); |
| rtx addr, insn, adjust = NULL_RTX; |
| rtx mem2 = copy_rtx (operands[1]); |
| rtx reg0 = gen_rtx_REG (SFmode, regno + !! TARGET_LITTLE_ENDIAN); |
| rtx reg1 = gen_rtx_REG (SFmode, regno + ! TARGET_LITTLE_ENDIAN); |
| |
| PUT_MODE (mem2, SFmode); |
| operands[1] = copy_rtx (mem2); |
| addr = XEXP (mem2, 0); |
| if (GET_CODE (addr) != POST_INC) |
| { |
| /* If we have to modify the stack pointer, the value that we have |
| read with post-increment might be modified by an interrupt, |
| so write it back. */ |
| if (REGNO (addr) == STACK_POINTER_REGNUM) |
| adjust = gen_push_e (reg0); |
| else |
| adjust = gen_addsi3 (addr, addr, GEN_INT (-4)); |
| XEXP (mem2, 0) = addr = gen_rtx_POST_INC (SImode, addr); |
| } |
| addr = XEXP (addr, 0); |
| insn = emit_insn (gen_movsf_ie (reg0, mem2, operands[2])); |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_INC, addr, NULL_RTX); |
| insn = emit_insn (gen_movsf_ie (reg1, operands[1], operands[2])); |
| if (adjust) |
| emit_insn (adjust); |
| else |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_INC, addr, NULL_RTX); |
| DONE; |
| }") |
| |
| (define_split |
| [(set (match_operand:DF 0 "memory_operand" "") |
| (match_operand:DF 1 "register_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (match_scratch:SI 3 ""))] |
| "TARGET_SH4 && ! TARGET_FMOVD && reload_completed |
| && FP_OR_XD_REGISTER_P (true_regnum (operands[1]))" |
| [(const_int 0)] |
| " |
| { |
| int regno = true_regnum (operands[1]); |
| rtx insn, addr, adjust = NULL_RTX; |
| |
| operands[0] = copy_rtx (operands[0]); |
| PUT_MODE (operands[0], SFmode); |
| insn = emit_insn (gen_movsf_ie (operands[0], |
| gen_rtx (REG, SFmode, |
| regno + ! TARGET_LITTLE_ENDIAN), |
| operands[2])); |
| operands[0] = copy_rtx (operands[0]); |
| addr = XEXP (operands[0], 0); |
| if (GET_CODE (addr) != PRE_DEC) |
| { |
| adjust = gen_addsi3 (addr, addr, GEN_INT (4)); |
| emit_insn_before (adjust, insn); |
| XEXP (operands[0], 0) = addr = gen_rtx (PRE_DEC, SImode, addr); |
| } |
| addr = XEXP (addr, 0); |
| if (! adjust) |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, addr, NULL_RTX); |
| insn = emit_insn (gen_movsf_ie (operands[0], |
| gen_rtx (REG, SFmode, |
| regno + !! TARGET_LITTLE_ENDIAN), |
| operands[2])); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, addr, NULL_RTX); |
| DONE; |
| }") |
| |
| ;; If the output is a register and the input is memory or a register, we have |
| ;; to be careful and see which word needs to be loaded first. |
| |
| (define_split |
| [(set (match_operand:DF 0 "general_movdst_operand" "") |
| (match_operand:DF 1 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && reload_completed" |
| [(set (match_dup 2) (match_dup 3)) |
| (set (match_dup 4) (match_dup 5))] |
| " |
| { |
| int regno; |
| |
| if ((GET_CODE (operands[0]) == MEM |
| && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC) |
| || (GET_CODE (operands[1]) == MEM |
| && GET_CODE (XEXP (operands[1], 0)) == POST_INC)) |
| FAIL; |
| |
| if (GET_CODE (operands[0]) == REG) |
| regno = REGNO (operands[0]); |
| else if (GET_CODE (operands[0]) == SUBREG) |
| regno = subreg_regno (operands[0]); |
| else if (GET_CODE (operands[0]) == MEM) |
| regno = -1; |
| else |
| abort (); |
| |
| if (regno == -1 |
| || ! refers_to_regno_p (regno, regno + 1, operands[1], 0)) |
| { |
| operands[2] = operand_subword (operands[0], 0, 0, DFmode); |
| operands[3] = operand_subword (operands[1], 0, 0, DFmode); |
| operands[4] = operand_subword (operands[0], 1, 0, DFmode); |
| operands[5] = operand_subword (operands[1], 1, 0, DFmode); |
| } |
| else |
| { |
| operands[2] = operand_subword (operands[0], 1, 0, DFmode); |
| operands[3] = operand_subword (operands[1], 1, 0, DFmode); |
| operands[4] = operand_subword (operands[0], 0, 0, DFmode); |
| operands[5] = operand_subword (operands[1], 0, 0, DFmode); |
| } |
| |
| if (operands[2] == 0 || operands[3] == 0 |
| || operands[4] == 0 || operands[5] == 0) |
| FAIL; |
| }") |
| |
| ;; If a base address generated by LEGITIMIZE_ADDRESS for SImode is |
| ;; used only once, let combine add in the index again. |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (match_operand:SI 1 "" "")) |
| (clobber (match_operand 2 "register_operand" ""))] |
| "TARGET_SH1 && ! reload_in_progress && ! reload_completed" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| rtx addr, reg, const_int; |
| |
| if (GET_CODE (operands[1]) != MEM) |
| FAIL; |
| addr = XEXP (operands[1], 0); |
| if (GET_CODE (addr) != PLUS) |
| FAIL; |
| reg = XEXP (addr, 0); |
| const_int = XEXP (addr, 1); |
| if (! (BASE_REGISTER_RTX_P (reg) && INDEX_REGISTER_RTX_P (operands[2]) |
| && GET_CODE (const_int) == CONST_INT)) |
| FAIL; |
| emit_move_insn (operands[2], const_int); |
| emit_move_insn (operands[0], |
| change_address (operands[1], VOIDmode, |
| gen_rtx_PLUS (SImode, reg, operands[2]))); |
| DONE; |
| }") |
| |
| (define_split |
| [(set (match_operand:SI 1 "" "") |
| (match_operand:SI 0 "register_operand" "")) |
| (clobber (match_operand 2 "register_operand" ""))] |
| "TARGET_SH1 && ! reload_in_progress && ! reload_completed" |
| [(use (reg:SI R0_REG))] |
| " |
| { |
| rtx addr, reg, const_int; |
| |
| if (GET_CODE (operands[1]) != MEM) |
| FAIL; |
| addr = XEXP (operands[1], 0); |
| if (GET_CODE (addr) != PLUS) |
| FAIL; |
| reg = XEXP (addr, 0); |
| const_int = XEXP (addr, 1); |
| if (! (BASE_REGISTER_RTX_P (reg) && INDEX_REGISTER_RTX_P (operands[2]) |
| && GET_CODE (const_int) == CONST_INT)) |
| FAIL; |
| emit_move_insn (operands[2], const_int); |
| emit_move_insn (change_address (operands[1], VOIDmode, |
| gen_rtx_PLUS (SImode, reg, operands[2])), |
| operands[0]); |
| DONE; |
| }") |
| |
| (define_expand "movdf" |
| [(set (match_operand:DF 0 "general_movdst_operand" "") |
| (match_operand:DF 1 "general_movsrc_operand" ""))] |
| "" |
| " |
| { |
| if (prepare_move_operands (operands, DFmode)) DONE; |
| if (TARGET_SHMEDIA) |
| { |
| if (TARGET_SHMEDIA_FPU) |
| emit_insn (gen_movdf_media (operands[0], operands[1])); |
| else |
| emit_insn (gen_movdf_media_nofpu (operands[0], operands[1])); |
| DONE; |
| } |
| if (TARGET_SH4) |
| { |
| emit_df_insn (gen_movdf_i4 (operands[0], operands[1], get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| ;;This is incompatible with the way gcc uses subregs. |
| ;;(define_insn "movv2sf_i" |
| ;; [(set (match_operand:V2SF 0 "nonimmediate_operand" "=f,f,m") |
| ;; (match_operand:V2SF 1 "nonimmediate_operand" "f,m,f"))] |
| ;; "TARGET_SHMEDIA_FPU |
| ;; && (fp_arith_reg_operand (operands[0], V2SFmode) |
| ;; || fp_arith_reg_operand (operands[1], V2SFmode))" |
| ;; "@ |
| ;; # |
| ;; fld%M1.p %m1, %0 |
| ;; fst%M0.p %m0, %1" |
| ;; [(set_attr "type" "*,fload_media,fstore_media")]) |
| |
| (define_insn_and_split "movv2sf_i" |
| [(set (match_operand:V2SF 0 "general_movdst_operand" "=f,rf,r,m,mf") |
| (match_operand:V2SF 1 "general_operand" "fm,rfm?,F?,f,rfZ?"))] |
| "TARGET_SHMEDIA_FPU" |
| "#" |
| "TARGET_SHMEDIA_FPU && reload_completed" |
| [(set (match_dup 0) (match_dup 1))] |
| " |
| { |
| operands[0] = simplify_gen_subreg (DFmode, operands[0], V2SFmode, 0); |
| operands[1] = simplify_gen_subreg (DFmode, operands[1], V2SFmode, 0); |
| }") |
| |
| (define_expand "movv2sf" |
| [(set (match_operand:V2SF 0 "general_movdst_operand" "") |
| (match_operand:V2SF 1 "nonimmediate_operand" ""))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (prepare_move_operands (operands, V2SFmode)) |
| DONE; |
| }") |
| |
| (define_expand "addv2sf3" |
| [(match_operand:V2SF 0 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 1 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 2 "fp_arith_reg_operand" "")] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_expand_binop_v2sf (PLUS, operands[0], operands[1], operands[2]); |
| DONE; |
| }") |
| |
| (define_expand "subv2sf3" |
| [(match_operand:V2SF 0 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 1 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 2 "fp_arith_reg_operand" "")] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_expand_binop_v2sf (MINUS, operands[0], operands[1], operands[2]); |
| DONE; |
| }") |
| |
| (define_expand "mulv2sf3" |
| [(match_operand:V2SF 0 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 1 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 2 "fp_arith_reg_operand" "")] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_expand_binop_v2sf (MULT, operands[0], operands[1], operands[2]); |
| DONE; |
| }") |
| |
| (define_expand "divv2sf3" |
| [(match_operand:V2SF 0 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 1 "fp_arith_reg_operand" "") |
| (match_operand:V2SF 2 "fp_arith_reg_operand" "")] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_expand_binop_v2sf (DIV, operands[0], operands[1], operands[2]); |
| DONE; |
| }") |
| |
| (define_insn_and_split "*movv4sf_i" |
| [(set (match_operand:V4SF 0 "nonimmediate_operand" "=f,f,m") |
| (match_operand:V4SF 1 "general_operand" "fZ,m,fZ"))] |
| "TARGET_SHMEDIA_FPU" |
| "#" |
| "&& reload_completed" |
| [(const_int 0)] |
| " |
| { |
| int i; |
| |
| for (i = 0; i < 4/2; i++) |
| { |
| rtx x, y; |
| |
| if (GET_CODE (operands[0]) == MEM) |
| x = gen_rtx_MEM (V2SFmode, |
| plus_constant (XEXP (operands[0], 0), |
| i * GET_MODE_SIZE (V2SFmode))); |
| else |
| x = simplify_gen_subreg (V2SFmode, operands[0], V4SFmode, i * 8); |
| |
| if (GET_CODE (operands[1]) == MEM) |
| y = gen_rtx_MEM (V2SFmode, |
| plus_constant (XEXP (operands[1], 0), |
| i * GET_MODE_SIZE (V2SFmode))); |
| else |
| y = simplify_gen_subreg (V2SFmode, operands[1], V4SFmode, i * 8); |
| |
| emit_insn (gen_movv2sf_i (x, y)); |
| } |
| |
| DONE; |
| }" |
| [(set_attr "length" "8")]) |
| |
| (define_expand "movv4sf" |
| [(set (match_operand:V4SF 0 "nonimmediate_operand" "") |
| (match_operand:V4SF 1 "general_operand" ""))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (prepare_move_operands (operands, V4SFmode)) |
| DONE; |
| }") |
| |
| (define_insn_and_split "*movv16sf_i" |
| [(set (match_operand:V16SF 0 "nonimmediate_operand" "=f,f,m") |
| (match_operand:V16SF 1 "nonimmediate_operand" "f,m,f"))] |
| "TARGET_SHMEDIA_FPU" |
| "#" |
| "&& reload_completed" |
| [(const_int 0)] |
| " |
| { |
| int i; |
| |
| for (i = 0; i < 16/2; i++) |
| { |
| rtx x,y; |
| |
| if (GET_CODE (operands[0]) == MEM) |
| x = gen_rtx_MEM (V2SFmode, |
| plus_constant (XEXP (operands[0], 0), |
| i * GET_MODE_SIZE (V2SFmode))); |
| else |
| { |
| x = gen_rtx_SUBREG (V2SFmode, operands[0], i * 8); |
| alter_subreg (&x); |
| } |
| |
| if (GET_CODE (operands[1]) == MEM) |
| y = gen_rtx_MEM (V2SFmode, |
| plus_constant (XEXP (operands[1], 0), |
| i * GET_MODE_SIZE (V2SFmode))); |
| else |
| { |
| y = gen_rtx_SUBREG (V2SFmode, operands[1], i * 8); |
| alter_subreg (&y); |
| } |
| |
| emit_insn (gen_movv2sf_i (x, y)); |
| } |
| |
| DONE; |
| }" |
| [(set_attr "length" "32")]) |
| |
| (define_expand "movv16sf" |
| [(set (match_operand:V16SF 0 "nonimmediate_operand" "=f,f,m") |
| (match_operand:V16SF 1 "nonimmediate_operand" "f,m,f"))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (prepare_move_operands (operands, V16SFmode)) |
| DONE; |
| }") |
| |
| (define_insn "movsf_media" |
| [(set (match_operand:SF 0 "general_movdst_operand" "=f,f,r,r,r,f,m,r,m") |
| (match_operand:SF 1 "general_movsrc_operand" "f,rZ,f,r,F,m,f,m,rZ"))] |
| "TARGET_SHMEDIA_FPU |
| && (register_operand (operands[0], SFmode) |
| || sh_register_operand (operands[1], SFmode))" |
| "@ |
| fmov.s %1, %0 |
| fmov.ls %N1, %0 |
| fmov.sl %1, %0 |
| add.l %1, r63, %0 |
| # |
| fld%M1.s %m1, %0 |
| fst%M0.s %m0, %1 |
| ld%M1.l %m1, %0 |
| st%M0.l %m0, %N1" |
| [(set_attr "type" "fmove_media,fload_media,fpconv_media,arith_media,*,fload_media,fstore_media,load_media,store_media")]) |
| |
| (define_insn "movsf_media_nofpu" |
| [(set (match_operand:SF 0 "general_movdst_operand" "=r,r,r,m") |
| (match_operand:SF 1 "general_movsrc_operand" "r,F,m,rZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], SFmode) |
| || sh_register_operand (operands[1], SFmode))" |
| "@ |
| add.l %1, r63, %0 |
| # |
| ld%M1.l %m1, %0 |
| st%M0.l %m0, %N1" |
| [(set_attr "type" "arith_media,*,load_media,store_media")]) |
| |
| (define_split |
| [(set (match_operand:SF 0 "arith_reg_operand" "") |
| (match_operand:SF 1 "immediate_operand" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && ! FP_REGISTER_P (true_regnum (operands[0]))" |
| [(set (match_dup 3) (match_dup 2))] |
| " |
| { |
| long values; |
| REAL_VALUE_TYPE value; |
| |
| REAL_VALUE_FROM_CONST_DOUBLE (value, operands[1]); |
| REAL_VALUE_TO_TARGET_SINGLE (value, values); |
| operands[2] = GEN_INT (values); |
| |
| operands[3] = gen_rtx_REG (DImode, true_regnum (operands[0])); |
| }") |
| |
| (define_insn "movsf_i" |
| [(set (match_operand:SF 0 "general_movdst_operand" "=r,r,r,r,m,l,r") |
| (match_operand:SF 1 "general_movsrc_operand" "r,G,FQ,mr,r,r,l"))] |
| "TARGET_SH1 |
| && (! TARGET_SH2E |
| /* ??? We provide some insn so that direct_{load,store}[SFmode] get set */ |
| || (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == 3) |
| || (GET_CODE (operands[1]) == REG && REGNO (operands[1]) == 3)) |
| && (arith_reg_operand (operands[0], SFmode) |
| || arith_reg_operand (operands[1], SFmode))" |
| "@ |
| mov %1,%0 |
| mov #0,%0 |
| mov.l %1,%0 |
| mov.l %1,%0 |
| mov.l %1,%0 |
| lds %1,%0 |
| sts %1,%0" |
| [(set_attr "type" "move,move,pcload,load,store,move,move")]) |
| |
| ;; We may not split the ry/yr/XX alternatives to movsi_ie, since |
| ;; update_flow_info would not know where to put REG_EQUAL notes |
| ;; when the destination changes mode. |
| (define_insn "movsf_ie" |
| [(set (match_operand:SF 0 "general_movdst_operand" |
| "=f,r,f,f,fy,f,m,r,r,m,f,y,y,rf,r,y,<,y,y") |
| (match_operand:SF 1 "general_movsrc_operand" |
| "f,r,G,H,FQ,mf,f,FQ,mr,r,y,f,>,fr,y,r,y,>,y")) |
| (use (match_operand:PSI 2 "fpscr_operand" "c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c")) |
| (clobber (match_scratch:SI 3 "=X,X,Bsc,Bsc,&z,X,X,X,X,X,X,X,X,y,X,X,X,X,X"))] |
| |
| "TARGET_SH2E |
| && (arith_reg_operand (operands[0], SFmode) |
| || arith_reg_operand (operands[1], SFmode) |
| || arith_reg_operand (operands[3], SImode) |
| || (fpul_operand (operands[0], SFmode) |
| && memory_operand (operands[1], SFmode) |
| && GET_CODE (XEXP (operands[1], 0)) == POST_INC) |
| || (fpul_operand (operands[1], SFmode) |
| && memory_operand (operands[0], SFmode) |
| && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC))" |
| "@ |
| fmov %1,%0 |
| mov %1,%0 |
| fldi0 %0 |
| fldi1 %0 |
| # |
| fmov.s %1,%0 |
| fmov.s %1,%0 |
| mov.l %1,%0 |
| mov.l %1,%0 |
| mov.l %1,%0 |
| fsts fpul,%0 |
| flds %1,fpul |
| lds.l %1,%0 |
| # |
| sts %1,%0 |
| lds %1,%0 |
| sts.l %1,%0 |
| lds.l %1,%0 |
| ! move optimized away" |
| [(set_attr "type" "fmove,move,fmove,fmove,pcfload,fload,store,pcload,load,store,fmove,fmove,load,*,fpul_gp,gp_fpul,store,load,nil") |
| (set_attr "late_fp_use" "*,*,*,*,*,*,yes,*,*,*,*,*,*,*,yes,*,yes,*,*") |
| (set_attr "length" "*,*,*,*,4,*,*,*,*,*,2,2,2,4,2,2,2,2,0") |
| (set (attr "fp_mode") (if_then_else (eq_attr "fmovd" "yes") |
| (const_string "single") |
| (const_string "none")))]) |
| |
| (define_split |
| [(set (match_operand:SF 0 "register_operand" "") |
| (match_operand:SF 1 "register_operand" "")) |
| (use (match_operand:PSI 2 "fpscr_operand" "")) |
| (clobber (reg:SI FPUL_REG))] |
| "TARGET_SH1" |
| [(parallel [(set (reg:SF FPUL_REG) (match_dup 1)) |
| (use (match_dup 2)) |
| (clobber (scratch:SI))]) |
| (parallel [(set (match_dup 0) (reg:SF FPUL_REG)) |
| (use (match_dup 2)) |
| (clobber (scratch:SI))])] |
| "") |
| |
| (define_expand "movsf" |
| [(set (match_operand:SF 0 "general_movdst_operand" "") |
| (match_operand:SF 1 "general_movsrc_operand" ""))] |
| "" |
| " |
| { |
| if (prepare_move_operands (operands, SFmode)) |
| DONE; |
| if (TARGET_SHMEDIA) |
| { |
| if (TARGET_SHMEDIA_FPU) |
| emit_insn (gen_movsf_media (operands[0], operands[1])); |
| else |
| emit_insn (gen_movsf_media_nofpu (operands[0], operands[1])); |
| DONE; |
| } |
| if (TARGET_SH2E) |
| { |
| emit_sf_insn (gen_movsf_ie (operands[0], operands[1], get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "mov_nop" |
| [(set (match_operand 0 "any_register_operand" "") (match_dup 0))] |
| "TARGET_SH2E" |
| "" |
| [(set_attr "length" "0") |
| (set_attr "type" "nil")]) |
| |
| (define_expand "reload_insf" |
| [(parallel [(set (match_operand:SF 0 "register_operand" "=a") |
| (match_operand:SF 1 "immediate_operand" "FQ")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (match_operand:SI 2 "register_operand" "=&z"))])] |
| "TARGET_SH1" |
| "") |
| |
| (define_expand "reload_insi" |
| [(parallel [(set (match_operand:SF 0 "register_operand" "=y") |
| (match_operand:SF 1 "immediate_operand" "FQ")) |
| (clobber (match_operand:SI 2 "register_operand" "=&z"))])] |
| "TARGET_SH1" |
| "") |
| |
| (define_insn "*movsi_y" |
| [(set (match_operand:SI 0 "register_operand" "=y,y") |
| (match_operand:SI 1 "immediate_operand" "Qi,I08")) |
| (clobber (match_scratch:SI 2 "=&z,r"))] |
| "TARGET_SH2E |
| && (reload_in_progress || reload_completed)" |
| "#" |
| [(set_attr "length" "4") |
| (set_attr "type" "pcload,move")]) |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (match_operand:SI 1 "immediate_operand" "")) |
| (clobber (match_operand:SI 2 "register_operand" ""))] |
| "TARGET_SH1" |
| [(set (match_dup 2) (match_dup 1)) |
| (set (match_dup 0) (match_dup 2))] |
| "") |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (match_operand:SI 1 "memory_operand" "")) |
| (clobber (reg:SI R0_REG))] |
| "TARGET_SH1" |
| [(set (match_dup 0) (match_dup 1))] |
| "") |
| |
| ;; ------------------------------------------------------------------------ |
| ;; Define the real conditional branch instructions. |
| ;; ------------------------------------------------------------------------ |
| |
| (define_insn "branch_true" |
| [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SH1" |
| "* return output_branch (1, insn, operands);" |
| [(set_attr "type" "cbranch")]) |
| |
| (define_insn "branch_false" |
| [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SH1" |
| "* return output_branch (0, insn, operands);" |
| [(set_attr "type" "cbranch")]) |
| |
| ;; Patterns to prevent reorg from re-combining a condbranch with a branch |
| ;; which destination is too far away. |
| ;; The const_int_operand is distinct for each branch target; it avoids |
| ;; unwanted matches with redundant_insn. |
| (define_insn "block_branch_redirect" |
| [(set (pc) (unspec [(match_operand 0 "const_int_operand" "")] UNSPEC_BBR))] |
| "TARGET_SH1" |
| "" |
| [(set_attr "length" "0")]) |
| |
| ;; This one has the additional purpose to record a possible scratch register |
| ;; for the following branch. |
| ;; ??? Unfortunately, just setting the scratch register is not good enough, |
| ;; because the insn then might be deemed dead and deleted. And we can't |
| ;; make the use in the jump insn explicit because that would disable |
| ;; delay slot scheduling from the target. |
| (define_insn "indirect_jump_scratch" |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (unspec:SI [(match_operand 1 "const_int_operand" "")] UNSPEC_BBR)) |
| (set (pc) (unspec [(const_int 0)] UNSPEC_BBR))] |
| "TARGET_SH1" |
| "" |
| [(set_attr "length" "0")]) |
| |
| ;; This one is used to preemt an insn from beyond the bra / braf / jmp |
| ;; being pulled into the delay slot of a condbranch that has been made to |
| ;; jump around the unconditional jump because it was out of range. |
| (define_insn "stuff_delay_slot" |
| [(set (pc) |
| (unspec [(match_operand 0 "const_int_operand" "") (pc)] UNSPEC_BBR)) |
| (set (reg:SI T_REG) (match_operand 1 "const_int_operand" ""))] |
| "TARGET_SH1" |
| "" |
| [(set_attr "length" "0") |
| (set_attr "cond_delay_slot" "yes")]) |
| |
| ;; Conditional branch insns |
| |
| (define_expand "beq_media" |
| [(set (pc) |
| (if_then_else (eq (match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "arith_operand" "r,I06")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_insn "*beq_media_i" |
| [(set (pc) |
| (if_then_else (match_operator 3 "equality_comparison_operator" |
| [(match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "arith_operand" "r,I06")]) |
| (match_operand:DI 0 "target_operand" "b,b") |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "@ |
| b%o3%' %1, %2, %0 |
| b%o3i%' %1, %2, %0" |
| [(set_attr "type" "cbranch_media")]) |
| |
| (define_expand "bne_media" |
| [(set (pc) |
| (if_then_else (ne (match_operand:DI 1 "arith_reg_operand" "r,r") |
| (match_operand:DI 2 "arith_operand" "r,I06")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_expand "bgt_media" |
| [(set (pc) |
| (if_then_else (gt (match_operand:DI 1 "arith_reg_or_0_operand" "r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "r")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_expand "bge_media" |
| [(set (pc) |
| (if_then_else (ge (match_operand:DI 1 "arith_reg_or_0_operand" "r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "r")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_expand "bgtu_media" |
| [(set (pc) |
| (if_then_else (gtu (match_operand:DI 1 "arith_reg_or_0_operand" "r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "r")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_expand "bgeu_media" |
| [(set (pc) |
| (if_then_else (geu (match_operand:DI 1 "arith_reg_or_0_operand" "r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "r")) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "") |
| |
| (define_insn "*bgt_media_i" |
| [(set (pc) |
| (if_then_else (match_operator 3 "greater_comparison_operator" |
| [(match_operand:DI 1 "arith_reg_or_0_operand" "rN") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN")]) |
| (match_operand:DI 0 "target_operand" "b") |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "b%o3%' %N1, %N2, %0" |
| [(set_attr "type" "cbranch_media")]) |
| |
| ;; These are only needed to make invert_jump() happy. |
| (define_insn "*blt_media_i" |
| [(set (pc) |
| (if_then_else (match_operator 3 "less_comparison_operator" |
| [(match_operand:DI 1 "arith_reg_or_0_operand" "rN") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rN")]) |
| (match_operand:DI 0 "target_operand" "b") |
| (pc)))] |
| "TARGET_SHMEDIA" |
| "b%o3%' %N2, %N1, %0" |
| [(set_attr "type" "cbranch_media")]) |
| |
| (define_expand "beq" |
| [(set (pc) |
| (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_seq (tmp)); |
| emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| emit_jump_insn (gen_beq_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| from_compare (operands, EQ); |
| }") |
| |
| (define_expand "bne" |
| [(set (pc) |
| (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_seq (tmp)); |
| emit_jump_insn (gen_beq_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| emit_jump_insn (gen_bne_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| from_compare (operands, EQ); |
| }") |
| |
| (define_expand "bgt" |
| [(set (pc) |
| (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_sgt (tmp)); |
| emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgt_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| from_compare (operands, GT); |
| }") |
| |
| (define_expand "blt" |
| [(set (pc) |
| (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_slt (tmp)); |
| emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgt_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| DONE; |
| } |
| |
| if (GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) |
| { |
| rtx tmp = sh_compare_op0; |
| sh_compare_op0 = sh_compare_op1; |
| sh_compare_op1 = tmp; |
| emit_insn (gen_bgt (operands[0])); |
| DONE; |
| } |
| from_compare (operands, GE); |
| }") |
| |
| (define_expand "ble" |
| [(set (pc) |
| (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_sle (tmp)); |
| emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bge_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| DONE; |
| } |
| |
| if (TARGET_SH2E |
| && TARGET_IEEE |
| && GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) |
| { |
| rtx tmp = sh_compare_op0; |
| sh_compare_op0 = sh_compare_op1; |
| sh_compare_op1 = tmp; |
| emit_insn (gen_bge (operands[0])); |
| DONE; |
| } |
| from_compare (operands, GT); |
| }") |
| |
| (define_expand "bge" |
| [(set (pc) |
| (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (sh_compare_op0) != DImode) |
| { |
| rtx tmp = gen_reg_rtx (DImode); |
| |
| emit_insn (gen_sge (tmp)); |
| emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); |
| DONE; |
| } |
| |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bge_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| if (TARGET_SH2E |
| && ! TARGET_IEEE |
| && GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) |
| { |
| rtx tmp = sh_compare_op0; |
| sh_compare_op0 = sh_compare_op1; |
| sh_compare_op1 = tmp; |
| emit_insn (gen_ble (operands[0])); |
| DONE; |
| } |
| from_compare (operands, GE); |
| }") |
| |
| (define_expand "bgtu" |
| [(set (pc) |
| (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgtu_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| from_compare (operands, GTU); |
| }") |
| |
| (define_expand "bltu" |
| [(set (pc) |
| (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgtu_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| DONE; |
| } |
| |
| from_compare (operands, GEU); |
| }") |
| |
| (define_expand "bgeu" |
| [(set (pc) |
| (if_then_else (ne (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgeu_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| |
| from_compare (operands, GEU); |
| }") |
| |
| (define_expand "bleu" |
| [(set (pc) |
| (if_then_else (eq (reg:SI T_REG) (const_int 0)) |
| (label_ref (match_operand 0 "" "")) |
| (pc)))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (sh_compare_op0 != const0_rtx) |
| sh_compare_op0 = force_reg (DImode, sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (DImode, sh_compare_op1); |
| emit_jump_insn (gen_bgeu_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| DONE; |
| } |
| |
| from_compare (operands, GTU); |
| }") |
| |
| (define_expand "bunordered" |
| [(set (match_dup 1) (unordered:DI (match_dup 2) (match_dup 3))) |
| (set (pc) |
| (if_then_else (ne (match_dup 1) (const_int 0)) |
| (label_ref:DI (match_operand 0 "" "")) |
| (pc)))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| operands[1] = gen_reg_rtx (DImode); |
| operands[2] = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| operands[3] = force_reg (GET_MODE (sh_compare_op1), sh_compare_op1); |
| }") |
| |
| ;; ------------------------------------------------------------------------ |
| ;; Jump and linkage insns |
| ;; ------------------------------------------------------------------------ |
| |
| (define_insn "jump_compact" |
| [(set (pc) |
| (label_ref (match_operand 0 "" "")))] |
| "TARGET_SH1" |
| "* |
| { |
| /* The length is 16 if the delay slot is unfilled. */ |
| if (get_attr_length(insn) > 4) |
| return output_far_jump(insn, operands[0]); |
| else |
| return \"bra %l0%#\"; |
| }" |
| [(set_attr "type" "jump") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| ;; ??? It would be much saner to explicitly use the scratch register |
| ;; in the jump insn, and have indirect_jump_scratch only set it, |
| ;; but fill_simple_delay_slots would refuse to do delay slot filling |
| ;; from the target then, as it uses simplejump_p. |
| ;;(define_insn "jump_compact_far" |
| ;; [(set (pc) |
| ;; (label_ref (match_operand 0 "" ""))) |
| ;; (use (match_operand 1 "register_operand" "r")] |
| ;; "TARGET_SH1" |
| ;; "* return output_far_jump(insn, operands[0], operands[1]);" |
| ;; [(set_attr "type" "jump") |
| ;; (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "jump_media" |
| [(set (pc) |
| (match_operand:DI 0 "target_operand" "b"))] |
| "TARGET_SHMEDIA" |
| "blink %0, r63" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_expand "jump" |
| [(set (pc) |
| (label_ref (match_operand 0 "" "")))] |
| "" |
| " |
| { |
| if (TARGET_SH1) |
| emit_jump_insn (gen_jump_compact (operands[0])); |
| else if (TARGET_SHMEDIA) |
| { |
| if (reload_in_progress || reload_completed) |
| FAIL; |
| emit_jump_insn (gen_jump_media (gen_rtx_LABEL_REF (DImode, |
| operands[0]))); |
| } |
| DONE; |
| }") |
| |
| (define_insn "force_mode_for_call" |
| [(use (reg:PSI FPSCR_REG))] |
| "TARGET_SHCOMPACT" |
| "" |
| [(set_attr "length" "0") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double")))]) |
| |
| (define_insn "calli" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SH1" |
| "jsr @%0%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| ;; This is a pc-rel call, using bsrf, for use with PIC. |
| |
| (define_insn "calli_pcrel" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (use (match_operand 2 "" "")) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SH2" |
| "bsrf %0\\n%O2:%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| (define_insn_and_split "call_pcrel" |
| [(call (mem:SI (match_operand:SI 0 "symbol_ref_operand" "")) |
| (match_operand 1 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (match_scratch:SI 2 "=r"))] |
| "TARGET_SH2" |
| "#" |
| "reload_completed" |
| [(const_int 0)] |
| " |
| { |
| rtx lab = PATTERN (gen_call_site ()); |
| |
| if (SYMBOL_REF_LOCAL_P (operands[0])) |
| emit_insn (gen_sym_label2reg (operands[2], operands[0], lab)); |
| else |
| emit_insn (gen_symPLT_label2reg (operands[2], operands[0], lab)); |
| emit_call_insn (gen_calli_pcrel (operands[2], operands[1], lab)); |
| DONE; |
| }" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| (define_insn "call_compact" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && ! (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%0%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_compact_rettramp" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI R10_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%0%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_media" |
| [(call (mem:DI (match_operand:DI 0 "target_reg_operand" "b")) |
| (match_operand 1 "" "")) |
| (clobber (reg:DI PR_MEDIA_REG))] |
| "TARGET_SHMEDIA" |
| "blink %0, r18" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_insn "call_valuei" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SH1" |
| "jsr @%1%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| (define_insn "call_valuei_pcrel" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (use (match_operand 3 "" "")) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SH2" |
| "bsrf %1\\n%O3:%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| (define_insn_and_split "call_value_pcrel" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "symbol_ref_operand" "")) |
| (match_operand 2 "" ""))) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (match_scratch:SI 3 "=r"))] |
| "TARGET_SH2" |
| "#" |
| "reload_completed" |
| [(const_int 0)] |
| " |
| { |
| rtx lab = PATTERN (gen_call_site ()); |
| |
| if (SYMBOL_REF_LOCAL_P (operands[1])) |
| emit_insn (gen_sym_label2reg (operands[3], operands[1], lab)); |
| else |
| emit_insn (gen_symPLT_label2reg (operands[3], operands[1], lab)); |
| emit_call_insn (gen_call_valuei_pcrel (operands[0], operands[3], |
| operands[2], lab)); |
| DONE; |
| }" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes") |
| (set_attr "fp_set" "unknown")]) |
| |
| (define_insn "call_value_compact" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (match_operand 3 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && ! (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%1%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_value_compact_rettramp" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (match_operand 3 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI R10_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%1%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_value_media" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:DI (match_operand:DI 1 "target_reg_operand" "b")) |
| (match_operand 2 "" ""))) |
| (clobber (reg:DI PR_MEDIA_REG))] |
| "TARGET_SHMEDIA" |
| "blink %1, r18" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_expand "call" |
| [(parallel [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "" "") |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| operands[0] = XEXP (operands[0], 0); |
| if (flag_pic && GET_CODE (operands[0]) == SYMBOL_REF) |
| { |
| if (! SYMBOL_REF_LOCAL_P (operands[0])) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[0])); |
| operands[0] = reg; |
| } |
| else |
| { |
| operands[0] = gen_sym2PIC (operands[0]); |
| PUT_MODE (operands[0], Pmode); |
| } |
| } |
| if (GET_MODE (operands[0]) == SImode) |
| { |
| if (GET_CODE (operands[0]) == REG) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| else if (GET_CODE (operands[0]) == SUBREG) |
| { |
| operands[0] = SUBREG_REG (operands[0]); |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| } |
| else |
| { |
| operands[0] = shallow_copy_rtx (operands[0]); |
| PUT_MODE (operands[0], DImode); |
| } |
| } |
| if (! target_reg_operand (operands[0], DImode)) |
| operands[0] = copy_to_mode_reg (DImode, operands[0]); |
| emit_call_insn (gen_call_media (operands[0], operands[1])); |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && operands[2] && INTVAL (operands[2])) |
| { |
| rtx cookie_rtx = operands[2]; |
| long cookie = INTVAL (cookie_rtx); |
| rtx func = XEXP (operands[0], 0); |
| rtx r0, r1; |
| |
| if (flag_pic) |
| { |
| if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, func)); |
| func = reg; |
| } |
| else |
| func = legitimize_pic_address (func, Pmode, 0); |
| } |
| |
| r0 = gen_rtx_REG (SImode, R0_REG); |
| r1 = gen_rtx_REG (SImode, R1_REG); |
| |
| /* Since such a call function may use all call-clobbered |
| registers, we force a mode switch earlier, so that we don't |
| run out of registers when adjusting fpscr for the call. */ |
| emit_insn (gen_force_mode_for_call ()); |
| |
| operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); |
| if (flag_pic) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[0])); |
| operands[0] = reg; |
| } |
| operands[0] = force_reg (SImode, operands[0]); |
| |
| emit_move_insn (r0, func); |
| emit_move_insn (r1, cookie_rtx); |
| |
| if (cookie & CALL_COOKIE_RET_TRAMP (1)) |
| emit_call_insn (gen_call_compact_rettramp (operands[0], operands[1], |
| operands[2])); |
| else |
| emit_call_insn (gen_call_compact (operands[0], operands[1], |
| operands[2])); |
| |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && flag_pic |
| && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF |
| && ! SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, XEXP (operands[0], 0))); |
| XEXP (operands[0], 0) = reg; |
| } |
| if (flag_pic && TARGET_SH2 |
| && GET_CODE (operands[0]) == MEM |
| && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF) |
| { |
| emit_call_insn (gen_call_pcrel (XEXP (operands[0], 0), operands[1])); |
| DONE; |
| } |
| else |
| { |
| operands[0] = force_reg (SImode, XEXP (operands[0], 0)); |
| operands[1] = operands[2]; |
| } |
| |
| emit_call_insn (gen_calli (operands[0], operands[1])); |
| DONE; |
| }") |
| |
| (define_insn "call_pop_compact" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "immediate_operand" "n") |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 3 "immediate_operand" "n"))) |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && ! (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%0%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_pop_compact_rettramp" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "immediate_operand" "n") |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 3 "immediate_operand" "n"))) |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI R10_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%0%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "call_pop" |
| [(parallel [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "" "") |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 3 "" "")))])] |
| "TARGET_SHCOMPACT" |
| " |
| { |
| if (operands[2] && INTVAL (operands[2])) |
| { |
| rtx cookie_rtx = operands[2]; |
| long cookie = INTVAL (cookie_rtx); |
| rtx func = XEXP (operands[0], 0); |
| rtx r0, r1; |
| |
| if (flag_pic) |
| { |
| if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, func)); |
| func = reg; |
| } |
| else |
| func = legitimize_pic_address (func, Pmode, 0); |
| } |
| |
| r0 = gen_rtx_REG (SImode, R0_REG); |
| r1 = gen_rtx_REG (SImode, R1_REG); |
| |
| /* Since such a call function may use all call-clobbered |
| registers, we force a mode switch earlier, so that we don't |
| run out of registers when adjusting fpscr for the call. */ |
| emit_insn (gen_force_mode_for_call ()); |
| |
| operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); |
| if (flag_pic) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[0])); |
| operands[0] = reg; |
| } |
| operands[0] = force_reg (SImode, operands[0]); |
| |
| emit_move_insn (r0, func); |
| emit_move_insn (r1, cookie_rtx); |
| |
| if (cookie & CALL_COOKIE_RET_TRAMP (1)) |
| emit_call_insn (gen_call_pop_compact_rettramp |
| (operands[0], operands[1], operands[2], operands[3])); |
| else |
| emit_call_insn (gen_call_pop_compact |
| (operands[0], operands[1], operands[2], operands[3])); |
| |
| DONE; |
| } |
| |
| abort (); |
| }") |
| |
| (define_expand "call_value" |
| [(parallel [(set (match_operand 0 "arith_reg_operand" "") |
| (call (mem:SI (match_operand 1 "arith_reg_operand" "")) |
| (match_operand 2 "" ""))) |
| (match_operand 3 "" "") |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| operands[1] = XEXP (operands[1], 0); |
| if (flag_pic && GET_CODE (operands[1]) == SYMBOL_REF) |
| { |
| if (! SYMBOL_REF_LOCAL_P (operands[1])) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[1])); |
| operands[1] = reg; |
| } |
| else |
| { |
| operands[1] = gen_sym2PIC (operands[1]); |
| PUT_MODE (operands[1], Pmode); |
| } |
| } |
| if (GET_MODE (operands[1]) == SImode) |
| { |
| if (GET_CODE (operands[1]) == REG) |
| operands[1] = gen_rtx_SUBREG (DImode, operands[1], 0); |
| else if (GET_CODE (operands[1]) == SUBREG) |
| { |
| operands[1] = SUBREG_REG (operands[1]); |
| if (GET_MODE (operands[1]) != DImode) |
| operands[1] = gen_rtx_SUBREG (DImode, operands[1], 0); |
| } |
| else |
| { |
| operands[1] = shallow_copy_rtx (operands[1]); |
| PUT_MODE (operands[1], DImode); |
| } |
| } |
| if (! target_reg_operand (operands[1], DImode)) |
| operands[1] = copy_to_mode_reg (DImode, operands[1]); |
| emit_call_insn (gen_call_value_media (operands[0], operands[1], |
| operands[2])); |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && operands[3] && INTVAL (operands[3])) |
| { |
| rtx cookie_rtx = operands[3]; |
| long cookie = INTVAL (cookie_rtx); |
| rtx func = XEXP (operands[1], 0); |
| rtx r0, r1; |
| |
| if (flag_pic) |
| { |
| if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, func)); |
| func = reg; |
| } |
| else |
| func = legitimize_pic_address (func, Pmode, 0); |
| } |
| |
| r0 = gen_rtx_REG (SImode, R0_REG); |
| r1 = gen_rtx_REG (SImode, R1_REG); |
| |
| /* Since such a call function may use all call-clobbered |
| registers, we force a mode switch earlier, so that we don't |
| run out of registers when adjusting fpscr for the call. */ |
| emit_insn (gen_force_mode_for_call ()); |
| |
| operands[1] = function_symbol (\"__GCC_shcompact_call_trampoline\"); |
| if (flag_pic) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[1])); |
| operands[1] = reg; |
| } |
| operands[1] = force_reg (SImode, operands[1]); |
| |
| emit_move_insn (r0, func); |
| emit_move_insn (r1, cookie_rtx); |
| |
| if (cookie & CALL_COOKIE_RET_TRAMP (1)) |
| emit_call_insn (gen_call_value_compact_rettramp (operands[0], |
| operands[1], |
| operands[2], |
| operands[3])); |
| else |
| emit_call_insn (gen_call_value_compact (operands[0], operands[1], |
| operands[2], operands[3])); |
| |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && flag_pic |
| && GET_CODE (XEXP (operands[1], 0)) == SYMBOL_REF |
| && ! SYMBOL_REF_LOCAL_P (XEXP (operands[1], 0))) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, XEXP (operands[1], 0))); |
| XEXP (operands[1], 0) = reg; |
| } |
| if (flag_pic && TARGET_SH2 |
| && GET_CODE (operands[1]) == MEM |
| && GET_CODE (XEXP (operands[1], 0)) == SYMBOL_REF) |
| { |
| emit_call_insn (gen_call_value_pcrel (operands[0], XEXP (operands[1], 0), |
| operands[2])); |
| DONE; |
| } |
| else |
| operands[1] = force_reg (SImode, XEXP (operands[1], 0)); |
| |
| emit_call_insn (gen_call_valuei (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "sibcalli" |
| [(call (mem:SI (match_operand:SI 0 "register_operand" "k")) |
| (match_operand 1 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (return)] |
| "TARGET_SH1" |
| "jmp @%0%#" |
| [(set_attr "needs_delay_slot" "yes") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "type" "jump_ind")]) |
| |
| (define_insn "sibcalli_pcrel" |
| [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "k")) |
| (match_operand 1 "" "")) |
| (use (match_operand 2 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (return)] |
| "TARGET_SH2" |
| "braf %0\\n%O2:%#" |
| [(set_attr "needs_delay_slot" "yes") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "type" "jump_ind")]) |
| |
| (define_insn_and_split "sibcall_pcrel" |
| [(call (mem:SI (match_operand:SI 0 "symbol_ref_operand" "")) |
| (match_operand 1 "" "")) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (match_scratch:SI 2 "=k")) |
| (return)] |
| "TARGET_SH2" |
| "#" |
| "reload_completed" |
| [(const_int 0)] |
| " |
| { |
| rtx lab = PATTERN (gen_call_site ()); |
| rtx call_insn; |
| |
| emit_insn (gen_sym_label2reg (operands[2], operands[0], lab)); |
| call_insn = emit_call_insn (gen_sibcalli_pcrel (operands[2], operands[1], |
| lab)); |
| SIBLING_CALL_P (call_insn) = 1; |
| DONE; |
| }" |
| [(set_attr "needs_delay_slot" "yes") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "type" "jump_ind")]) |
| |
| (define_insn "sibcall_compact" |
| [(call (mem:SI (match_operand:SI 0 "register_operand" "k,k")) |
| (match_operand 1 "" "")) |
| (return) |
| (use (match_operand:SI 2 "register_operand" "z,x")) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| ;; We want to make sure the `x' above will only match MACH_REG |
| ;; because sibcall_epilogue may clobber MACL_REG. |
| (clobber (reg:SI MACL_REG))] |
| "TARGET_SHCOMPACT" |
| "@ |
| jmp @%0%# |
| jmp @%0\\n sts %2, r0" |
| [(set_attr "needs_delay_slot" "yes,no") |
| (set_attr "length" "2,4") |
| (set (attr "fp_mode") (const_string "single")) |
| (set_attr "type" "jump_ind")]) |
| |
| (define_insn "sibcall_media" |
| [(call (mem:DI (match_operand:DI 0 "target_reg_operand" "k")) |
| (match_operand 1 "" "")) |
| (use (reg:SI PR_MEDIA_REG)) |
| (return)] |
| "TARGET_SHMEDIA" |
| "blink %0, r63" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_expand "sibcall" |
| [(parallel |
| [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) |
| (match_operand 1 "" "")) |
| (match_operand 2 "" "") |
| (use (reg:PSI FPSCR_REG)) |
| (return)])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| operands[0] = XEXP (operands[0], 0); |
| if (flag_pic && GET_CODE (operands[0]) == SYMBOL_REF) |
| { |
| if (! SYMBOL_REF_LOCAL_P (operands[0])) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| /* We must not use GOTPLT for sibcalls, because PIC_REG |
| must be restored before the PLT code gets to run. */ |
| emit_insn (gen_symGOT2reg (reg, operands[0])); |
| operands[0] = reg; |
| } |
| else |
| { |
| operands[0] = gen_sym2PIC (operands[0]); |
| PUT_MODE (operands[0], Pmode); |
| } |
| } |
| if (GET_MODE (operands[0]) == SImode) |
| { |
| if (GET_CODE (operands[0]) == REG) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| else if (GET_CODE (operands[0]) == SUBREG) |
| { |
| operands[0] = SUBREG_REG (operands[0]); |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| } |
| else |
| { |
| operands[0] = shallow_copy_rtx (operands[0]); |
| PUT_MODE (operands[0], DImode); |
| } |
| } |
| if (! target_reg_operand (operands[0], DImode)) |
| operands[0] = copy_to_mode_reg (DImode, operands[0]); |
| emit_call_insn (gen_sibcall_media (operands[0], operands[1])); |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && operands[2] |
| && (INTVAL (operands[2]) & ~ CALL_COOKIE_RET_TRAMP (1))) |
| { |
| rtx cookie_rtx = operands[2]; |
| long cookie = INTVAL (cookie_rtx); |
| rtx func = XEXP (operands[0], 0); |
| rtx mach, r1; |
| |
| if (flag_pic) |
| { |
| if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOT2reg (reg, func)); |
| func = reg; |
| } |
| else |
| func = legitimize_pic_address (func, Pmode, 0); |
| } |
| |
| /* FIXME: if we could tell whether all argument registers are |
| already taken, we could decide whether to force the use of |
| MACH_REG or to stick to R0_REG. Unfortunately, there's no |
| simple way to tell. We could use the CALL_COOKIE, but we |
| can't currently tell a register used for regular argument |
| passing from one that is unused. If we leave it up to reload |
| to decide which register to use, it seems to always choose |
| R0_REG, which leaves no available registers in SIBCALL_REGS |
| to hold the address of the trampoline. */ |
| mach = gen_rtx_REG (SImode, MACH_REG); |
| r1 = gen_rtx_REG (SImode, R1_REG); |
| |
| /* Since such a call function may use all call-clobbered |
| registers, we force a mode switch earlier, so that we don't |
| run out of registers when adjusting fpscr for the call. */ |
| emit_insn (gen_force_mode_for_call ()); |
| |
| operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); |
| if (flag_pic) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOT2reg (reg, operands[0])); |
| operands[0] = reg; |
| } |
| operands[0] = force_reg (SImode, operands[0]); |
| |
| /* We don't need a return trampoline, since the callee will |
| return directly to the upper caller. */ |
| if (cookie & CALL_COOKIE_RET_TRAMP (1)) |
| { |
| cookie &= ~ CALL_COOKIE_RET_TRAMP (1); |
| cookie_rtx = GEN_INT (cookie); |
| } |
| |
| emit_move_insn (mach, func); |
| emit_move_insn (r1, cookie_rtx); |
| |
| emit_call_insn (gen_sibcall_compact (operands[0], operands[1], mach)); |
| DONE; |
| } |
| else if (TARGET_SHCOMPACT && flag_pic |
| && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF |
| && ! SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOT2reg (reg, XEXP (operands[0], 0))); |
| XEXP (operands[0], 0) = reg; |
| } |
| if (flag_pic && TARGET_SH2 |
| && GET_CODE (operands[0]) == MEM |
| && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF |
| /* The PLT needs the PIC register, but the epilogue would have |
| to restore it, so we can only use PC-relative PIC calls for |
| static functions. */ |
| && SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) |
| { |
| emit_call_insn (gen_sibcall_pcrel (XEXP (operands[0], 0), operands[1])); |
| DONE; |
| } |
| else |
| operands[0] = force_reg (SImode, XEXP (operands[0], 0)); |
| |
| emit_call_insn (gen_sibcalli (operands[0], operands[1])); |
| DONE; |
| }") |
| |
| (define_expand "sibcall_value" |
| [(set (match_operand 0 "" "") |
| (call (match_operand 1 "" "") |
| (match_operand 2 "" ""))) |
| (match_operand 3 "" "")] |
| "" |
| " |
| { |
| emit_call_insn (gen_sibcall (operands[1], operands[2], operands[3])); |
| DONE; |
| }") |
| |
| (define_insn "call_value_pop_compact" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 4 "immediate_operand" "n"))) |
| (match_operand 3 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && ! (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%1%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "call_value_pop_compact_rettramp" |
| [(set (match_operand 0 "" "=rf") |
| (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) |
| (match_operand 2 "" ""))) |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 4 "immediate_operand" "n"))) |
| (match_operand 3 "immediate_operand" "n") |
| (use (reg:SI R0_REG)) |
| (use (reg:SI R1_REG)) |
| (use (reg:PSI FPSCR_REG)) |
| (clobber (reg:SI R10_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT && (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" |
| "jsr @%1%#" |
| [(set_attr "type" "call") |
| (set (attr "fp_mode") |
| (if_then_else (eq_attr "fpu_single" "yes") |
| (const_string "single") (const_string "double"))) |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "call_value_pop" |
| [(parallel [(set (match_operand 0 "arith_reg_operand" "") |
| (call (mem:SI (match_operand 1 "arith_reg_operand" "")) |
| (match_operand 2 "" ""))) |
| (match_operand 3 "" "") |
| (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) |
| (match_operand 4 "" "")))])] |
| "TARGET_SHCOMPACT" |
| " |
| { |
| if (TARGET_SHCOMPACT && operands[3] && INTVAL (operands[3])) |
| { |
| rtx cookie_rtx = operands[3]; |
| long cookie = INTVAL (cookie_rtx); |
| rtx func = XEXP (operands[1], 0); |
| rtx r0, r1; |
| |
| if (flag_pic) |
| { |
| if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, func)); |
| func = reg; |
| } |
| else |
| func = legitimize_pic_address (func, Pmode, 0); |
| } |
| |
| r0 = gen_rtx_REG (SImode, R0_REG); |
| r1 = gen_rtx_REG (SImode, R1_REG); |
| |
| /* Since such a call function may use all call-clobbered |
| registers, we force a mode switch earlier, so that we don't |
| run out of registers when adjusting fpscr for the call. */ |
| emit_insn (gen_force_mode_for_call ()); |
| |
| operands[1] = function_symbol (\"__GCC_shcompact_call_trampoline\"); |
| if (flag_pic) |
| { |
| rtx reg = gen_reg_rtx (Pmode); |
| |
| emit_insn (gen_symGOTPLT2reg (reg, operands[1])); |
| operands[1] = reg; |
| } |
| operands[1] = force_reg (SImode, operands[1]); |
| |
| emit_move_insn (r0, func); |
| emit_move_insn (r1, cookie_rtx); |
| |
| if (cookie & CALL_COOKIE_RET_TRAMP (1)) |
| emit_call_insn (gen_call_value_pop_compact_rettramp |
| (operands[0], operands[1], operands[2], |
| operands[3], operands[4])); |
| else |
| emit_call_insn (gen_call_value_pop_compact |
| (operands[0], operands[1], operands[2], |
| operands[3], operands[4])); |
| |
| DONE; |
| } |
| |
| abort (); |
| }") |
| |
| (define_expand "sibcall_epilogue" |
| [(return)] |
| "" |
| " |
| { |
| sh_expand_epilogue (1); |
| if (TARGET_SHCOMPACT) |
| { |
| rtx insn, set; |
| |
| /* If epilogue clobbers r0, preserve it in macl. */ |
| for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) |
| if ((set = single_set (insn)) |
| && GET_CODE (SET_DEST (set)) == REG |
| && REGNO (SET_DEST (set)) == R0_REG) |
| { |
| rtx r0 = gen_rtx_REG (SImode, R0_REG); |
| rtx tmp = gen_rtx_REG (SImode, MACL_REG); |
| rtx i; |
| |
| /* We can't tell at this point whether the sibcall is a |
| sibcall_compact and, if it is, whether it uses r0 or |
| mach as operand 2, so let the instructions that |
| preserve r0 be optimized away if r0 turns out to be |
| dead. */ |
| i = emit_insn_before (gen_rtx_SET (SImode, tmp, r0), insn); |
| REG_NOTES (i) = gen_rtx_EXPR_LIST (REG_MAYBE_DEAD, const0_rtx, |
| REG_NOTES (i)); |
| i = emit_move_insn (r0, tmp); |
| REG_NOTES (i) = gen_rtx_EXPR_LIST (REG_MAYBE_DEAD, const0_rtx, |
| REG_NOTES (i)); |
| break; |
| } |
| } |
| DONE; |
| }") |
| |
| (define_insn "indirect_jump_compact" |
| [(set (pc) |
| (match_operand:SI 0 "arith_reg_operand" "r"))] |
| "TARGET_SH1" |
| "jmp @%0%#" |
| [(set_attr "needs_delay_slot" "yes") |
| (set_attr "type" "jump_ind")]) |
| |
| (define_expand "indirect_jump" |
| [(set (pc) |
| (match_operand 0 "register_operand" ""))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA && GET_MODE (operands[0]) == SImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| }") |
| |
| ;; The use of operand 1 / 2 helps us distinguish case table jumps |
| ;; which can be present in structured code from indirect jumps which can not |
| ;; be present in structured code. This allows -fprofile-arcs to work. |
| |
| ;; For SH1 processors. |
| (define_insn "casesi_jump_1" |
| [(set (pc) |
| (match_operand:SI 0 "register_operand" "r")) |
| (use (label_ref (match_operand 1 "" "")))] |
| "TARGET_SH1" |
| "jmp @%0%#" |
| [(set_attr "needs_delay_slot" "yes") |
| (set_attr "type" "jump_ind")]) |
| |
| ;; For all later processors. |
| (define_insn "casesi_jump_2" |
| [(set (pc) (plus:SI (match_operand:SI 0 "register_operand" "r") |
| (label_ref (match_operand 1 "" "")))) |
| (use (label_ref (match_operand 2 "" "")))] |
| "TARGET_SH2 |
| && (! INSN_UID (operands[1]) || prev_real_insn (operands[1]) == insn)" |
| "braf %0%#" |
| [(set_attr "needs_delay_slot" "yes") |
| (set_attr "type" "jump_ind")]) |
| |
| (define_insn "casesi_jump_media" |
| [(set (pc) (match_operand:DI 0 "target_reg_operand" "b")) |
| (use (label_ref (match_operand 1 "" "")))] |
| "TARGET_SHMEDIA" |
| "blink %0, r63" |
| [(set_attr "type" "jump_media")]) |
| |
| ;; Call subroutine returning any type. |
| ;; ??? This probably doesn't work. |
| |
| (define_expand "untyped_call" |
| [(parallel [(call (match_operand 0 "" "") |
| (const_int 0)) |
| (match_operand 1 "" "") |
| (match_operand 2 "" "")])] |
| "TARGET_SH2E || TARGET_SHMEDIA" |
| " |
| { |
| int i; |
| |
| emit_call_insn (gen_call (operands[0], const0_rtx, const0_rtx)); |
| |
| for (i = 0; i < XVECLEN (operands[2], 0); i++) |
| { |
| rtx set = XVECEXP (operands[2], 0, i); |
| emit_move_insn (SET_DEST (set), SET_SRC (set)); |
| } |
| |
| /* The optimizer does not know that the call sets the function value |
| registers we stored in the result block. We avoid problems by |
| claiming that all hard registers are used and clobbered at this |
| point. */ |
| emit_insn (gen_blockage ()); |
| |
| DONE; |
| }") |
| |
| ;; ------------------------------------------------------------------------ |
| ;; Misc insns |
| ;; ------------------------------------------------------------------------ |
| |
| (define_insn "dect" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:SI 0 "arith_reg_operand" "+r") (const_int 1))) |
| (set (match_dup 0) (plus:SI (match_dup 0) (const_int -1)))] |
| "TARGET_SH2" |
| "dt %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_insn "nop" |
| [(const_int 0)] |
| "" |
| "nop") |
| |
| ;; Load address of a label. This is only generated by the casesi expand, |
| ;; and by machine_dependent_reorg (fixing up fp moves). |
| ;; This must use unspec, because this only works for labels that are |
| ;; within range, |
| |
| (define_insn "mova" |
| [(set (reg:SI R0_REG) |
| (unspec:SI [(label_ref (match_operand 0 "" ""))] UNSPEC_MOVA))] |
| "TARGET_SH1" |
| "mova %O0,r0" |
| [(set_attr "in_delay_slot" "no") |
| (set_attr "type" "arith")]) |
| |
| ;; machine_dependent_reorg will make this a `mova'. |
| (define_insn "mova_const" |
| [(set (reg:SI R0_REG) |
| (unspec:SI [(match_operand 0 "immediate_operand" "i")] UNSPEC_MOVA))] |
| "TARGET_SH1" |
| "#" |
| [(set_attr "in_delay_slot" "no") |
| (set_attr "type" "arith")]) |
| |
| (define_expand "GOTaddr2picreg" |
| [(set (reg:SI R0_REG) |
| (unspec:SI [(const:SI (unspec:SI [(match_dup 1)] UNSPEC_PIC))] |
| UNSPEC_MOVA)) |
| (set (match_dup 0) (const:SI (unspec:SI [(match_dup 1)] UNSPEC_PIC))) |
| (set (match_dup 0) (plus:SI (match_dup 0) (reg:SI R0_REG)))] |
| "" " |
| { |
| operands[0] = gen_rtx_REG (Pmode, PIC_REG); |
| operands[1] = gen_rtx_SYMBOL_REF (VOIDmode, GOT_SYMBOL_NAME); |
| |
| if (TARGET_SH5) |
| operands[1] = gen_datalabel_ref (operands[1]); |
| |
| if (TARGET_SHMEDIA) |
| { |
| rtx tr = gen_rtx_REG (DImode, TR0_REG); |
| rtx dipic = operands[0]; |
| rtx lab = PATTERN (gen_call_site ()); |
| rtx insn, equiv; |
| |
| equiv = operands[1]; |
| operands[1] = gen_rtx_MINUS (DImode, |
| operands[1], |
| gen_rtx_CONST |
| (DImode, |
| gen_rtx_MINUS (DImode, |
| gen_rtx_CONST (DImode, |
| lab), |
| pc_rtx))); |
| operands[1] = gen_sym2PIC (operands[1]); |
| PUT_MODE (operands[1], DImode); |
| |
| if (GET_MODE (dipic) != DImode) |
| dipic = gen_rtx_SUBREG (DImode, dipic, 0); |
| |
| if (TARGET_SHMEDIA64) |
| emit_insn (gen_movdi_const (dipic, operands[1])); |
| else |
| emit_insn (gen_movdi_const_32bit (dipic, operands[1])); |
| |
| emit_insn (gen_ptrel (tr, dipic, lab)); |
| |
| if (GET_MODE (operands[0]) != GET_MODE (tr)) |
| tr = gen_lowpart (GET_MODE (operands[0]), tr); |
| |
| insn = emit_move_insn (operands[0], tr); |
| |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, equiv, |
| REG_NOTES (insn)); |
| |
| DONE; |
| } |
| } |
| ") |
| |
| (define_insn "*ptb" |
| [(set (match_operand:DI 0 "target_reg_operand" "=b") |
| (const:DI (unspec:DI [(match_operand:DI 1 "" "Csy")] |
| UNSPEC_DATALABEL)))] |
| "TARGET_SHMEDIA && flag_pic |
| && EXTRA_CONSTRAINT_Csy (operands[1])" |
| "ptb/u datalabel %1, %0" |
| [(set_attr "type" "pt_media") |
| (set_attr "length" "*")]) |
| |
| (define_insn "ptrel" |
| [(set (match_operand:DI 0 "target_reg_operand" "=b") |
| (plus:DI (match_operand:DI 1 "register_operand" "r") |
| (pc))) |
| (match_operand:DI 2 "" "")] |
| "TARGET_SHMEDIA" |
| "%O2: ptrel/u %1, %0" |
| [(set_attr "type" "ptabs_media")]) |
| |
| (define_expand "builtin_setjmp_receiver" |
| [(match_operand 0 "" "")] |
| "flag_pic" |
| " |
| { |
| emit_insn (gen_GOTaddr2picreg ()); |
| DONE; |
| }") |
| |
| (define_expand "call_site" |
| [(unspec [(match_dup 0)] UNSPEC_CALLER)] |
| "TARGET_SH1" |
| " |
| { |
| static HOST_WIDE_INT i = 0; |
| operands[0] = GEN_INT (i); |
| i++; |
| }") |
| |
| (define_expand "sym_label2reg" |
| [(set (match_operand:SI 0 "" "") |
| (const:SI (minus:SI |
| (const:SI |
| (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_PIC)) |
| (const:SI |
| (plus:SI |
| (match_operand:SI 2 "" "") |
| (const_int 2))))))] |
| "TARGET_SH1" "") |
| |
| (define_expand "symGOT_load" |
| [(set (match_dup 2) (match_operand 1 "" "")) |
| (set (match_dup 3) (plus (match_dup 2) (reg PIC_REG))) |
| (set (match_operand 0 "" "") (mem (match_dup 3)))] |
| "" |
| " |
| { |
| rtx insn; |
| |
| operands[2] = no_new_pseudos ? operands[0] : gen_reg_rtx (Pmode); |
| operands[3] = no_new_pseudos ? operands[0] : gen_reg_rtx (Pmode); |
| |
| if (TARGET_SHMEDIA) |
| { |
| rtx reg = operands[2]; |
| |
| if (GET_MODE (reg) != DImode) |
| reg = gen_rtx_SUBREG (DImode, reg, 0); |
| |
| if (flag_pic > 1) |
| emit_insn (gen_movdi_const_32bit (reg, operands[1])); |
| else |
| emit_insn (gen_movdi_const_16bit (reg, operands[1])); |
| } |
| else |
| emit_move_insn (operands[2], operands[1]); |
| |
| emit_move_insn (operands[3], gen_rtx_PLUS (Pmode, |
| operands[2], |
| gen_rtx_REG (Pmode, PIC_REG))); |
| |
| insn = emit_move_insn (operands[0], gen_rtx_MEM (Pmode, operands[3])); |
| |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, XVECEXP (XEXP (operands[1], |
| 0), 0, 0), |
| REG_NOTES (insn)); |
| |
| DONE; |
| }") |
| |
| (define_expand "sym2GOT" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOT))] |
| "" |
| "") |
| |
| (define_expand "symGOT2reg" |
| [(match_operand 0 "" "") (match_operand 1 "" "")] |
| "" |
| " |
| { |
| rtx gotsym, insn; |
| |
| gotsym = gen_sym2GOT (operands[1]); |
| PUT_MODE (gotsym, Pmode); |
| insn = emit_insn (gen_symGOT_load (operands[0], gotsym)); |
| |
| RTX_UNCHANGING_P (SET_SRC (PATTERN (insn))) = 1; |
| |
| DONE; |
| }") |
| |
| (define_expand "sym2GOTPLT" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTPLT))] |
| "" |
| "") |
| |
| (define_expand "symGOTPLT2reg" |
| [(match_operand 0 "" "") (match_operand 1 "" "")] |
| "" |
| " |
| { |
| emit_insn (gen_symGOT_load (operands[0], gen_sym2GOTPLT (operands[1]))); |
| DONE; |
| }") |
| |
| (define_expand "sym2GOTOFF" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTOFF))] |
| "" |
| "") |
| |
| (define_expand "symGOTOFF2reg" |
| [(match_operand 0 "" "") (match_operand 1 "" "")] |
| "" |
| " |
| { |
| rtx gotoffsym, insn; |
| rtx t = no_new_pseudos ? operands[0] : gen_reg_rtx (GET_MODE (operands[0])); |
| |
| gotoffsym = gen_sym2GOTOFF (operands[1]); |
| PUT_MODE (gotoffsym, Pmode); |
| emit_move_insn (t, gotoffsym); |
| insn = emit_move_insn (operands[0], |
| gen_rtx_PLUS (Pmode, t, |
| gen_rtx_REG (Pmode, PIC_REG))); |
| |
| REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, operands[1], |
| REG_NOTES (insn)); |
| |
| DONE; |
| }") |
| |
| (define_expand "symPLT_label2reg" |
| [(set (match_operand:SI 0 "" "") |
| (const:SI (minus:SI |
| (const:SI |
| (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_PLT)) |
| (const:SI |
| (minus:SI |
| (const:SI (plus:SI |
| (match_operand:SI 2 "" "") |
| (const_int 2))) |
| (const:SI (unspec:SI [(pc)] UNSPEC_PIC))))))) |
| ;; Even though the PIC register is not really used by the call |
| ;; sequence in which this is expanded, the PLT code assumes the PIC |
| ;; register is set, so we must not skip its initialization. Since |
| ;; we only use this expand as part of calling sequences, and never |
| ;; to take the address of a function, this is the best point to |
| ;; insert the (use). Using the PLT to take the address of a |
| ;; function would be wrong, not only because the PLT entry could |
| ;; then be called from a function that doesn't initialize the PIC |
| ;; register to the proper GOT, but also because pointers to the |
| ;; same function might not compare equal, should they be set by |
| ;; different shared libraries. |
| (use (reg:SI PIC_REG))] |
| "TARGET_SH1" |
| "") |
| |
| (define_expand "sym2PIC" |
| [(const (unspec [(match_operand:SI 0 "" "")] UNSPEC_PIC))] |
| "" |
| "") |
| |
| ;; TLS code generation. |
| ;; ??? this should be a define_insn_and_split |
| ;; See the thread [PATCH/RFA] SH TLS support on gcc-patches |
| ;; <http://gcc.gnu.org/ml/gcc-patches/2003-02/msg01898.html> |
| ;; for details. |
| |
| (define_insn "tls_global_dynamic" |
| [(set (match_operand:SI 0 "register_operand" "=&z") |
| (call (unspec:SI [(match_operand:SI 1 "" "")] |
| UNSPEC_TLSGD) |
| (const_int 0))) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (scratch:SI))] |
| "TARGET_SH1" |
| "* |
| { |
| return \"\\ |
| mov.l\\t1f,r4\\n\\ |
| \\tmova\\t2f,r0\\n\\ |
| \\tmov.l\\t2f,r1\\n\\ |
| \\tadd\\tr0,r1\\n\\ |
| \\tjsr\\t@r1\\n\\ |
| \\tadd\\tr12,r4\\n\\ |
| \\tbra\\t3f\\n\\ |
| \\tnop\\n\\ |
| \\t.align\\t2\\n\\ |
| 1:\\t.long\\t%a1@TLSGD\\n\\ |
| 2:\\t.long\\t__tls_get_addr@PLT\\n\\ |
| 3:\"; |
| }" |
| [(set_attr "type" "tls_load") |
| (set_attr "length" "26")]) |
| |
| (define_insn "tls_local_dynamic" |
| [(set (match_operand:SI 0 "register_operand" "=&z") |
| (call (unspec:SI [(match_operand:SI 1 "" "")] |
| UNSPEC_TLSLDM) |
| (const_int 0))) |
| (use (reg:PSI FPSCR_REG)) |
| (use (reg:SI PIC_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (scratch:SI))] |
| "TARGET_SH1" |
| "* |
| { |
| return \"\\ |
| mov.l\\t1f,r4\\n\\ |
| \\tmova\\t2f,r0\\n\\ |
| \\tmov.l\\t2f,r1\\n\\ |
| \\tadd\\tr0,r1\\n\\ |
| \\tjsr\\t@r1\\n\\ |
| \\tadd\\tr12,r4\\n\\ |
| \\tbra\\t3f\\n\\ |
| \\tnop\\n\\ |
| \\t.align\\t2\\n\\ |
| 1:\\t.long\\t%a1@TLSLDM\\n\\ |
| 2:\\t.long\\t__tls_get_addr@PLT\\n\\ |
| 3:\"; |
| }" |
| [(set_attr "type" "tls_load") |
| (set_attr "length" "26")]) |
| |
| (define_expand "sym2DTPOFF" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_DTPOFF))] |
| "" |
| "") |
| |
| (define_expand "symDTPOFF2reg" |
| [(match_operand 0 "" "") (match_operand 1 "" "") (match_operand 2 "" "")] |
| "" |
| " |
| { |
| rtx dtpoffsym, insn; |
| rtx t = no_new_pseudos ? operands[0] : gen_reg_rtx (GET_MODE (operands[0])); |
| |
| dtpoffsym = gen_sym2DTPOFF (operands[1]); |
| PUT_MODE (dtpoffsym, Pmode); |
| emit_move_insn (t, dtpoffsym); |
| insn = emit_move_insn (operands[0], |
| gen_rtx_PLUS (Pmode, t, operands[2])); |
| DONE; |
| }") |
| |
| (define_expand "sym2GOTTPOFF" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTTPOFF))] |
| "" |
| "") |
| |
| (define_insn "tls_initial_exec" |
| [(set (match_operand:SI 0 "register_operand" "=&r") |
| (unspec:SI [(match_operand:SI 1 "" "")] |
| UNSPEC_TLSIE)) |
| (use (reg:SI GBR_REG)) |
| (use (reg:SI PIC_REG)) |
| (clobber (reg:SI R0_REG))] |
| "" |
| "* |
| { |
| return \"\\ |
| mov.l\\t1f,r0\\n\\ |
| \\tstc\\tgbr,%0\\n\\ |
| \\tmov.l\\t@(r0,r12),r0\\n\\ |
| \\tbra\\t2f\\n\\ |
| \\tadd\\tr0,%0\\n\\ |
| \\t.align\\t2\\n\\ |
| 1:\\t.long\\t%a1\\n\\ |
| 2:\"; |
| }" |
| [(set_attr "type" "tls_load") |
| (set_attr "length" "16")]) |
| |
| (define_expand "sym2TPOFF" |
| [(const (unspec [(match_operand 0 "" "")] UNSPEC_TPOFF))] |
| "" |
| "") |
| |
| (define_expand "symTPOFF2reg" |
| [(match_operand 0 "" "") (match_operand 1 "" "")] |
| "" |
| " |
| { |
| rtx tpoffsym, insn; |
| |
| tpoffsym = gen_sym2TPOFF (operands[1]); |
| PUT_MODE (tpoffsym, Pmode); |
| insn = emit_move_insn (operands[0], tpoffsym); |
| DONE; |
| }") |
| |
| (define_insn "load_gbr" |
| [(set (match_operand:SI 0 "register_operand" "") (reg:SI GBR_REG)) |
| (use (reg:SI GBR_REG))] |
| "" |
| "stc gbr,%0" |
| [(set_attr "type" "tls_load")]) |
| |
| ;; case instruction for switch statements. |
| |
| ;; Operand 0 is index |
| ;; operand 1 is the minimum bound |
| ;; operand 2 is the maximum bound - minimum bound + 1 |
| ;; operand 3 is CODE_LABEL for the table; |
| ;; operand 4 is the CODE_LABEL to go to if index out of range. |
| |
| (define_expand "casesi" |
| [(match_operand:SI 0 "arith_reg_operand" "") |
| (match_operand:SI 1 "arith_reg_operand" "") |
| (match_operand:SI 2 "arith_reg_operand" "") |
| (match_operand 3 "" "") (match_operand 4 "" "")] |
| "" |
| " |
| { |
| rtx reg = gen_reg_rtx (SImode); |
| rtx reg2 = gen_reg_rtx (SImode); |
| if (TARGET_SHMEDIA) |
| { |
| rtx reg = gen_reg_rtx (DImode); |
| rtx reg2 = gen_reg_rtx (DImode); |
| rtx reg3 = gen_reg_rtx (DImode); |
| rtx reg4 = gen_reg_rtx (DImode); |
| rtx reg5 = gen_reg_rtx (DImode); |
| |
| operands[0] = convert_modes (DImode, SImode, operands[0], 0); |
| operands[1] = convert_modes (DImode, SImode, operands[1], 0); |
| operands[2] = convert_modes (DImode, SImode, operands[2], 1); |
| |
| emit_jump_insn (gen_bgt_media (operands[4], operands[1], operands[0])); |
| emit_move_insn (reg, gen_rtx_MINUS (DImode, operands[0], operands[1])); |
| emit_jump_insn (gen_bgtu_media (operands[4], reg, operands[2])); |
| emit_insn (gen_casesi_shift_media (reg2, reg, operands[3])); |
| emit_move_insn (reg3, gen_datalabel_ref (gen_rtx_LABEL_REF |
| (DImode, operands[3]))); |
| emit_insn (gen_casesi_load_media (reg4, reg3, reg2, operands[3])); |
| emit_move_insn (reg5, gen_rtx_PLUS (DImode, reg3, reg4)); |
| emit_jump_insn (gen_casesi_jump_media (reg5, operands[3])); |
| emit_barrier (); |
| DONE; |
| } |
| operands[1] = copy_to_mode_reg (SImode, operands[1]); |
| operands[2] = copy_to_mode_reg (SImode, operands[2]); |
| /* If optimizing, casesi_worker depends on the mode of the instruction |
| before label it 'uses' - operands[3]. */ |
| emit_insn (gen_casesi_0 (operands[0], operands[1], operands[2], operands[4], |
| reg)); |
| emit_insn (gen_casesi_worker_0 (reg2, reg, operands[3])); |
| if (TARGET_SH2) |
| emit_jump_insn (gen_casesi_jump_2 (reg2, gen_label_rtx (), operands[3])); |
| else |
| emit_jump_insn (gen_casesi_jump_1 (reg2, operands[3])); |
| /* For SH2 and newer, the ADDR_DIFF_VEC is not actually relative to |
| operands[3], but to lab. We will fix this up in |
| machine_dependent_reorg. */ |
| emit_barrier (); |
| DONE; |
| }") |
| |
| (define_expand "casesi_0" |
| [(set (match_operand:SI 4 "" "") (match_operand:SI 0 "arith_reg_operand" "")) |
| (set (match_dup 4) (minus:SI (match_dup 4) |
| (match_operand:SI 1 "arith_operand" ""))) |
| (set (reg:SI T_REG) |
| (gtu:SI (match_dup 4) |
| (match_operand:SI 2 "arith_reg_operand" ""))) |
| (set (pc) |
| (if_then_else (ne (reg:SI T_REG) |
| (const_int 0)) |
| (label_ref (match_operand 3 "" "")) |
| (pc)))] |
| "TARGET_SH1" |
| "") |
| |
| ;; ??? reload might clobber r0 if we use it explicitly in the RTL before |
| ;; reload; using a R0_REGS pseudo reg is likely to give poor code. |
| ;; So we keep the use of r0 hidden in a R0_REGS clobber until after reload. |
| |
| (define_insn "casesi_worker_0" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (unspec:SI [(match_operand:SI 1 "register_operand" "0,r") |
| (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) |
| (clobber (match_scratch:SI 3 "=X,1")) |
| (clobber (match_scratch:SI 4 "=&z,z"))] |
| "TARGET_SH1" |
| "#") |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (unspec:SI [(match_operand:SI 1 "register_operand" "") |
| (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) |
| (clobber (match_scratch:SI 3 "")) |
| (clobber (match_scratch:SI 4 ""))] |
| "TARGET_SH1 && ! TARGET_SH2 && reload_completed" |
| [(set (reg:SI R0_REG) (unspec:SI [(label_ref (match_dup 2))] UNSPEC_MOVA)) |
| (parallel [(set (match_dup 0) |
| (unspec:SI [(reg:SI R0_REG) (match_dup 1) |
| (label_ref (match_dup 2))] UNSPEC_CASESI)) |
| (clobber (match_dup 3))]) |
| (set (match_dup 0) (plus:SI (match_dup 0) (reg:SI R0_REG)))] |
| "if (GET_CODE (operands[2]) == CODE_LABEL) LABEL_NUSES (operands[2])++;") |
| |
| (define_split |
| [(set (match_operand:SI 0 "register_operand" "") |
| (unspec:SI [(match_operand:SI 1 "register_operand" "") |
| (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) |
| (clobber (match_scratch:SI 3 "")) |
| (clobber (match_scratch:SI 4 ""))] |
| "TARGET_SH2 && reload_completed" |
| [(set (reg:SI R0_REG) (unspec:SI [(label_ref (match_dup 2))] UNSPEC_MOVA)) |
| (parallel [(set (match_dup 0) |
| (unspec:SI [(reg:SI R0_REG) (match_dup 1) |
| (label_ref (match_dup 2))] UNSPEC_CASESI)) |
| (clobber (match_dup 3))])] |
| "if (GET_CODE (operands[2]) == CODE_LABEL) LABEL_NUSES (operands[2])++;") |
| |
| (define_insn "casesi_worker_1" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (unspec:SI [(reg:SI R0_REG) |
| (match_operand:SI 1 "register_operand" "0,r") |
| (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) |
| (clobber (match_scratch:SI 3 "=X,1"))] |
| "TARGET_SH1" |
| "* |
| { |
| rtx diff_vec = PATTERN (next_real_insn (operands[2])); |
| |
| if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) |
| abort (); |
| |
| switch (GET_MODE (diff_vec)) |
| { |
| case SImode: |
| return \"shll2 %1\;mov.l @(r0,%1),%0\"; |
| case HImode: |
| return \"add %1,%1\;mov.w @(r0,%1),%0\"; |
| case QImode: |
| if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) |
| return \"mov.b @(r0,%1),%0\;extu.b %0,%0\"; |
| return \"mov.b @(r0,%1),%0\"; |
| default: |
| abort (); |
| } |
| }" |
| [(set_attr "length" "4")]) |
| |
| (define_insn "casesi_worker_2" |
| [(set (match_operand:SI 0 "register_operand" "=r,r") |
| (unspec:SI [(reg:SI R0_REG) |
| (match_operand:SI 1 "register_operand" "0,r") |
| (label_ref (match_operand 2 "" "")) |
| (label_ref (match_operand 3 "" ""))] UNSPEC_CASESI)) |
| (clobber (match_operand:SI 4 "" "=X,1"))] |
| "TARGET_SH2 && reload_completed && flag_pic" |
| "* |
| { |
| rtx diff_vec = PATTERN (next_real_insn (operands[2])); |
| char *load; |
| |
| if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) |
| abort (); |
| |
| switch (GET_MODE (diff_vec)) |
| { |
| case SImode: |
| output_asm_insn (\"shll2 %1\", operands); |
| load = \"mov.l @(r0,%1),%0\"; break; |
| case HImode: |
| output_asm_insn (\"add %1,%1\", operands); |
| load = \"mov.w @(r0,%1),%0\"; break; |
| case QImode: |
| if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) |
| load = \"mov.b @(r0,%1),%0\;extu.b %0,%0\"; |
| else |
| load = \"mov.b @(r0,%1),%0\"; |
| break; |
| default: |
| abort (); |
| } |
| output_asm_insn (\"add\tr0,%1\;mova\t%O3,r0\\n\", operands); |
| return load; |
| }" |
| [(set_attr "length" "8")]) |
| |
| (define_insn "casesi_shift_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (ashift:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (unspec:DI [(label_ref:DI (match_operand 2 "" ""))] |
| UNSPEC_CASESI)))] |
| "TARGET_SHMEDIA" |
| "* |
| { |
| rtx diff_vec = PATTERN (next_real_insn (operands[2])); |
| |
| if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) |
| abort (); |
| |
| switch (GET_MODE (diff_vec)) |
| { |
| case SImode: |
| return \"shlli %1, 2, %0\"; |
| case HImode: |
| return \"shlli %1, 1, %0\"; |
| case QImode: |
| if (rtx_equal_p (operands[0], operands[1])) |
| return \"\"; |
| return \"add %1, r63, %0\"; |
| default: |
| abort (); |
| } |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "casesi_load_media" |
| [(set (match_operand:DI 0 "arith_reg_operand" "=r") |
| (mem:DI (unspec [(match_operand 1 "arith_reg_operand" "r") |
| (match_operand 2 "arith_reg_operand" "r") |
| (label_ref:DI (match_operand 3 "" ""))] 2)))] |
| "TARGET_SHMEDIA" |
| "* |
| { |
| rtx diff_vec = PATTERN (next_real_insn (operands[3])); |
| |
| if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) |
| abort (); |
| |
| switch (GET_MODE (diff_vec)) |
| { |
| case SImode: |
| return \"ldx.l %1, %2, %0\"; |
| case HImode: |
| #if 0 |
| if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) |
| return \"ldx.uw %1, %2, %0\"; |
| #endif |
| return \"ldx.w %1, %2, %0\"; |
| case QImode: |
| if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) |
| return \"ldx.ub %1, %2, %0\"; |
| return \"ldx.b %1, %2, %0\"; |
| default: |
| abort (); |
| } |
| }" |
| [(set_attr "type" "load_media")]) |
| |
| (define_expand "return" |
| [(return)] |
| "reload_completed && ! sh_need_epilogue ()" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| emit_jump_insn (gen_return_media ()); |
| DONE; |
| } |
| |
| if (TARGET_SHCOMPACT |
| && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))) |
| { |
| emit_jump_insn (gen_shcompact_return_tramp ()); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*return_i" |
| [(return)] |
| "TARGET_SH1 && ! (TARGET_SHCOMPACT |
| && (current_function_args_info.call_cookie |
| & CALL_COOKIE_RET_TRAMP (1))) |
| && reload_completed" |
| "%@ %#" |
| [(set_attr "type" "return") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "shcompact_return_tramp" |
| [(return)] |
| "TARGET_SHCOMPACT |
| && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))" |
| " |
| { |
| rtx reg = gen_rtx_REG (Pmode, R0_REG); |
| rtx sym = function_symbol (\"__GCC_shcompact_return_trampoline\"); |
| |
| if (flag_pic) |
| emit_insn (gen_symGOTPLT2reg (reg, sym)); |
| else |
| emit_move_insn (reg, sym); |
| |
| emit_jump_insn (gen_shcompact_return_tramp_i ()); |
| DONE; |
| }") |
| |
| (define_insn "shcompact_return_tramp_i" |
| [(parallel [(return) (use (reg:SI R0_REG))])] |
| "TARGET_SHCOMPACT |
| && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))" |
| "jmp @r0%#" |
| [(set_attr "type" "jump_ind") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "return_media_i" |
| [(parallel [(return) (use (match_operand:DI 0 "target_reg_operand" "k"))])] |
| "TARGET_SHMEDIA && reload_completed" |
| "blink %0, r63" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_insn "return_media_rte" |
| [(return)] |
| "TARGET_SHMEDIA && reload_completed && current_function_interrupt" |
| "rte" |
| [(set_attr "type" "jump_media")]) |
| |
| (define_expand "return_media" |
| [(return)] |
| "TARGET_SHMEDIA && reload_completed" |
| " |
| { |
| int tr_regno = sh_media_register_for_return (); |
| rtx tr; |
| |
| if (current_function_interrupt) |
| { |
| emit_jump_insn (gen_return_media_rte ()); |
| DONE; |
| } |
| if (tr_regno < 0) |
| { |
| rtx r18 = gen_rtx_REG (DImode, PR_MEDIA_REG); |
| |
| if (! call_used_regs[TR0_REG] || fixed_regs[TR0_REG]) |
| abort (); |
| tr_regno = TR0_REG; |
| tr = gen_rtx_REG (DImode, tr_regno); |
| emit_move_insn (tr, r18); |
| } |
| else |
| tr = gen_rtx_REG (DImode, tr_regno); |
| |
| emit_jump_insn (gen_return_media_i (tr)); |
| DONE; |
| }") |
| |
| (define_insn "shcompact_preserve_incoming_args" |
| [(set (match_operand:SI 0 "register_operand" "+r") |
| (unspec:SI [(match_dup 0)] UNSPEC_COMPACT_ARGS))] |
| "TARGET_SHCOMPACT" |
| "" |
| [(set_attr "length" "0")]) |
| |
| (define_insn "shcompact_incoming_args" |
| [(set (reg:SI R2_REG) (unspec:SI [(reg:SI R2_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R3_REG) (unspec:SI [(reg:SI R3_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R4_REG) (unspec:SI [(reg:SI R4_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R5_REG) (unspec:SI [(reg:SI R5_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R6_REG) (unspec:SI [(reg:SI R6_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R7_REG) (unspec:SI [(reg:SI R7_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R8_REG) (unspec:SI [(reg:SI R8_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (reg:SI R9_REG) (unspec:SI [(reg:SI R9_REG)] UNSPEC_COMPACT_ARGS)) |
| (set (mem:BLK (reg:SI MACL_REG)) |
| (unspec:BLK [(reg:SI MACH_REG)] UNSPEC_COMPACT_ARGS)) |
| (use (reg:SI R0_REG)) |
| (clobber (reg:SI R0_REG)) |
| (clobber (reg:SI MACL_REG)) |
| (clobber (reg:SI MACH_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT" |
| "jsr @r0%#" |
| [(set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "shmedia_save_restore_regs_compact" |
| [(set (reg:SI SP_REG) |
| (plus:SI (reg:SI SP_REG) |
| (match_operand:SI 0 "immediate_operand" "i"))) |
| (use (reg:SI R0_REG)) |
| (clobber (reg:SI PR_REG))] |
| "TARGET_SHCOMPACT |
| && (INTVAL (operands[0]) == SHMEDIA_REGS_STACK_ADJUST () |
| || INTVAL (operands[0]) == - SHMEDIA_REGS_STACK_ADJUST ())" |
| "jsr @r0%#" |
| [(set_attr "needs_delay_slot" "yes")]) |
| |
| (define_expand "prologue" |
| [(const_int 0)] |
| "" |
| "sh_expand_prologue (); DONE;") |
| |
| (define_expand "epilogue" |
| [(return)] |
| "" |
| " |
| { |
| sh_expand_epilogue (0); |
| emit_jump_insn (gen_return ()); |
| DONE; |
| }") |
| |
| (define_expand "eh_return" |
| [(use (match_operand 0 "register_operand" ""))] |
| "" |
| { |
| rtx tmp, ra = operands[0]; |
| |
| if (TARGET_SHMEDIA64) |
| emit_insn (gen_eh_set_ra_di (ra)); |
| else |
| emit_insn (gen_eh_set_ra_si (ra)); |
| |
| DONE; |
| }) |
| |
| ;; Clobber the return address on the stack. We can't expand this |
| ;; until we know where it will be put in the stack frame. |
| |
| (define_insn "eh_set_ra_si" |
| [(unspec [(match_operand:SI 0 "register_operand" "r")] UNSPEC_EH_RETURN) |
| (clobber (match_scratch:SI 1 "=&r"))] |
| "! TARGET_SHMEDIA64" |
| "#") |
| |
| (define_insn "eh_set_ra_di" |
| [(unspec [(match_operand:DI 0 "register_operand" "r")] UNSPEC_EH_RETURN) |
| (clobber (match_scratch:DI 1 "=&r"))] |
| "TARGET_SHMEDIA64" |
| "#") |
| |
| (define_split |
| [(unspec [(match_operand 0 "register_operand" "")] UNSPEC_EH_RETURN) |
| (clobber (match_scratch 1 ""))] |
| "reload_completed" |
| [(const_int 0)] |
| " |
| { |
| sh_set_return_address (operands[0], operands[1]); |
| DONE; |
| }") |
| |
| (define_insn "blockage" |
| [(unspec_volatile [(const_int 0)] UNSPECV_BLOCKAGE)] |
| "" |
| "" |
| [(set_attr "length" "0")]) |
| |
| ;; ------------------------------------------------------------------------ |
| ;; Scc instructions |
| ;; ------------------------------------------------------------------------ |
| |
| (define_insn "movt" |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (eq:SI (reg:SI T_REG) (const_int 1)))] |
| "TARGET_SH1" |
| "movt %0" |
| [(set_attr "type" "arith")]) |
| |
| (define_expand "seq" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| switch (GET_MODE (sh_compare_op0)) |
| { |
| case DImode: |
| emit_insn (gen_cmpeqdi_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| case SFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpeqsf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| case DFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpeqdf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| default: |
| FAIL; |
| } |
| DONE; |
| } |
| if (sh_expand_t_scc (EQ, operands[0])) |
| DONE; |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (EQ); |
| }") |
| |
| (define_expand "slt" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| switch (GET_MODE (sh_compare_op0)) |
| { |
| case DImode: |
| emit_insn (gen_cmpgtdi_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| break; |
| |
| case SFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgtsf_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| break; |
| |
| case DFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgtdf_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| break; |
| |
| default: |
| FAIL; |
| } |
| DONE; |
| } |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (LT); |
| }") |
| |
| (define_expand "sle" |
| [(match_operand:SI 0 "arith_reg_operand" "")] |
| "" |
| " |
| { |
| rtx tmp = sh_compare_op0; |
| |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| switch (GET_MODE (sh_compare_op0)) |
| { |
| case DImode: |
| { |
| tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); |
| |
| emit_insn (gen_cmpgtdi_media (tmp, |
| sh_compare_op0, sh_compare_op1)); |
| emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); |
| break; |
| } |
| |
| case SFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgesf_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| break; |
| |
| case DFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgedf_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| break; |
| |
| default: |
| FAIL; |
| } |
| DONE; |
| } |
| |
| sh_compare_op0 = sh_compare_op1; |
| sh_compare_op1 = tmp; |
| emit_insn (gen_sge (operands[0])); |
| DONE; |
| }") |
| |
| (define_expand "sgt" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| switch (GET_MODE (sh_compare_op0)) |
| { |
| case DImode: |
| emit_insn (gen_cmpgtdi_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| case SFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgtsf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| case DFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgtdf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| default: |
| FAIL; |
| } |
| DONE; |
| } |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (GT); |
| }") |
| |
| (define_expand "sge" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| switch (GET_MODE (sh_compare_op0)) |
| { |
| case DImode: |
| { |
| rtx tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); |
| |
| emit_insn (gen_cmpgtdi_media (tmp, |
| sh_compare_op1, sh_compare_op0)); |
| emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); |
| break; |
| } |
| |
| case SFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgesf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| case DFmode: |
| if (! TARGET_SHMEDIA_FPU) |
| FAIL; |
| emit_insn (gen_cmpgedf_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| break; |
| |
| default: |
| FAIL; |
| } |
| DONE; |
| } |
| |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| if (GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) |
| { |
| if (TARGET_IEEE) |
| { |
| rtx lab = gen_label_rtx (); |
| prepare_scc_operands (EQ); |
| emit_jump_insn (gen_branch_true (lab)); |
| prepare_scc_operands (GT); |
| emit_label (lab); |
| emit_insn (gen_movt (operands[0])); |
| } |
| else |
| emit_insn (gen_movnegt (operands[0], prepare_scc_operands (LT))); |
| DONE; |
| } |
| operands[1] = prepare_scc_operands (GE); |
| }") |
| |
| (define_expand "sgtu" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| emit_insn (gen_cmpgtudi_media (operands[0], |
| sh_compare_op0, sh_compare_op1)); |
| DONE; |
| } |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (GTU); |
| }") |
| |
| (define_expand "sltu" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| emit_insn (gen_cmpgtudi_media (operands[0], |
| sh_compare_op1, sh_compare_op0)); |
| DONE; |
| } |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (LTU); |
| }") |
| |
| (define_expand "sleu" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| rtx tmp; |
| |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); |
| |
| emit_insn (gen_cmpgtudi_media (tmp, sh_compare_op0, sh_compare_op1)); |
| emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); |
| |
| DONE; |
| } |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (LEU); |
| }") |
| |
| (define_expand "sgeu" |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (match_dup 1))] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| rtx tmp; |
| |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); |
| |
| emit_insn (gen_cmpgtudi_media (tmp, sh_compare_op1, sh_compare_op0)); |
| emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); |
| |
| DONE; |
| } |
| |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (GEU); |
| }") |
| |
| ;; sne moves the complement of the T reg to DEST like this: |
| ;; cmp/eq ... |
| ;; mov #-1,temp |
| ;; negc temp,dest |
| ;; This is better than xoring compare result with 1 because it does |
| ;; not require r0 and further, the -1 may be CSE-ed or lifted out of a |
| ;; loop. |
| |
| (define_expand "sne" |
| [(set (match_dup 2) (const_int -1)) |
| (parallel [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (neg:SI (plus:SI (match_dup 1) |
| (match_dup 2)))) |
| (set (reg:SI T_REG) |
| (ne:SI (ior:SI (match_dup 1) (match_dup 2)) |
| (const_int 0)))])] |
| "" |
| " |
| { |
| if (TARGET_SHMEDIA) |
| { |
| rtx tmp; |
| |
| if (GET_MODE (operands[0]) != DImode) |
| operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); |
| |
| if (! TARGET_SHMEDIA_FPU && GET_MODE (sh_compare_op0) != DImode) |
| FAIL; |
| |
| sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| if (sh_compare_op1 != const0_rtx) |
| sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode |
| ? GET_MODE (sh_compare_op0) |
| : GET_MODE (sh_compare_op1), |
| sh_compare_op1); |
| |
| tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); |
| |
| emit_insn (gen_seq (tmp)); |
| emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); |
| |
| DONE; |
| } |
| |
| if (sh_expand_t_scc (NE, operands[0])) |
| DONE; |
| if (! rtx_equal_function_value_matters) |
| FAIL; |
| operands[1] = prepare_scc_operands (EQ); |
| operands[2] = gen_reg_rtx (SImode); |
| }") |
| |
| (define_expand "sunordered" |
| [(set (match_operand:DI 0 "arith_reg_operand" "") |
| (unordered:DI (match_dup 1) (match_dup 2)))] |
| "TARGET_SHMEDIA_FPU" |
| " |
| { |
| operands[1] = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); |
| operands[2] = force_reg (GET_MODE (sh_compare_op1), sh_compare_op1); |
| }") |
| |
| ;; Use the same trick for FP sle / sge |
| (define_expand "movnegt" |
| [(set (match_dup 2) (const_int -1)) |
| (parallel [(set (match_operand 0 "" "") |
| (neg:SI (plus:SI (match_dup 1) |
| (match_dup 2)))) |
| (set (reg:SI T_REG) |
| (ne:SI (ior:SI (match_operand 1 "" "") (match_dup 2)) |
| (const_int 0)))])] |
| "TARGET_SH1" |
| "operands[2] = gen_reg_rtx (SImode);") |
| |
| ;; Recognize mov #-1/negc/neg sequence, and change it to movt/add #-1. |
| ;; This prevents a regression that occurred when we switched from xor to |
| ;; mov/neg for sne. |
| |
| (define_split |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (plus:SI (reg:SI T_REG) |
| (const_int -1)))] |
| "TARGET_SH1" |
| [(set (match_dup 0) (eq:SI (reg:SI T_REG) (const_int 1))) |
| (set (match_dup 0) (plus:SI (match_dup 0) (const_int -1)))] |
| "") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Instructions to cope with inline literal tables |
| ;; ------------------------------------------------------------------------- |
| |
| ; 2 byte integer in line |
| |
| (define_insn "consttable_2" |
| [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") |
| (match_operand 1 "" "")] |
| UNSPECV_CONST2)] |
| "" |
| "* |
| { |
| if (operands[1] != const0_rtx) |
| assemble_integer (operands[0], 2, BITS_PER_UNIT * 2, 1); |
| return \"\"; |
| }" |
| [(set_attr "length" "2") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ; 4 byte integer in line |
| |
| (define_insn "consttable_4" |
| [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") |
| (match_operand 1 "" "")] |
| UNSPECV_CONST4)] |
| "" |
| "* |
| { |
| if (operands[1] != const0_rtx) |
| assemble_integer (operands[0], 4, BITS_PER_UNIT * 4, 1); |
| return \"\"; |
| }" |
| [(set_attr "length" "4") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ; 8 byte integer in line |
| |
| (define_insn "consttable_8" |
| [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") |
| (match_operand 1 "" "")] |
| UNSPECV_CONST8)] |
| "" |
| "* |
| { |
| if (operands[1] != const0_rtx) |
| assemble_integer (operands[0], 8, BITS_PER_UNIT * 8, 1); |
| return \"\"; |
| }" |
| [(set_attr "length" "8") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ; 4 byte floating point |
| |
| (define_insn "consttable_sf" |
| [(unspec_volatile [(match_operand:SF 0 "general_operand" "=g") |
| (match_operand 1 "" "")] |
| UNSPECV_CONST4)] |
| "" |
| "* |
| { |
| if (operands[1] != const0_rtx) |
| { |
| REAL_VALUE_TYPE d; |
| REAL_VALUE_FROM_CONST_DOUBLE (d, operands[0]); |
| assemble_real (d, SFmode, GET_MODE_ALIGNMENT (SFmode)); |
| } |
| return \"\"; |
| }" |
| [(set_attr "length" "4") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ; 8 byte floating point |
| |
| (define_insn "consttable_df" |
| [(unspec_volatile [(match_operand:DF 0 "general_operand" "=g") |
| (match_operand 1 "" "")] |
| UNSPECV_CONST8)] |
| "" |
| "* |
| { |
| if (operands[1] != const0_rtx) |
| { |
| REAL_VALUE_TYPE d; |
| REAL_VALUE_FROM_CONST_DOUBLE (d, operands[0]); |
| assemble_real (d, DFmode, GET_MODE_ALIGNMENT (DFmode)); |
| } |
| return \"\"; |
| }" |
| [(set_attr "length" "8") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ;; Alignment is needed for some constant tables; it may also be added for |
| ;; Instructions at the start of loops, or after unconditional branches. |
| ;; ??? We would get more accurate lengths if we did instruction |
| ;; alignment based on the value of INSN_CURRENT_ADDRESS; the approach used |
| ;; here is too conservative. |
| |
| ; align to a two byte boundary |
| |
| (define_expand "align_2" |
| [(unspec_volatile [(const_int 1)] UNSPECV_ALIGN)] |
| "" |
| "") |
| |
| ; align to a four byte boundary |
| ;; align_4 and align_log are instructions for the starts of loops, or |
| ;; after unconditional branches, which may take up extra room. |
| |
| (define_expand "align_4" |
| [(unspec_volatile [(const_int 2)] UNSPECV_ALIGN)] |
| "" |
| "") |
| |
| ; align to a cache line boundary |
| |
| (define_insn "align_log" |
| [(unspec_volatile [(match_operand 0 "const_int_operand" "")] UNSPECV_ALIGN)] |
| "" |
| "" |
| [(set_attr "length" "0") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ; emitted at the end of the literal table, used to emit the |
| ; 32bit branch labels if needed. |
| |
| (define_insn "consttable_end" |
| [(unspec_volatile [(const_int 0)] UNSPECV_CONST_END)] |
| "" |
| "* return output_jump_label_table ();" |
| [(set_attr "in_delay_slot" "no")]) |
| |
| ; emitted at the end of the window in the literal table. |
| |
| (define_insn "consttable_window_end" |
| [(unspec_volatile [(match_operand 0 "" "")] UNSPECV_WINDOW_END)] |
| "" |
| "" |
| [(set_attr "length" "0") |
| (set_attr "in_delay_slot" "no")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Misc |
| ;; ------------------------------------------------------------------------- |
| |
| ;; String/block move insn. |
| |
| (define_expand "movstrsi" |
| [(parallel [(set (mem:BLK (match_operand:BLK 0 "" "")) |
| (mem:BLK (match_operand:BLK 1 "" ""))) |
| (use (match_operand:SI 2 "nonmemory_operand" "")) |
| (use (match_operand:SI 3 "immediate_operand" "")) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R4_REG)) |
| (clobber (reg:SI R5_REG)) |
| (clobber (reg:SI R0_REG))])] |
| "TARGET_SH1 && ! TARGET_SH5" |
| " |
| { |
| if(expand_block_move (operands)) |
| DONE; |
| else FAIL; |
| }") |
| |
| (define_insn "block_move_real" |
| [(parallel [(set (mem:BLK (reg:SI R4_REG)) |
| (mem:BLK (reg:SI R5_REG))) |
| (use (match_operand:SI 0 "arith_reg_operand" "r")) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R0_REG))])] |
| "TARGET_SH1 && ! TARGET_HARD_SH4" |
| "jsr @%0%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "block_lump_real" |
| [(parallel [(set (mem:BLK (reg:SI R4_REG)) |
| (mem:BLK (reg:SI R5_REG))) |
| (use (match_operand:SI 0 "arith_reg_operand" "r")) |
| (use (reg:SI R6_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI R4_REG)) |
| (clobber (reg:SI R5_REG)) |
| (clobber (reg:SI R6_REG)) |
| (clobber (reg:SI R0_REG))])] |
| "TARGET_SH1 && ! TARGET_HARD_SH4" |
| "jsr @%0%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "block_move_real_i4" |
| [(parallel [(set (mem:BLK (reg:SI R4_REG)) |
| (mem:BLK (reg:SI R5_REG))) |
| (use (match_operand:SI 0 "arith_reg_operand" "r")) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI R0_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R2_REG))])] |
| "TARGET_HARD_SH4" |
| "jsr @%0%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| (define_insn "block_lump_real_i4" |
| [(parallel [(set (mem:BLK (reg:SI R4_REG)) |
| (mem:BLK (reg:SI R5_REG))) |
| (use (match_operand:SI 0 "arith_reg_operand" "r")) |
| (use (reg:SI R6_REG)) |
| (clobber (reg:SI PR_REG)) |
| (clobber (reg:SI T_REG)) |
| (clobber (reg:SI R4_REG)) |
| (clobber (reg:SI R5_REG)) |
| (clobber (reg:SI R6_REG)) |
| (clobber (reg:SI R0_REG)) |
| (clobber (reg:SI R1_REG)) |
| (clobber (reg:SI R2_REG)) |
| (clobber (reg:SI R3_REG))])] |
| "TARGET_HARD_SH4" |
| "jsr @%0%#" |
| [(set_attr "type" "sfunc") |
| (set_attr "needs_delay_slot" "yes")]) |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Floating point instructions. |
| ;; ------------------------------------------------------------------------- |
| |
| ;; ??? All patterns should have a type attribute. |
| |
| (define_expand "fpu_switch0" |
| [(set (match_operand:SI 0 "" "") (match_dup 2)) |
| (set (match_dup 1) (mem:PSI (match_dup 0)))] |
| "TARGET_SH4" |
| " |
| { |
| operands[1] = get_fpscr_rtx (); |
| operands[2] = gen_rtx_SYMBOL_REF (SImode, \"__fpscr_values\"); |
| if (flag_pic) |
| operands[2] = legitimize_pic_address (operands[2], SImode, |
| no_new_pseudos ? operands[0] : 0); |
| }") |
| |
| (define_expand "fpu_switch1" |
| [(set (match_operand:SI 0 "" "") (match_dup 2)) |
| (set (match_dup 3) (plus:SI (match_dup 0) (const_int 4))) |
| (set (match_dup 1) (mem:PSI (match_dup 3)))] |
| "TARGET_SH4" |
| " |
| { |
| operands[1] = get_fpscr_rtx (); |
| operands[2] = gen_rtx_SYMBOL_REF (SImode, \"__fpscr_values\"); |
| if (flag_pic) |
| operands[2] = legitimize_pic_address (operands[2], SImode, |
| no_new_pseudos ? operands[0] : 0); |
| operands[3] = no_new_pseudos ? operands[0] : gen_reg_rtx (SImode); |
| }") |
| |
| (define_expand "movpsi" |
| [(set (match_operand:PSI 0 "register_operand" "") |
| (match_operand:PSI 1 "general_movsrc_operand" ""))] |
| "TARGET_SH4" |
| "") |
| |
| ;; The c / m alternative is a fake to guide reload to load directly into |
| ;; fpscr, since reload doesn't know how to use post-increment. |
| ;; GO_IF_LEGITIMATE_ADDRESS guards about bogus addresses before reload, |
| ;; SECONDARY_INPUT_RELOAD_CLASS does this during reload, and the insn's |
| ;; predicate after reload. |
| ;; The mac_gp type for r/!c might look a bit odd, but it actually schedules |
| ;; like a mac -> gpr move. |
| (define_insn "fpu_switch" |
| [(set (match_operand:PSI 0 "general_movdst_operand" "=c,c,r,c,c,r,m,r,<") |
| (match_operand:PSI 1 "general_movsrc_operand" "c,>,m,m,r,r,r,!c,c"))] |
| "TARGET_SH2E |
| && (! reload_completed |
| || true_regnum (operands[0]) != FPSCR_REG |
| || GET_CODE (operands[1]) != MEM |
| || GET_CODE (XEXP (operands[1], 0)) != PLUS)" |
| "@ |
| ! precision stays the same |
| lds.l %1,fpscr |
| mov.l %1,%0 |
| # |
| lds %1,fpscr |
| mov %1,%0 |
| mov.l %1,%0 |
| sts fpscr,%0 |
| sts.l fpscr,%0" |
| [(set_attr "length" "0,2,2,4,2,2,2,2,2") |
| (set_attr "type" "nil,mem_fpscr,load,mem_fpscr,gp_fpscr,move,store,mac_gp,store")]) |
| |
| (define_split |
| [(set (reg:PSI FPSCR_REG) |
| (mem:PSI (match_operand:SI 0 "register_operand" "")))] |
| "TARGET_SH4 && find_regno_note (insn, REG_DEAD, true_regnum (operands[0]))" |
| [(set (match_dup 0) (match_dup 0))] |
| " |
| { |
| rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), |
| gen_rtx (MEM, PSImode, |
| gen_rtx (POST_INC, Pmode, |
| operands[0])))); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[0], NULL_RTX); |
| }") |
| |
| (define_split |
| [(set (reg:PSI FPSCR_REG) |
| (mem:PSI (match_operand:SI 0 "register_operand" "")))] |
| "TARGET_SH4" |
| [(set (match_dup 0) (plus:SI (match_dup 0) (const_int -4)))] |
| " |
| { |
| rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), |
| gen_rtx (MEM, PSImode, |
| gen_rtx (POST_INC, Pmode, |
| operands[0])))); |
| REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[0], NULL_RTX); |
| }") |
| |
| ;; ??? This uses the fp unit, but has no type indicating that. |
| ;; If we did that, this would either give a bogus latency or introduce |
| ;; a bogus FIFO constraint. |
| ;; Since this insn is currently only used for prologues/epilogues, |
| ;; it is probably best to claim no function unit, which matches the |
| ;; current setting. |
| (define_insn "toggle_sz" |
| [(set (reg:PSI FPSCR_REG) |
| (xor:PSI (reg:PSI FPSCR_REG) (const_int 1048576)))] |
| "TARGET_SH4" |
| "fschg" |
| [(set_attr "fp_set" "unknown")]) |
| |
| (define_expand "addsf3" |
| [(set (match_operand:SF 0 "arith_reg_operand" "") |
| (plus:SF (match_operand:SF 1 "arith_reg_operand" "") |
| (match_operand:SF 2 "arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH2E) |
| { |
| expand_sf_binop (&gen_addsf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*addsf3_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (plus:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fadd.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn_and_split "unary_sf_op" |
| [(set (match_operand:V2SF 0 "fp_arith_reg_operand" "=f") |
| (vec_select:V2SF |
| (vec_concat:V2SF |
| (vec_select:SF |
| (match_dup 0) |
| (parallel [(not:BI (match_operand 3 "const_int_operand" "n"))])) |
| (match_operator:SF 2 "unary_float_operator" |
| [(vec_select:SF (match_operand:V2SF 1 "fp_arith_reg_operand" "f") |
| (parallel [(match_operand 4 |
| "const_int_operand" "n")]))])) |
| (parallel [(not:BI (match_dup 3)) (match_dup 3)])))] |
| "TARGET_SHMEDIA_FPU" |
| "#" |
| "TARGET_SHMEDIA_FPU && reload_completed" |
| [(set (match_dup 5) (match_dup 6))] |
| " |
| { |
| int endian = TARGET_LITTLE_ENDIAN ? 0 : 1; |
| rtx op1 = gen_rtx_REG (SFmode, |
| (true_regnum (operands[1]) |
| + (INTVAL (operands[4]) ^ endian))); |
| |
| operands[7] = gen_rtx_REG (SFmode, |
| (true_regnum (operands[0]) |
| + (INTVAL (operands[3]) ^ endian))); |
| operands[6] = gen_rtx (GET_CODE (operands[2]), SFmode, op1); |
| }" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn_and_split "binary_sf_op" |
| [(set (match_operand:V2SF 0 "fp_arith_reg_operand" "=f") |
| (vec_select:V2SF |
| (vec_concat:V2SF |
| (vec_select:SF |
| (match_dup 0) |
| (parallel [(match_operand 7 "const_int_operand" "n")])) |
| (match_operator:SF 3 "binary_float_operator" |
| [(vec_select:SF (match_operand:V2SF 1 "fp_arith_reg_operand" "f") |
| (parallel [(match_operand 5 |
| "const_int_operand" "n")])) |
| (vec_select:SF (match_operand:V2SF 2 "fp_arith_reg_operand" "f") |
| (parallel [(match_operand 6 |
| "const_int_operand" "n")]))])) |
| (parallel [(match_dup 7) (match_operand 4 "const_int_operand" "n")])))] |
| "TARGET_SHMEDIA_FPU && INTVAL (operands[4]) != INTVAL (operands[7])" |
| "#" |
| "&& reload_completed" |
| [(set (match_dup 8) (match_dup 9))] |
| " |
| { |
| int endian = TARGET_LITTLE_ENDIAN ? 0 : 1; |
| rtx op1 = gen_rtx_REG (SFmode, |
| (true_regnum (operands[1]) |
| + (INTVAL (operands[5]) ^ endian))); |
| rtx op2 = gen_rtx_REG (SFmode, |
| (true_regnum (operands[2]) |
| + (INTVAL (operands[6]) ^ endian))); |
| |
| operands[8] = gen_rtx_REG (SFmode, |
| (true_regnum (operands[0]) |
| + (INTVAL (operands[4]) ^ endian))); |
| operands[9] = gen_rtx (GET_CODE (operands[3]), SFmode, op1, op2); |
| }" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "addsf3_i" |
| [(set (match_operand:SF 0 "arith_reg_operand" "=f") |
| (plus:SF (match_operand:SF 1 "arith_reg_operand" "%0") |
| (match_operand:SF 2 "arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fadd %2,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_expand "subsf3" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "") |
| (match_operand:SF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH2E) |
| { |
| expand_sf_binop (&gen_subsf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*subsf3_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fsub.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "subsf3_i" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "0") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fsub %2,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| ;; Unfortunately, the combiner is unable to cope with the USE of the FPSCR |
| ;; register in feeding fp instructions. Thus, we cannot generate fmac for |
| ;; mixed-precision SH4 targets. To allow it to be still generated for the |
| ;; SH3E, we use a separate insn for SH3E mulsf3. |
| |
| (define_expand "mulsf3" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "") |
| (match_operand:SF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| expand_sf_binop (&gen_mulsf3_i4, operands); |
| else if (TARGET_SH2E) |
| emit_insn (gen_mulsf3_ie (operands[0], operands[1], operands[2])); |
| if (! TARGET_SHMEDIA) |
| DONE; |
| }") |
| |
| (define_insn "*mulsf3_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fmul.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "mulsf3_i4" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%0") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fmul %2,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "mulsf3_ie" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%0") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "fmul %2,%0" |
| [(set_attr "type" "fp")]) |
| |
| (define_insn "*mac_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (plus:SF (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")) |
| (match_operand:SF 3 "fp_arith_reg_operand" "0")))] |
| "TARGET_SHMEDIA_FPU" |
| "fmac.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "*macsf3" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (plus:SF (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%w") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")) |
| (match_operand:SF 3 "arith_reg_operand" "0"))) |
| (use (match_operand:PSI 4 "fpscr_operand" "c"))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "fmac fr0,%2,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_expand "divsf3" |
| [(set (match_operand:SF 0 "arith_reg_operand" "") |
| (div:SF (match_operand:SF 1 "arith_reg_operand" "") |
| (match_operand:SF 2 "arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH2E) |
| { |
| expand_sf_binop (&gen_divsf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*divsf3_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (div:SF (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fdiv.s %1, %2, %0" |
| [(set_attr "type" "fdiv_media")]) |
| |
| (define_insn "divsf3_i" |
| [(set (match_operand:SF 0 "arith_reg_operand" "=f") |
| (div:SF (match_operand:SF 1 "arith_reg_operand" "0") |
| (match_operand:SF 2 "arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fdiv %2,%0" |
| [(set_attr "type" "fdiv") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "floatdisf2" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (float:SF (match_operand:DI 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "float.qs %1, %0" |
| [(set_attr "type" "fpconv_media")]) |
| |
| (define_expand "floatsisf2" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (float:SF (match_operand:SI 1 "fpul_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_sf_insn (gen_floatsisf2_i4 (operands[0], operands[1], get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*floatsisf2_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (float:SF (match_operand:SI 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "float.ls %1, %0" |
| [(set_attr "type" "fpconv_media")]) |
| |
| (define_insn "floatsisf2_i4" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (float:SF (match_operand:SI 1 "fpul_operand" "y"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "float %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "*floatsisf2_ie" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (float:SF (match_operand:SI 1 "fpul_operand" "y")))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "float %1,%0" |
| [(set_attr "type" "fp")]) |
| |
| (define_insn "fix_truncsfdi2" |
| [(set (match_operand:DI 0 "fp_arith_reg_operand" "=f") |
| (fix:DI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "ftrc.sq %1, %0" |
| [(set_attr "type" "fpconv_media")]) |
| |
| (define_expand "fix_truncsfsi2" |
| [(set (match_operand:SI 0 "fpul_operand" "=y") |
| (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_sf_insn (gen_fix_truncsfsi2_i4 (operands[0], operands[1], get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*fix_truncsfsi2_media" |
| [(set (match_operand:SI 0 "fp_arith_reg_operand" "=f") |
| (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "ftrc.sl %1, %0" |
| [(set_attr "type" "fpconv_media")]) |
| |
| (define_insn "fix_truncsfsi2_i4" |
| [(set (match_operand:SI 0 "fpul_operand" "=y") |
| (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "ftrc %1,%0" |
| [(set_attr "type" "ftrc_s") |
| (set_attr "fp_mode" "single")]) |
| |
| ;; ??? This pattern is used nowhere. fix_truncsfsi2 always expands to |
| ;; fix_truncsfsi2_i4. |
| ;; (define_insn "fix_truncsfsi2_i4_2" |
| ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| ;; (fix:SI (match_operand:SF 1 "arith_reg_operand" "f"))) |
| ;; (use (reg:PSI FPSCR_REG)) |
| ;; (clobber (reg:SI FPUL_REG))] |
| ;; "TARGET_SH4" |
| ;; "#" |
| ;; [(set_attr "length" "4") |
| ;; (set_attr "fp_mode" "single")]) |
| |
| ;;(define_split |
| ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| ;; (fix:SI (match_operand:SF 1 "arith_reg_operand" "f"))) |
| ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) |
| ;; (clobber (reg:SI FPUL_REG))] |
| ;; "TARGET_SH4" |
| ;; [(parallel [(set (reg:SI FPUL_REG) (fix:SI (match_dup 1))) |
| ;; (use (match_dup 2))]) |
| ;; (set (match_dup 0) (reg:SI FPUL_REG))]) |
| |
| (define_insn "*fixsfsi" |
| [(set (match_operand:SI 0 "fpul_operand" "=y") |
| (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "ftrc %1,%0" |
| [(set_attr "type" "fp")]) |
| |
| (define_insn "cmpgtsf_t" |
| [(set (reg:SI T_REG) |
| (gt:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "fcmp/gt %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "cmpeqsf_t" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SH2E && ! TARGET_SH4" |
| "fcmp/eq %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "ieee_ccmpeqsf_t" |
| [(set (reg:SI T_REG) |
| (ior:SI (reg:SI T_REG) |
| (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f"))))] |
| "TARGET_SH2E && TARGET_IEEE && ! TARGET_SH4" |
| "* return output_ieee_ccmpeq (insn, operands);" |
| [(set_attr "length" "4")]) |
| |
| |
| (define_insn "cmpgtsf_t_i4" |
| [(set (reg:SI T_REG) |
| (gt:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcmp/gt %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "cmpeqsf_t_i4" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcmp/eq %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "*ieee_ccmpeqsf_t_4" |
| [(set (reg:SI T_REG) |
| (ior:SI (reg:SI T_REG) |
| (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") |
| (match_operand:SF 1 "fp_arith_reg_operand" "f")))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_IEEE && TARGET_SH4" |
| "* return output_ieee_ccmpeq (insn, operands);" |
| [(set_attr "length" "4") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_insn "cmpeqsf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (eq:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpeq.s %1, %2, %0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpgtsf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (gt:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpgt.s %1, %2, %0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpgesf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (ge:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpge.s %1, %2, %0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpunsf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (unordered:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") |
| (match_operand:SF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpun.s %1, %2, %0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_expand "cmpsf" |
| [(set (reg:SI T_REG) |
| (compare (match_operand:SF 0 "arith_operand" "") |
| (match_operand:SF 1 "arith_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_compare_op0 = operands[0]; |
| sh_compare_op1 = operands[1]; |
| DONE; |
| }") |
| |
| (define_expand "negsf2" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH2E) |
| { |
| expand_sf_unop (&gen_negsf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*negsf2_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fneg.s %1, %0" |
| [(set_attr "type" "fmove_media")]) |
| |
| (define_insn "negsf2_i" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fneg %0" |
| [(set_attr "type" "fmove") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_expand "sqrtsf2" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] |
| "TARGET_SH3E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH3E) |
| { |
| expand_sf_unop (&gen_sqrtsf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*sqrtsf2_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fsqrt.s %1, %0" |
| [(set_attr "type" "fdiv_media")]) |
| |
| (define_insn "sqrtsf2_i" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH3E" |
| "fsqrt %0" |
| [(set_attr "type" "fdiv") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_expand "abssf2" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "") |
| (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] |
| "TARGET_SH2E || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH2E) |
| { |
| expand_sf_unop (&gen_abssf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*abssf2_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fabs.s %1, %0" |
| [(set_attr "type" "fmove_media")]) |
| |
| (define_insn "abssf2_i" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH2E" |
| "fabs %0" |
| [(set_attr "type" "fmove") |
| (set_attr "fp_mode" "single")]) |
| |
| (define_expand "adddf3" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "") |
| (match_operand:DF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_binop (&gen_adddf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*adddf3_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "%f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fadd.d %1, %2, %0" |
| [(set_attr "type" "dfparith_media")]) |
| |
| (define_insn "adddf3_i" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "%0") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fadd %2,%0" |
| [(set_attr "type" "dfp_arith") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "subdf3" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "") |
| (match_operand:DF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_binop (&gen_subdf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*subdf3_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fsub.d %1, %2, %0" |
| [(set_attr "type" "dfparith_media")]) |
| |
| (define_insn "subdf3_i" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "0") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fsub %2,%0" |
| [(set_attr "type" "dfp_arith") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "muldf3" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "") |
| (match_operand:DF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_binop (&gen_muldf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*muldf3_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "%f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fmul.d %1, %2, %0" |
| [(set_attr "type" "dfmul_media")]) |
| |
| (define_insn "muldf3_i" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "%0") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fmul %2,%0" |
| [(set_attr "type" "dfp_arith") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "divdf3" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "") |
| (match_operand:DF 2 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_binop (&gen_divdf3_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*divdf3_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fdiv.d %1, %2, %0" |
| [(set_attr "type" "dfdiv_media")]) |
| |
| (define_insn "divdf3_i" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "0") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 3 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fdiv %2,%0" |
| [(set_attr "type" "dfdiv") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_insn "floatdidf2" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (float:DF (match_operand:DI 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "float.qd %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_expand "floatsidf2" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (float:DF (match_operand:SI 1 "fpul_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_df_insn (gen_floatsidf2_i (operands[0], operands[1], |
| get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*floatsidf2_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (float:DF (match_operand:SI 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "float.ld %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_insn "floatsidf2_i" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (float:DF (match_operand:SI 1 "fpul_operand" "y"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "float %1,%0" |
| [(set_attr "type" "dfp_conv") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_insn "fix_truncdfdi2" |
| [(set (match_operand:DI 0 "fp_arith_reg_operand" "=f") |
| (fix:DI (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "ftrc.dq %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_expand "fix_truncdfsi2" |
| [(set (match_operand:SI 0 "fpul_operand" "") |
| (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_df_insn (gen_fix_truncdfsi2_i (operands[0], operands[1], |
| get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*fix_truncdfsi2_media" |
| [(set (match_operand:SI 0 "fp_arith_reg_operand" "=f") |
| (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "ftrc.dl %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_insn "fix_truncdfsi2_i" |
| [(set (match_operand:SI 0 "fpul_operand" "=y") |
| (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "ftrc %1,%0" |
| [(set_attr "type" "dfp_conv") |
| (set_attr "dfp_comp" "no") |
| (set_attr "fp_mode" "double")]) |
| |
| ;; ??? This pattern is used nowhere. fix_truncdfsi2 always expands to |
| ;; fix_truncdfsi2_i. |
| ;; (define_insn "fix_truncdfsi2_i4" |
| ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| ;; (fix:SI (match_operand:DF 1 "arith_reg_operand" "f"))) |
| ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) |
| ;; (clobber (reg:SI FPUL_REG))] |
| ;; "TARGET_SH4" |
| ;; "#" |
| ;; [(set_attr "length" "4") |
| ;; (set_attr "fp_mode" "double")]) |
| ;; |
| ;; (define_split |
| ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| ;; (fix:SI (match_operand:DF 1 "arith_reg_operand" "f"))) |
| ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) |
| ;; (clobber (reg:SI FPUL_REG))] |
| ;; "TARGET_SH4" |
| ;; [(parallel [(set (reg:SI FPUL_REG) (fix:SI (match_dup 1))) |
| ;; (use (match_dup 2))]) |
| ;; (set (match_dup 0) (reg:SI FPUL_REG))]) |
| |
| (define_insn "cmpgtdf_t" |
| [(set (reg:SI T_REG) |
| (gt:SI (match_operand:DF 0 "arith_reg_operand" "f") |
| (match_operand:DF 1 "arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcmp/gt %1,%0" |
| [(set_attr "type" "dfp_cmp") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_insn "cmpeqdf_t" |
| [(set (reg:SI T_REG) |
| (eq:SI (match_operand:DF 0 "arith_reg_operand" "f") |
| (match_operand:DF 1 "arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcmp/eq %1,%0" |
| [(set_attr "type" "dfp_cmp") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_insn "*ieee_ccmpeqdf_t" |
| [(set (reg:SI T_REG) |
| (ior:SI (reg:SI T_REG) |
| (eq:SI (match_operand:DF 0 "arith_reg_operand" "f") |
| (match_operand:DF 1 "arith_reg_operand" "f")))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_IEEE && TARGET_SH4" |
| "* return output_ieee_ccmpeq (insn, operands);" |
| [(set_attr "length" "4") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_insn "cmpeqdf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (eq:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpeq.d %1,%2,%0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpgtdf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (gt:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpgt.d %1,%2,%0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpgedf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (ge:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpge.d %1,%2,%0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_insn "cmpundf_media" |
| [(set (match_operand:DI 0 "register_operand" "=r") |
| (unordered:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") |
| (match_operand:DF 2 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcmpun.d %1,%2,%0" |
| [(set_attr "type" "fcmp_media")]) |
| |
| (define_expand "cmpdf" |
| [(set (reg:SI T_REG) |
| (compare (match_operand:DF 0 "arith_operand" "") |
| (match_operand:DF 1 "arith_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| sh_compare_op0 = operands[0]; |
| sh_compare_op1 = operands[1]; |
| DONE; |
| }") |
| |
| (define_expand "negdf2" |
| [(set (match_operand:DF 0 "arith_reg_operand" "") |
| (neg:DF (match_operand:DF 1 "arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_unop (&gen_negdf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*negdf2_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (neg:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fneg.d %1, %0" |
| [(set_attr "type" "fmove_media")]) |
| |
| (define_insn "negdf2_i" |
| [(set (match_operand:DF 0 "arith_reg_operand" "=f") |
| (neg:DF (match_operand:DF 1 "arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fneg %0" |
| [(set_attr "type" "fmove") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "sqrtdf2" |
| [(set (match_operand:DF 0 "arith_reg_operand" "") |
| (sqrt:DF (match_operand:DF 1 "arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_unop (&gen_sqrtdf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*sqrtdf2_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (sqrt:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fsqrt.d %1, %0" |
| [(set_attr "type" "dfdiv_media")]) |
| |
| (define_insn "sqrtdf2_i" |
| [(set (match_operand:DF 0 "arith_reg_operand" "=f") |
| (sqrt:DF (match_operand:DF 1 "arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fsqrt %0" |
| [(set_attr "type" "dfdiv") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "absdf2" |
| [(set (match_operand:DF 0 "arith_reg_operand" "") |
| (abs:DF (match_operand:DF 1 "arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| expand_df_unop (&gen_absdf2_i, operands); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*absdf2_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (abs:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fabs.d %1, %0" |
| [(set_attr "type" "fmove_media")]) |
| |
| (define_insn "absdf2_i" |
| [(set (match_operand:DF 0 "arith_reg_operand" "=f") |
| (abs:DF (match_operand:DF 1 "arith_reg_operand" "0"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fabs %0" |
| [(set_attr "type" "fmove") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "extendsfdf2" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "") |
| (float_extend:DF (match_operand:SF 1 "fpul_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_df_insn (gen_extendsfdf2_i4 (operands[0], operands[1], |
| get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*extendsfdf2_media" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (float_extend:DF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcnv.sd %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_insn "extendsfdf2_i4" |
| [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") |
| (float_extend:DF (match_operand:SF 1 "fpul_operand" "y"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcnvsd %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "double")]) |
| |
| (define_expand "truncdfsf2" |
| [(set (match_operand:SF 0 "fpul_operand" "") |
| (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "")))] |
| "TARGET_SH4 || TARGET_SHMEDIA_FPU" |
| " |
| { |
| if (TARGET_SH4) |
| { |
| emit_df_insn (gen_truncdfsf2_i4 (operands[0], operands[1], |
| get_fpscr_rtx ())); |
| DONE; |
| } |
| }") |
| |
| (define_insn "*truncdfsf2_media" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] |
| "TARGET_SHMEDIA_FPU" |
| "fcnv.ds %1, %0" |
| [(set_attr "type" "dfpconv_media")]) |
| |
| (define_insn "truncdfsf2_i4" |
| [(set (match_operand:SF 0 "fpul_operand" "=y") |
| (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "f"))) |
| (use (match_operand:PSI 2 "fpscr_operand" "c"))] |
| "TARGET_SH4" |
| "fcnvds %1,%0" |
| [(set_attr "type" "fp") |
| (set_attr "fp_mode" "double")]) |
| |
| ;; Bit field extract patterns. These give better code for packed bitfields, |
| ;; because they allow auto-increment addresses to be generated. |
| |
| (define_expand "insv" |
| [(set (zero_extract:SI (match_operand:QI 0 "memory_operand" "") |
| (match_operand:SI 1 "immediate_operand" "") |
| (match_operand:SI 2 "immediate_operand" "")) |
| (match_operand:SI 3 "general_operand" ""))] |
| "TARGET_SH1 && ! TARGET_LITTLE_ENDIAN" |
| " |
| { |
| rtx addr_target, orig_address, shift_reg, qi_val; |
| HOST_WIDE_INT bitsize, size, v; |
| rtx x = operands[3]; |
| |
| /* ??? expmed doesn't care for non-register predicates. */ |
| if (! memory_operand (operands[0], VOIDmode) |
| || ! immediate_operand (operands[1], VOIDmode) |
| || ! immediate_operand (operands[2], VOIDmode) |
| || ! general_operand (x, VOIDmode)) |
| FAIL; |
| /* If this isn't a 16 / 24 / 32 bit field, or if |
| it doesn't start on a byte boundary, then fail. */ |
| bitsize = INTVAL (operands[1]); |
| if (bitsize < 16 || bitsize > 32 || bitsize % 8 != 0 |
| || (INTVAL (operands[2]) % 8) != 0) |
| FAIL; |
| |
| size = bitsize / 8; |
| orig_address = XEXP (operands[0], 0); |
| shift_reg = gen_reg_rtx (SImode); |
| if (GET_CODE (x) == CONST_INT) |
| { |
| v = INTVAL (x); |
| qi_val = force_reg (QImode, GEN_INT (trunc_int_for_mode (v, QImode))); |
| } |
| else |
| { |
| emit_insn (gen_movsi (shift_reg, operands[3])); |
| qi_val = gen_rtx_SUBREG (QImode, shift_reg, 3); |
| } |
| addr_target = copy_addr_to_reg (plus_constant (orig_address, size - 1)); |
| |
| operands[0] = replace_equiv_address (operands[0], addr_target); |
| emit_insn (gen_movqi (operands[0], qi_val)); |
| |
| while (size -= 1) |
| { |
| if (GET_CODE (x) == CONST_INT) |
| qi_val |
| = force_reg (QImode, GEN_INT (trunc_int_for_mode (v >>= 8, QImode))); |
| else |
| { |
| emit_insn (gen_lshrsi3_k (shift_reg, shift_reg, GEN_INT (8))); |
| qi_val = gen_rtx_SUBREG (QImode, shift_reg, 3); |
| } |
| emit_insn (gen_addsi3 (addr_target, addr_target, GEN_INT (-1))); |
| emit_insn (gen_movqi (operands[0], qi_val)); |
| } |
| |
| DONE; |
| }") |
| |
| ;; ------------------------------------------------------------------------- |
| ;; Peepholes |
| ;; ------------------------------------------------------------------------- |
| |
| ;; This matches cases where a stack pointer increment at the start of the |
| ;; epilogue combines with a stack slot read loading the return value. |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "arith_reg_operand" "") |
| (mem:SI (match_operand:SI 1 "arith_reg_operand" ""))) |
| (set (match_dup 1) (plus:SI (match_dup 1) (const_int 4)))] |
| "TARGET_SH1 && REGNO (operands[1]) != REGNO (operands[0])" |
| "mov.l @%1+,%0") |
| |
| ;; See the comment on the dt combiner pattern above. |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "arith_reg_operand" "=r") |
| (plus:SI (match_dup 0) |
| (const_int -1))) |
| (set (reg:SI T_REG) |
| (eq:SI (match_dup 0) |
| (const_int 0)))] |
| "TARGET_SH2" |
| "dt %0") |
| |
| ;; These convert sequences such as `mov #k,r0; add r15,r0; mov.l @r0,rn' |
| ;; to `mov #k,r0; mov.l @(r0,r15),rn'. These sequences are generated by |
| ;; reload when the constant is too large for a reg+offset address. |
| |
| ;; ??? We would get much better code if this was done in reload. This would |
| ;; require modifying find_reloads_address to recognize that if the constant |
| ;; is out-of-range for an immediate add, then we get better code by reloading |
| ;; the constant into a register than by reloading the sum into a register, |
| ;; since the former is one instruction shorter if the address does not need |
| ;; to be offsettable. Unfortunately this does not work, because there is |
| ;; only one register, r0, that can be used as an index register. This register |
| ;; is also the function return value register. So, if we try to force reload |
| ;; to use double-reg addresses, then we end up with some instructions that |
| ;; need to use r0 twice. The only way to fix this is to change the calling |
| ;; convention so that r0 is not used to return values. |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (mem:SI (match_dup 0)) |
| (match_operand:SI 2 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.l %2,@(%0,%1)") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_operand:SI 2 "general_movdst_operand" "") |
| (mem:SI (match_dup 0)))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.l @(%0,%1),%2") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (mem:HI (match_dup 0)) |
| (match_operand:HI 2 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.w %2,@(%0,%1)") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_operand:HI 2 "general_movdst_operand" "") |
| (mem:HI (match_dup 0)))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.w @(%0,%1),%2") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (mem:QI (match_dup 0)) |
| (match_operand:QI 2 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.b %2,@(%0,%1)") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_operand:QI 2 "general_movdst_operand" "") |
| (mem:QI (match_dup 0)))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" |
| "mov.b @(%0,%1),%2") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (mem:SF (match_dup 0)) |
| (match_operand:SF 2 "general_movsrc_operand" ""))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 |
| && ((GET_CODE (operands[2]) == REG && REGNO (operands[2]) < 16) |
| || (GET_CODE (operands[2]) == SUBREG |
| && REGNO (SUBREG_REG (operands[2])) < 16)) |
| && reg_unused_after (operands[0], insn)" |
| "mov.l %2,@(%0,%1)") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_operand:SF 2 "general_movdst_operand" "") |
| |
| (mem:SF (match_dup 0)))] |
| "TARGET_SH1 && REGNO (operands[0]) == 0 |
| && ((GET_CODE (operands[2]) == REG && REGNO (operands[2]) < 16) |
| || (GET_CODE (operands[2]) == SUBREG |
| && REGNO (SUBREG_REG (operands[2])) < 16)) |
| && reg_unused_after (operands[0], insn)" |
| "mov.l @(%0,%1),%2") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (mem:SF (match_dup 0)) |
| (match_operand:SF 2 "general_movsrc_operand" ""))] |
| "TARGET_SH2E && REGNO (operands[0]) == 0 |
| && ((GET_CODE (operands[2]) == REG |
| && FP_OR_XD_REGISTER_P (REGNO (operands[2]))) |
| || (GET_CODE (operands[2]) == SUBREG |
| && FP_OR_XD_REGISTER_P (REGNO (SUBREG_REG (operands[2]))))) |
| && reg_unused_after (operands[0], insn)" |
| "fmov{.s|} %2,@(%0,%1)") |
| |
| (define_peephole |
| [(set (match_operand:SI 0 "register_operand" "=r") |
| (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) |
| (set (match_operand:SF 2 "general_movdst_operand" "") |
| |
| (mem:SF (match_dup 0)))] |
| "TARGET_SH2E && REGNO (operands[0]) == 0 |
| && ((GET_CODE (operands[2]) == REG |
| && FP_OR_XD_REGISTER_P (REGNO (operands[2]))) |
| || (GET_CODE (operands[2]) == SUBREG |
| && FP_OR_XD_REGISTER_P (REGNO (SUBREG_REG (operands[2]))))) |
| && reg_unused_after (operands[0], insn)" |
| "fmov{.s|} @(%0,%1),%2") |
| |
| ;; Switch to a new stack with its address in sp_switch (a SYMBOL_REF). */ |
| (define_insn "sp_switch_1" |
| [(const_int 1)] |
| "TARGET_SH1" |
| "* |
| { |
| rtx xoperands[1]; |
| |
| xoperands[0] = sp_switch; |
| output_asm_insn (\"mov.l r0,@-r15\;mov.l %0,r0\", xoperands); |
| output_asm_insn (\"mov.l @r0,r0\;mov.l r15,@-r0\", xoperands); |
| return \"mov r0,r15\"; |
| }" |
| [(set_attr "length" "10")]) |
| |
| ;; Switch back to the original stack for interrupt functions with the |
| ;; sp_switch attribute. */ |
| (define_insn "sp_switch_2" |
| [(const_int 2)] |
| "TARGET_SH1" |
| "mov.l @r15+,r15\;mov.l @r15+,r0" |
| [(set_attr "length" "4")]) |
| |
| ;; Integer vector moves |
| |
| (define_expand "movv8qi" |
| [(set (match_operand:V8QI 0 "general_movdst_operand" "") |
| (match_operand:V8QI 1 "general_movsrc_operand" ""))] |
| "TARGET_SHMEDIA" |
| "{ if (prepare_move_operands (operands, V8QImode)) DONE; }") |
| |
| (define_insn "movv8qi_i" |
| [(set (match_operand:V8QI 0 "general_movdst_operand" "=r,r,r,rl,m") |
| (match_operand:V8QI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], V8QImode) |
| || sh_register_operand (operands[1], V8QImode))" |
| "@ |
| add %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") |
| (set_attr "length" "4,4,16,4,4")]) |
| |
| (define_split |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "") |
| (subreg:V8QI (const_int 0) 0))] |
| "TARGET_SHMEDIA" |
| [(set (match_dup 0) |
| (const_vector:V8QI [(const_int 0) (const_int 0) (const_int 0) |
| (const_int 0) (const_int 0) (const_int 0) |
| (const_int 0) (const_int 0)]))]) |
| |
| (define_split |
| [(set (match_operand 0 "arith_reg_dest" "") |
| (match_operand 1 "sh_rep_vec" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && GET_MODE (operands[0]) == GET_MODE (operands[1]) |
| && VECTOR_MODE_SUPPORTED_P (GET_MODE (operands[0])) |
| && GET_MODE_SIZE (GET_MODE (operands[0])) == 8 |
| && (XVECEXP (operands[1], 0, 0) != const0_rtx |
| || XVECEXP (operands[1], 0, 1) != const0_rtx) |
| && (XVECEXP (operands[1], 0, 0) != constm1_rtx |
| || XVECEXP (operands[1], 0, 1) != constm1_rtx)" |
| [(set (match_dup 0) (match_dup 1)) |
| (match_dup 2)] |
| " |
| { |
| int unit_size = GET_MODE_UNIT_SIZE (GET_MODE (operands[1])); |
| rtx elt1 = XVECEXP (operands[1], 0, 1); |
| |
| if (unit_size > 2) |
| operands[2] = gen_mshflo_l (operands[0], operands[0], operands[0]); |
| else |
| { |
| if (unit_size < 2) |
| operands[0] = gen_rtx_REG (V4HImode, true_regnum (operands[0])); |
| operands[2] = gen_mperm_w0 (operands[0], operands[0]); |
| } |
| operands[0] = gen_rtx_REG (DImode, true_regnum (operands[0])); |
| operands[1] = XVECEXP (operands[1], 0, 0); |
| if (unit_size < 2) |
| { |
| if (GET_CODE (operands[1]) == CONST_INT && GET_CODE (elt1) == CONST_INT) |
| operands[1] |
| = GEN_INT (TARGET_LITTLE_ENDIAN |
| ? (INTVAL (operands[1]) & 0xff) + (INTVAL (elt1) << 8) |
| : (INTVAL (operands[1]) << 8) + (INTVAL (elt1) & 0xff)); |
| else |
| { |
| operands[0] = gen_rtx_REG (V2QImode, true_regnum (operands[0])); |
| operands[1] |
| = gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, operands[1], elt1)); |
| } |
| } |
| }") |
| |
| (define_split |
| [(set (match_operand 0 "arith_reg_dest" "") |
| (match_operand 1 "sh_const_vec" ""))] |
| "TARGET_SHMEDIA && reload_completed |
| && GET_MODE (operands[0]) == GET_MODE (operands[1]) |
| && VECTOR_MODE_SUPPORTED_P (GET_MODE (operands[0])) |
| && operands[1] != CONST0_RTX (GET_MODE (operands[1]))" |
| [(set (match_dup 0) (match_dup 1))] |
| " |
| { |
| rtx v = operands[1]; |
| enum machine_mode new_mode |
| = mode_for_size (GET_MODE_BITSIZE (GET_MODE (v)), MODE_INT, 0); |
| |
| operands[0] = gen_rtx_REG (new_mode, true_regnum (operands[0])); |
| operands[1] |
| = simplify_subreg (new_mode, operands[1], GET_MODE (operands[1]), 0); |
| }") |
| |
| (define_expand "movv2hi" |
| [(set (match_operand:V2HI 0 "general_movdst_operand" "") |
| (match_operand:V2HI 1 "general_movsrc_operand" ""))] |
| "TARGET_SHMEDIA" |
| "{ if (prepare_move_operands (operands, V2HImode)) DONE; }") |
| |
| (define_insn "movv2hi_i" |
| [(set (match_operand:V2HI 0 "general_movdst_operand" "=r,r,r,rl,m") |
| (match_operand:V2HI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], V2HImode) |
| || sh_register_operand (operands[1], V2HImode))" |
| "@ |
| addz.l %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.l %m1, %0 |
| st%M0.l %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") |
| (set_attr "length" "4,4,16,4,4")]) |
| |
| (define_expand "movv4hi" |
| [(set (match_operand:V4HI 0 "general_movdst_operand" "") |
| (match_operand:V4HI 1 "general_movsrc_operand" ""))] |
| "TARGET_SHMEDIA" |
| "{ if (prepare_move_operands (operands, V4HImode)) DONE; }") |
| |
| (define_insn "movv4hi_i" |
| [(set (match_operand:V4HI 0 "general_movdst_operand" "=r,r,r,rl,m") |
| (match_operand:V4HI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], V4HImode) |
| || sh_register_operand (operands[1], V4HImode))" |
| "@ |
| add %1, r63, %0 |
| movi %1, %0 |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") |
| (set_attr "length" "4,4,16,4,4")]) |
| |
| (define_expand "movv2si" |
| [(set (match_operand:V2SI 0 "general_movdst_operand" "") |
| (match_operand:V2SI 1 "general_movsrc_operand" ""))] |
| "TARGET_SHMEDIA" |
| "{ if (prepare_move_operands (operands, V2SImode)) DONE; }") |
| |
| (define_insn "movv2si_i" |
| [(set (match_operand:V2SI 0 "general_movdst_operand" "=r,r,r,rl,m") |
| (match_operand:V2SI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] |
| "TARGET_SHMEDIA |
| && (register_operand (operands[0], V2SImode) |
| || sh_register_operand (operands[1], V2SImode))" |
| "@ |
| add %1, r63, %0 |
| # |
| # |
| ld%M1.q %m1, %0 |
| st%M0.q %m0, %N1" |
| [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") |
| (set_attr "length" "4,4,16,4,4")]) |
| |
| ;; Multimedia Intrinsics |
| |
| (define_insn "absv2si2" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (abs:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mabs.l %1, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "absv4hi2" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (abs:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mabs.w %1, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "addv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (plus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "%r") |
| (match_operand:V2SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "madd.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "addv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (plus:V4HI (match_operand:V4HI 1 "arith_reg_operand" "%r") |
| (match_operand:V4HI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "madd.w %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "ssaddv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_plus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "%r") |
| (match_operand:V2SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "madds.l %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "usaddv8qi3" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (us_plus:V8QI (match_operand:V8QI 1 "arith_reg_operand" "%r") |
| (match_operand:V8QI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "madds.ub %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "ssaddv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ss_plus:V4HI (match_operand:V4HI 1 "arith_reg_operand" "%r") |
| (match_operand:V4HI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "madds.w %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpeqv8qi" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (neg:V8QI (eq:V8QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpeq.b %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpeqv2si" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (neg:V2SI (eq:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpeq.l %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpeqv4hi" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (neg:V4HI (eq:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpeq.w %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpgtuv8qi" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (neg:V8QI (gtu:V8QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpgt.ub %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpgtv2si" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (neg:V2SI (gt:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpgt.l %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "negcmpgtv4hi" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (neg:V4HI (gt:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "%rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcmpgt.w %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "mcmv" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_operand" "r")) |
| (and:DI (match_operand:DI 3 "arith_reg_operand" "0") |
| (not:DI (match_dup 2)))))] |
| "TARGET_SHMEDIA" |
| "mcmv %N1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mcnvs_lw" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_concat:V4HI |
| (ss_truncate:V2HI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ")) |
| (ss_truncate:V2HI (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcnvs.lw %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "mcnvs_wb" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (vec_concat:V8QI |
| (ss_truncate:V4QI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ")) |
| (ss_truncate:V4QI (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcnvs.wb %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "mcnvs_wub" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (vec_concat:V8QI |
| (us_truncate:V4QI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ")) |
| (us_truncate:V4QI (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mcnvs.wub %N1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "mextr_rl" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (lshiftrt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:HI 3 "mextr_bit_offset" "i")) |
| (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (match_operand:HI 4 "mextr_bit_offset" "i"))))] |
| "TARGET_SHMEDIA && INTVAL (operands[3]) + INTVAL (operands[4]) == 64" |
| "* |
| { |
| static char templ[16]; |
| |
| sprintf (templ, \"mextr%d\\t%%N1, %%N2, %%0\", |
| (int) INTVAL (operands[3]) >> 3); |
| return templ; |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "*mextr_lr" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:HI 3 "mextr_bit_offset" "i")) |
| (lshiftrt:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (match_operand:HI 4 "mextr_bit_offset" "i"))))] |
| "TARGET_SHMEDIA && INTVAL (operands[3]) + INTVAL (operands[4]) == 64" |
| "* |
| { |
| static char templ[16]; |
| |
| sprintf (templ, \"mextr%d\\t%%N2, %%N1, %%0\", |
| (int) INTVAL (operands[4]) >> 3); |
| return templ; |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| ; mextrN can be modelled with vec_select / vec_concat, but the selection |
| ; vector then varies depending on endianness. |
| (define_expand "mextr1" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (1 * 8), GEN_INT (7 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr2" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (2 * 8), GEN_INT (6 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr3" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (3 * 8), GEN_INT (5 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr4" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (4 * 8), GEN_INT (4 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr5" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (5 * 8), GEN_INT (3 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr6" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (6 * 8), GEN_INT (2 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mextr7" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], |
| GEN_INT (7 * 8), GEN_INT (1 * 8))); |
| DONE; |
| }") |
| |
| (define_expand "mmacfx_wl" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V2HI 1 "extend_reg_operand" "") |
| (match_operand:V2HI 2 "extend_reg_operand" "") |
| (match_operand:V2SI 3 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mmacfx_wl_i (operands[0], operands[3], |
| operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mmacfx_wl_i" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_plus:V2SI |
| (match_operand:V2SI 1 "arith_reg_operand" "0") |
| (ss_truncate:V2SI |
| (ashift:V2DI |
| (sign_extend:V2DI |
| (mult:V2SI |
| (sign_extend:V2SI (match_operand:V2HI 2 "extend_reg_operand" "r")) |
| (sign_extend:V2SI (match_operand:V2HI 3 "extend_reg_operand" "r")))) |
| (const_int 1)))))] |
| "TARGET_SHMEDIA" |
| "mmacfx.wl %2, %3, %0" |
| [(set_attr "type" "mac_media")]) |
| |
| (define_expand "mmacnfx_wl" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V2HI 1 "extend_reg_operand" "") |
| (match_operand:V2HI 2 "extend_reg_operand" "") |
| (match_operand:V2SI 3 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mmacnfx_wl_i (operands[0], operands[3], |
| operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mmacnfx_wl_i" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_minus:V2SI |
| (match_operand:V2SI 1 "arith_reg_operand" "0") |
| (ss_truncate:V2SI |
| (ashift:V2DI |
| (sign_extend:V2DI |
| (mult:V2SI |
| (sign_extend:V2SI (match_operand:V2HI 2 "extend_reg_operand" "r")) |
| (sign_extend:V2SI (match_operand:V2HI 3 "extend_reg_operand" "r")))) |
| (const_int 1)))))] |
| "TARGET_SHMEDIA" |
| "mmacnfx.wl %2, %3, %0" |
| [(set_attr "type" "mac_media")]) |
| |
| (define_insn "mulv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (mult:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") |
| (match_operand:V2SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mmul.l %1, %2, %0" |
| [(set_attr "type" "d2mpy_media")]) |
| |
| (define_insn "mulv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (mult:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (match_operand:V4HI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mmul.w %1, %2, %0" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_insn "mmulfx_l" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_truncate:V2SI |
| (ashiftrt:V2DI |
| (mult:V2DI |
| (sign_extend:V2DI (match_operand:V2SI 1 "arith_reg_operand" "r")) |
| (sign_extend:V2DI (match_operand:V2SI 2 "arith_reg_operand" "r"))) |
| (const_int 31))))] |
| "TARGET_SHMEDIA" |
| "mmulfx.l %1, %2, %0" |
| [(set_attr "type" "d2mpy_media")]) |
| |
| (define_insn "mmulfx_w" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ss_truncate:V4HI |
| (ashiftrt:V4SI |
| (mult:V4SI |
| (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) |
| (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) |
| (const_int 15))))] |
| "TARGET_SHMEDIA" |
| "mmulfx.w %1, %2, %0" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_insn "mmulfxrp_w" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ss_truncate:V4HI |
| (ashiftrt:V4SI |
| (plus:V4SI |
| (mult:V4SI |
| (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) |
| (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) |
| (const_int 16384)) |
| (const_int 15))))] |
| "TARGET_SHMEDIA" |
| "mmulfxrp.w %1, %2, %0" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_expand "mmulhi_wl" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V4HI 1 "arith_reg_operand" "") |
| (match_operand:V4HI 2 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mmul23_wl : gen_mmul01_wl) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_expand "mmullo_wl" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V4HI 1 "arith_reg_operand" "") |
| (match_operand:V4HI 2 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mmul01_wl : gen_mmul23_wl) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mmul23_wl" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (vec_select:V2SI |
| (mult:V4SI |
| (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) |
| (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) |
| (parallel [(const_int 2) (const_int 3)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mmulhi.wl %1, %2, %0\" |
| : \"mmullo.wl %1, %2, %0\");" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_insn "mmul01_wl" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (vec_select:V2SI |
| (mult:V4SI |
| (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) |
| (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) |
| (parallel [(const_int 0) (const_int 1)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mmullo.wl %1, %2, %0\" |
| : \"mmulhi.wl %1, %2, %0\");" |
| [(set_attr "type" "dmpy_media")]) |
| |
| (define_expand "mmulsum_wq" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:V4HI 1 "arith_reg_operand" "") |
| (match_operand:V4HI 2 "arith_reg_operand" "") |
| (match_operand:DI 3 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_mmulsum_wq_i (operands[0], operands[3], |
| operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mmulsum_wq_i" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (plus:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (plus:DI |
| (plus:DI |
| (vec_select:DI |
| (mult:V4DI |
| (sign_extend:V4DI (match_operand:V4HI 2 "arith_reg_operand" "r")) |
| (sign_extend:V4DI (match_operand:V4HI 3 "arith_reg_operand" "r"))) |
| (parallel [(const_int 0)])) |
| (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) |
| (sign_extend:V4DI (match_dup 3))) |
| (parallel [(const_int 1)]))) |
| (plus:DI |
| (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) |
| (sign_extend:V4DI (match_dup 3))) |
| (parallel [(const_int 2)])) |
| (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) |
| (sign_extend:V4DI (match_dup 3))) |
| (parallel [(const_int 3)]))))))] |
| "TARGET_SHMEDIA" |
| "mmulsum.wq %2, %3, %0" |
| [(set_attr "type" "mac_media")]) |
| |
| (define_expand "mperm_w" |
| [(match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (match_operand:QI 2 "extend_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mperm_w_little : gen_mperm_w_big) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| ; This use of vec_select isn't exactly correct according to rtl.texi |
| ; (because not constant), but it seems a straightforward extension. |
| (define_insn "mperm_w_little" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_select:V4HI |
| (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (parallel |
| [(zero_extract:QI (match_operand:QI 2 "extend_reg_or_0_operand" "rZ") |
| (const_int 2) (const_int 0)) |
| (zero_extract:QI (match_dup 2) (const_int 2) (const_int 2)) |
| (zero_extract:QI (match_dup 2) (const_int 2) (const_int 4)) |
| (zero_extract:QI (match_dup 2) (const_int 2) (const_int 6))])))] |
| "TARGET_SHMEDIA && TARGET_LITTLE_ENDIAN" |
| "mperm.w %1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mperm_w_big" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_select:V4HI |
| (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (parallel |
| [(zero_extract:QI (not:QI (match_operand:QI 2 |
| "extend_reg_or_0_operand" "rZ")) |
| (const_int 2) (const_int 0)) |
| (zero_extract:QI (not:QI (match_dup 2)) (const_int 2) (const_int 2)) |
| (zero_extract:QI (not:QI (match_dup 2)) (const_int 2) (const_int 4)) |
| (zero_extract:QI (not:QI (match_dup 2)) |
| (const_int 2) (const_int 6))])))] |
| "TARGET_SHMEDIA && ! TARGET_LITTLE_ENDIAN" |
| "mperm.w %1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mperm_w0" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_duplicate:V4HI (truncate:HI (match_operand 1 |
| "trunc_hi_operand" "r"))))] |
| "TARGET_SHMEDIA" |
| "mperm.w %1, r63, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "msad_ubq" |
| [(match_operand:DI 0 "arith_reg_dest" "") |
| (match_operand:V8QI 1 "arith_reg_or_0_operand" "") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "") |
| (match_operand:DI 3 "arith_reg_operand" "")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn (gen_msad_ubq_i (operands[0], operands[3], |
| operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "msad_ubq_i" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (plus:DI |
| (plus:DI |
| (plus:DI |
| (plus:DI |
| (match_operand:DI 1 "arith_reg_operand" "0") |
| (abs:DI (vec_select:DI |
| (minus:V8DI |
| (zero_extend:V8DI |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) |
| (zero_extend:V8DI |
| (match_operand:V8QI 3 "arith_reg_or_0_operand" "rZ"))) |
| (parallel [(const_int 0)])))) |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 1)])))) |
| (plus:DI |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 2)]))) |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 3)]))))) |
| (plus:DI |
| (plus:DI |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 4)]))) |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 5)])))) |
| (plus:DI |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 6)]))) |
| (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) |
| (zero_extend:V8DI (match_dup 3))) |
| (parallel [(const_int 7)])))))))] |
| "TARGET_SHMEDIA" |
| "msad.ubq %N2, %N3, %0" |
| [(set_attr "type" "mac_media")]) |
| |
| (define_insn "mshalds_l" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_truncate:V2SI |
| (ashift:V2DI |
| (sign_extend:V2DI (match_operand:V2SI 1 "arith_reg_operand" "r")) |
| (and:DI (match_operand:DI 2 "arith_reg_operand" "r") |
| (const_int 31)))))] |
| "TARGET_SHMEDIA" |
| "mshalds.l %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "mshalds_w" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ss_truncate:V4HI |
| (ashift:V4SI |
| (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) |
| (and:DI (match_operand:DI 2 "arith_reg_operand" "r") |
| (const_int 15)))))] |
| "TARGET_SHMEDIA" |
| "mshalds.w %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "ashrv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ashiftrt:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshard.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "ashrv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ashiftrt:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshard.w %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mshards_q" |
| [(set (match_operand:HI 0 "arith_reg_dest" "=r") |
| (ss_truncate:HI |
| (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_or_0_operand" "rZ"))))] |
| "TARGET_SHMEDIA" |
| "mshards.q %1, %N2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_expand "mshfhi_b" |
| [(match_operand:V8QI 0 "arith_reg_dest" "") |
| (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_b : gen_mshf0_b) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_expand "mshflo_b" |
| [(match_operand:V8QI 0 "arith_reg_dest" "") |
| (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_b : gen_mshf4_b) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mshf4_b" |
| [(set |
| (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (vec_select:V8QI |
| (vec_concat:V16QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 4) (const_int 12) (const_int 5) (const_int 13) |
| (const_int 6) (const_int 14) (const_int 7) (const_int 15)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshfhi.b %N1, %N2, %0\" |
| : \"mshflo.b %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mshf0_b" |
| [(set |
| (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (vec_select:V8QI |
| (vec_concat:V16QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 0) (const_int 8) (const_int 1) (const_int 9) |
| (const_int 2) (const_int 10) (const_int 3) (const_int 11)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshflo.b %N1, %N2, %0\" |
| : \"mshfhi.b %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "mshfhi_l" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_l : gen_mshf0_l) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_expand "mshflo_l" |
| [(match_operand:V2SI 0 "arith_reg_dest" "") |
| (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_l : gen_mshf4_l) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mshf4_l" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (vec_select:V2SI |
| (vec_concat:V4SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 1) (const_int 3)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshfhi.l %N1, %N2, %0\" |
| : \"mshflo.l %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mshf0_l" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (vec_select:V2SI |
| (vec_concat:V4SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 0) (const_int 2)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshflo.l %N1, %N2, %0\" |
| : \"mshfhi.l %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "mshfhi_w" |
| [(match_operand:V4HI 0 "arith_reg_dest" "") |
| (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_w : gen_mshf0_w) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_expand "mshflo_w" |
| [(match_operand:V4HI 0 "arith_reg_dest" "") |
| (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")] |
| "TARGET_SHMEDIA" |
| " |
| { |
| emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_w : gen_mshf4_w) |
| (operands[0], operands[1], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mshf4_w" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_select:V4HI |
| (vec_concat:V8HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 2) (const_int 6) (const_int 3) (const_int 7)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshfhi.w %N1, %N2, %0\" |
| : \"mshflo.w %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mshf0_w" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_select:V4HI |
| (vec_concat:V8HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 0) (const_int 4) (const_int 1) (const_int 5)])))] |
| "TARGET_SHMEDIA" |
| "* return (TARGET_LITTLE_ENDIAN |
| ? \"mshflo.w %N1, %N2, %0\" |
| : \"mshfhi.w %N1, %N2, %0\");" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "mshflo_w_x" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (vec_select:V4HI |
| (vec_concat:V4HI (match_operand:V2HI 1 "extend_reg_or_0_operand" "rZ") |
| (match_operand:V2HI 2 "extend_reg_or_0_operand" "rZ")) |
| (parallel [(const_int 2) (const_int 0) (const_int 3) (const_int 1)])))] |
| "TARGET_SHMEDIA" |
| "mshflo.w %N1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| /* These are useful to expand ANDs and as combiner patterns. */ |
| (define_insn_and_split "mshfhi_l_di" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r,f") |
| (ior:DI (lshiftrt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ,f") |
| (const_int 32)) |
| (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ,?f") |
| (const_int -4294967296))))] |
| "TARGET_SHMEDIA" |
| "@ |
| mshfhi.l %N1, %N2, %0 |
| #" |
| "TARGET_SHMEDIA && reload_completed |
| && ! GENERAL_REGISTER_P (true_regnum (operands[0]))" |
| [(set (match_dup 3) (match_dup 4)) |
| (set (match_dup 5) (match_dup 6))] |
| " |
| { |
| operands[3] = gen_lowpart (SImode, operands[0]); |
| operands[4] = gen_highpart (SImode, operands[1]); |
| operands[5] = gen_highpart (SImode, operands[0]); |
| operands[6] = gen_highpart (SImode, operands[2]); |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "*mshfhi_l_di_rev" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (const_int -4294967296)) |
| (lshiftrt:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (const_int 32))))] |
| "TARGET_SHMEDIA" |
| "mshfhi.l %N2, %N1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_split |
| [(set (match_operand:DI 0 "arith_reg_dest" "") |
| (ior:DI (zero_extend:DI (match_operand:SI 1 |
| "extend_reg_or_0_operand" "")) |
| (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "") |
| (const_int -4294967296)))) |
| (clobber (match_operand:DI 3 "arith_reg_dest" ""))] |
| "TARGET_SHMEDIA" |
| [(const_int 0)] |
| " |
| { |
| emit_insn (gen_ashldi3_media (operands[3], |
| simplify_gen_subreg (DImode, operands[1], |
| SImode, 0), |
| GEN_INT (32))); |
| emit_insn (gen_mshfhi_l_di (operands[0], operands[3], operands[2])); |
| DONE; |
| }") |
| |
| (define_insn "mshflo_l_di" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (const_int 4294967295)) |
| (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (const_int 32))))] |
| |
| "TARGET_SHMEDIA" |
| "mshflo.l %N1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "*mshflo_l_di_rev" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (const_int 32)) |
| (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (const_int 4294967295))))] |
| |
| "TARGET_SHMEDIA" |
| "mshflo.l %N2, %N1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| ;; Combiner pattern for trampoline initialization. |
| (define_insn_and_split "*double_shori" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0") |
| (const_int 32)) |
| (match_operand:DI 2 "const_int_operand" "n")))] |
| "TARGET_SHMEDIA |
| && INTVAL (operands[2]) == trunc_int_for_mode (INTVAL (operands[2]), SImode)" |
| "#" |
| "rtx_equal_p (operands[0], operands[1])" |
| [(const_int 0)] |
| " |
| { |
| HOST_WIDE_INT v = INTVAL (operands[2]); |
| |
| emit_insn (gen_shori_media (operands[0], operands[0], |
| gen_int_mode (INTVAL (operands[2]) >> 16, HImode))); |
| emit_insn (gen_shori_media (operands[0], operands[0], |
| gen_int_mode (v, HImode))); |
| DONE; |
| }") |
| |
| |
| (define_insn "*mshflo_l_di_x" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (zero_extend:DI (match_operand:SI 1 "extend_reg_or_0_operand" |
| "rZ")) |
| (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") |
| (const_int 32))))] |
| |
| "TARGET_SHMEDIA" |
| "mshflo.l %N1, %N2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn_and_split "concat_v2sf" |
| [(set (match_operand:V2SF 0 "register_operand" "=r,f,f?") |
| ;; (vec_concat:V2SF (match_operand:SF 1 "register_operand" "rZ,0,f") |
| (vec_concat:V2SF (match_operand:SF 1 "register_operand" "rZ,f,f") |
| (match_operand:SF 2 "register_operand" "rZ,f,f")))] |
| |
| "TARGET_SHMEDIA" |
| "@ |
| mshflo.l %N1, %N2, %0 |
| # |
| #" |
| "TARGET_SHMEDIA && reload_completed |
| && ! GENERAL_REGISTER_P (true_regnum (operands[0]))" |
| [(set (match_dup 3) (match_dup 1)) |
| (set (match_dup 4) (match_dup 2))] |
| " |
| { |
| operands[3] = simplify_gen_subreg (SFmode, operands[0], V2SFmode, 0); |
| operands[4] = simplify_gen_subreg (SFmode, operands[0], V2SFmode, 4); |
| }" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "*mshflo_l_di_x_rev" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") |
| (const_int 32)) |
| (zero_extend:DI (match_operand:SI 2 "extend_reg_or_0_operand" "rZ"))))] |
| |
| "TARGET_SHMEDIA" |
| "mshflo.l %N2, %N1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "ashlv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ashift:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshlld.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "ashlv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ashift:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshlld.w %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "lshrv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (lshiftrt:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshlrd.l %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "lshrv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (lshiftrt:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") |
| (match_operand:DI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "mshlrd.w %1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "subv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (minus:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "msub.l %N1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "subv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (minus:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "msub.w %N1, %2, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "sssubv2si3" |
| [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") |
| (ss_minus:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V2SI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "msubs.l %N1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "ussubv8qi3" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (us_minus:V8QI (match_operand:V8QI 1 "arith_reg_operand" "r") |
| (match_operand:V8QI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "msubs.ub %1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| (define_insn "sssubv4hi3" |
| [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") |
| (ss_minus:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") |
| (match_operand:V4HI 2 "arith_reg_operand" "r")))] |
| "TARGET_SHMEDIA" |
| "msubs.w %N1, %2, %0" |
| [(set_attr "type" "mcmp_media")]) |
| |
| ;; Floating Point Intrinsics |
| |
| (define_insn "fcosa_s" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (unspec:SF [(match_operand:SI 1 "fp_arith_reg_operand" "f")] |
| UNSPEC_FCOSA))] |
| "TARGET_SHMEDIA" |
| "fcosa.s %1, %0" |
| [(set_attr "type" "atrans_media")]) |
| |
| (define_insn "fsina_s" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (unspec:SF [(match_operand:SI 1 "fp_arith_reg_operand" "f")] |
| UNSPEC_FSINA))] |
| "TARGET_SHMEDIA" |
| "fsina.s %1, %0" |
| [(set_attr "type" "atrans_media")]) |
| |
| (define_insn "fipr" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (plus:SF (plus:SF (vec_select:SF (mult:V4SF (match_operand:V4SF 1 |
| "fp_arith_reg_operand" "f") |
| (match_operand:V4SF 2 |
| "fp_arith_reg_operand" "f")) |
| (parallel [(const_int 0)])) |
| (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) |
| (parallel [(const_int 1)]))) |
| (plus:SF (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) |
| (parallel [(const_int 2)])) |
| (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) |
| (parallel [(const_int 3)])))))] |
| "TARGET_SHMEDIA" |
| "fipr.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "fsrra_s" |
| [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") |
| (unspec:SF [(match_operand:SF 1 "fp_arith_reg_operand" "f")] |
| UNSPEC_FSRRA))] |
| "TARGET_SHMEDIA" |
| "fsrra.s %1, %0" |
| [(set_attr "type" "atrans_media")]) |
| |
| (define_insn "ftrv" |
| [(set (match_operand:V4SF 0 "fp_arith_reg_operand" "=f") |
| (plus:V4SF |
| (plus:V4SF |
| (mult:V4SF |
| (vec_select:V4SF (match_operand:V16SF 1 "fp_arith_reg_operand" "f") |
| (parallel [(const_int 0) (const_int 5) |
| (const_int 10) (const_int 15)])) |
| (match_operand:V4SF 2 "fp_arith_reg_operand" "f")) |
| (mult:V4SF |
| (vec_select:V4SF (match_dup 1) |
| (parallel [(const_int 4) (const_int 9) |
| (const_int 14) (const_int 3)])) |
| (vec_select:V4SF (match_dup 2) |
| (parallel [(const_int 1) (const_int 2) |
| (const_int 3) (const_int 0)])))) |
| (plus:V4SF |
| (mult:V4SF |
| (vec_select:V4SF (match_dup 1) |
| (parallel [(const_int 8) (const_int 13) |
| (const_int 2) (const_int 7)])) |
| (vec_select:V4SF (match_dup 2) |
| (parallel [(const_int 2) (const_int 3) |
| (const_int 0) (const_int 1)]))) |
| (mult:V4SF |
| (vec_select:V4SF (match_dup 1) |
| (parallel [(const_int 12) (const_int 1) |
| (const_int 6) (const_int 11)])) |
| (vec_select:V4SF (match_dup 2) |
| (parallel [(const_int 3) (const_int 0) |
| (const_int 1) (const_int 2)]))))))] |
| "TARGET_SHMEDIA" |
| "ftrv.s %1, %2, %0" |
| [(set_attr "type" "fparith_media")]) |
| |
| (define_insn "nsb" |
| [(set (match_operand:QI 0 "arith_reg_dest" "=r") |
| (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] |
| UNSPEC_NSB))] |
| "TARGET_SHMEDIA" |
| "nsb %1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "nsbsi" |
| [(set (match_operand:SI 0 "arith_reg_dest" "=r") |
| (zero_extend:SI |
| (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] |
| UNSPEC_NSB)))] |
| "TARGET_SHMEDIA" |
| "nsb %1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "nsbdi" |
| [(set (match_operand:DI 0 "arith_reg_dest" "=r") |
| (zero_extend:DI |
| (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] |
| UNSPEC_NSB)))] |
| "TARGET_SHMEDIA" |
| "nsb %1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_expand "ffsdi2" |
| [(set (match_operand:DI 0 "arith_reg_dest" "") |
| (ffs:DI (match_operand:DI 1 "arith_reg_operand" "")))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| rtx scratch = gen_reg_rtx (DImode); |
| rtx last; |
| |
| emit_insn (gen_adddi3 (scratch, operands[1], GEN_INT (-1))); |
| emit_insn (gen_xordi3 (scratch, operands[1], scratch)); |
| emit_insn (gen_lshrdi3_media (scratch, scratch, const1_rtx)); |
| emit_insn (gen_nsbdi (scratch, scratch)); |
| emit_insn (gen_adddi3 (scratch, scratch, GEN_INT (-64))); |
| emit_insn (gen_movdicc_false (scratch, operands[1], const0_rtx, scratch)); |
| last = emit_insn (gen_subdi3 (operands[0], const0_rtx, scratch)); |
| REG_NOTES (last) |
| = gen_rtx_EXPR_LIST (REG_EQUAL, |
| gen_rtx_FFS (DImode, operands[0]), REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_expand "ffssi2" |
| [(set (match_operand:SI 0 "arith_reg_dest" "") |
| (ffs:SI (match_operand:SI 1 "arith_reg_operand" "")))] |
| "TARGET_SHMEDIA" |
| " |
| { |
| rtx scratch = gen_reg_rtx (SImode); |
| rtx discratch = gen_reg_rtx (DImode); |
| rtx last; |
| |
| emit_insn (gen_adddi3 (discratch, |
| simplify_gen_subreg (DImode, operands[1], SImode, 0), |
| GEN_INT (-1))); |
| emit_insn (gen_andcdi3 (discratch, |
| simplify_gen_subreg (DImode, operands[1], SImode, 0), |
| discratch)); |
| emit_insn (gen_nsbsi (scratch, discratch)); |
| last = emit_insn (gen_subsi3 (operands[0], |
| force_reg (SImode, GEN_INT (63)), scratch)); |
| REG_NOTES (last) |
| = gen_rtx_EXPR_LIST (REG_EQUAL, |
| gen_rtx_FFS (SImode, operands[0]), REG_NOTES (last)); |
| DONE; |
| }") |
| |
| (define_insn "byterev" |
| [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") |
| (vec_select:V8QI (match_operand:V8QI 1 "arith_reg_operand" "r") |
| (parallel [(const_int 7) (const_int 6) (const_int 5) |
| (const_int 4) (const_int 3) (const_int 2) |
| (const_int 1) (const_int 0)])))] |
| "TARGET_SHMEDIA" |
| "byterev %1, %0" |
| [(set_attr "type" "arith_media")]) |
| |
| (define_insn "prefetch" |
| [(prefetch (match_operand:QI 0 "address_operand" "p") |
| (match_operand:SI 1 "const_int_operand" "n") |
| (match_operand:SI 2 "const_int_operand" "n"))] |
| "TARGET_SHMEDIA" |
| "* |
| { |
| operands[0] = gen_rtx_MEM (QImode, operands[0]); |
| output_asm_insn (\"ld%M0.b %m0,r63\", operands); |
| return \"\"; |
| }" |
| [(set_attr "type" "other")]) |
| |
| ;; The following description models the |
| ;; SH4 pipeline using the DFA based scheduler. |
| ;; The DFA based description is better way to model |
| ;; a superscalar pipeline as compared to function unit |
| ;; reservation model. |
| ;; 1. The function unit based model is oriented to describe at most one |
| ;; unit reservation by each insn. It is difficult to model unit reservations in multiple |
| ;; pipeline units by same insn. This can be done using DFA based description. |
| ;; 2. The execution performance of DFA based scheduler does not depend on processor complexity. |
| ;; 3. Writing all unit reservations for an instruction class is more natural description |
| ;; of the pipeline and makes interface of the hazard recognizer simpler than the |
| ;; old function unit based model. |
| ;; 4. The DFA model is richer and is a part of greater overall framework of RCSP. |
| |
| |
| ;; Two automata are defined to reduce number of states |
| ;; which a single large automaton will have.(Factoring) |
| |
| (define_automaton "inst_pipeline,fpu_pipe") |
| |
| ;; This unit is basically the decode unit of the processor. |
| ;; Since SH4 is a dual issue machine,it is as if there are two |
| ;; units so that any insn can be processed by either one |
| ;; of the decoding unit. |
| |
| (define_cpu_unit "pipe_01,pipe_02" "inst_pipeline") |
| |
| |
| ;; The fixed point arithmetic calculator(?? EX Unit). |
| |
| (define_cpu_unit "int" "inst_pipeline") |
| |
| ;; f1_1 and f1_2 are floating point units.Actually there is |
| ;; a f1 unit which can overlap with other f1 unit but |
| ;; not another F1 unit.It is as though there were two |
| ;; f1 units. |
| |
| (define_cpu_unit "f1_1,f1_2" "fpu_pipe") |
| |
| ;; The floating point units (except FS - F2 always precedes it.) |
| |
| (define_cpu_unit "F0,F1,F2,F3" "fpu_pipe") |
| |
| ;; This is basically the MA unit of SH4 |
| ;; used in LOAD/STORE pipeline. |
| |
| (define_cpu_unit "memory" "inst_pipeline") |
| |
| ;; However, there are LS group insns that don't use it, even ones that |
| ;; complete in 0 cycles. So we use an extra unit for the issue of LS insns. |
| (define_cpu_unit "load_store" "inst_pipeline") |
| |
| ;; The address calculator used for branch instructions. |
| ;; This will be reserved after "issue" of branch instructions |
| ;; and this is to make sure that no two branch instructions |
| ;; can be issued in parallel. |
| |
| (define_cpu_unit "pcr_addrcalc" "inst_pipeline") |
| |
| ;; ---------------------------------------------------- |
| ;; This reservation is to simplify the dual issue description. |
| |
| (define_reservation "issue" "pipe_01|pipe_02") |
| |
| ;; This is to express the locking of D stage. |
| ;; Note that the issue of a CO group insn also effectively locks the D stage. |
| |
| (define_reservation "d_lock" "pipe_01+pipe_02") |
| |
| ;; Every FE instruction but fipr / ftrv starts with issue and this. |
| (define_reservation "F01" "F0+F1") |
| |
| ;; This is to simplify description where F1,F2,FS |
| ;; are used simultaneously. |
| |
| (define_reservation "fpu" "F1+F2") |
| |
| ;; This is to highlight the fact that f1 |
| ;; cannot overlap with F1. |
| |
| (exclusion_set "f1_1,f1_2" "F1") |
| |
| (define_insn_reservation "nil" 0 (eq_attr "type" "nil") "nothing") |
| |
| ;; Although reg moves have a latency of zero |
| ;; we need to highlight that they use D stage |
| ;; for one cycle. |
| |
| ;; Group: MT |
| |
| (define_insn_reservation "reg_mov" 0 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "move")) |
| "issue") |
| |
| ;; Group: LS |
| |
| (define_insn_reservation "freg_mov" 0 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "fmove")) |
| "issue+load_store") |
| |
| ;; We don't model all pipeline stages; we model the issue ('D') stage |
| ;; inasmuch as we allow only two instructions to issue simultaneously, |
| ;; and CO instructions prevent any simultaneous issue of another instruction. |
| ;; (This uses pipe_01 and pipe_02). |
| ;; Double issue of EX insns is prevented by using the int unit in the EX stage. |
| ;; Double issue of EX / BR insns is prevented by using the int unit / |
| ;; pcr_addrcalc unit in the EX stage. |
| ;; Double issue of BR / LS instructions is prevented by using the |
| ;; pcr_addrcalc / load_store unit in the issue cycle. |
| ;; Double issue of FE instructions is prevented by using F0 in the first |
| ;; pipeline stage after the first D stage. |
| ;; There is no need to describe the [ES]X / [MN]A / S stages after a D stage |
| ;; (except in the cases outlined above), nor to describe the FS stage after |
| ;; the F2 stage. |
| |
| ;; Other MT group instructions(1 step operations) |
| ;; Group: MT |
| ;; Latency: 1 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "mt" 1 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "mt_group")) |
| "issue") |
| |
| ;; Fixed Point Arithmetic Instructions(1 step operations) |
| ;; Group: EX |
| ;; Latency: 1 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "sh4_simple_arith" 1 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "insn_class" "ex_group")) |
| "issue,int") |
| |
| ;; Load and store instructions have no alignment peculiarities for the SH4, |
| ;; but they use the load-store unit, which they share with the fmove type |
| ;; insns (fldi[01]; fmov frn,frm; flds; fsts; fabs; fneg) . |
| ;; Loads have a latency of two. |
| ;; However, call insns can only paired with a preceding insn, and have |
| ;; a delay slot, so that we want two more insns to be scheduled between the |
| ;; load of the function address and the call. This is equivalent to a |
| ;; latency of three. |
| ;; ADJUST_COST can only properly handle reductions of the cost, so we |
| ;; use a latency of three here, which gets multiplied by 10 to yield 30. |
| ;; We only do this for SImode loads of general registers, to make the work |
| ;; for ADJUST_COST easier. |
| |
| ;; Load Store instructions. (MOV.[BWL]@(d,GBR) |
| ;; Group: LS |
| ;; Latency: 2 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "sh4_load" 2 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "load,pcload")) |
| "issue+load_store,nothing,memory") |
| |
| ;; calls / sfuncs need an extra instruction for their delay slot. |
| ;; Moreover, estimating the latency for SImode loads as 3 will also allow |
| ;; adjust_cost to meaningfully bump it back up to 3 if they load the shift |
| ;; count of a dynamic shift. |
| (define_insn_reservation "sh4_load_si" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "load_si,pcload_si")) |
| "issue+load_store,nothing,memory") |
| |
| ;; (define_bypass 2 "sh4_load_si" "!sh4_call") |
| |
| ;; The load latency is upped to three higher if the dependent insn does |
| ;; double precision computation. We want the 'default' latency to reflect |
| ;; that increased latency because otherwise the insn priorities won't |
| ;; allow proper scheduling. |
| (define_insn_reservation "sh4_fload" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "fload,pcfload")) |
| "issue+load_store,nothing,memory") |
| |
| ;; (define_bypass 2 "sh4_fload" "!") |
| |
| (define_insn_reservation "sh4_store" 1 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "store")) |
| "issue+load_store,nothing,memory") |
| |
| ;; Load Store instructions. |
| ;; Group: LS |
| ;; Latency: 1 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "sh4_gp_fpul" 1 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "gp_fpul")) |
| "issue+load_store") |
| |
| ;; Load Store instructions. |
| ;; Group: LS |
| ;; Latency: 3 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "sh4_fpul_gp" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "fpul_gp")) |
| "issue+load_store") |
| |
| ;; Branch (BF,BF/S,BT,BT/S,BRA) |
| ;; Group: BR |
| ;; Latency when taken: 2 (or 1) |
| ;; Issue Rate: 1 |
| ;; The latency is 1 when displacement is 0. |
| ;; We can't really do much with the latency, even if we could express it, |
| ;; but the pairing restrictions are useful to take into account. |
| ;; ??? If the branch is likely, we might want to fill the delay slot; |
| ;; if the branch is likely, but not very likely, should we pretend to use |
| ;; a resource that CO instructions use, to get a pairable delay slot insn? |
| |
| (define_insn_reservation "sh4_branch" 1 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "cbranch,jump")) |
| "issue+pcr_addrcalc") |
| |
| ;; Branch Far (JMP,RTS,BRAF) |
| ;; Group: CO |
| ;; Latency: 3 |
| ;; Issue Rate: 2 |
| ;; ??? Scheduling happens before branch shortening, and hence jmp and braf |
| ;; can't be distinguished from bra for the "jump" pattern. |
| |
| (define_insn_reservation "sh4_return" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "return,jump_ind")) |
| "d_lock*2") |
| |
| ;; RTE |
| ;; Group: CO |
| ;; Latency: 5 |
| ;; Issue Rate: 5 |
| ;; this instruction can be executed in any of the pipelines |
| ;; and blocks the pipeline for next 4 stages. |
| |
| (define_insn_reservation "sh4_return_from_exp" 5 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "rte")) |
| "d_lock*5") |
| |
| ;; OCBP, OCBWB |
| ;; Group: CO |
| ;; Latency: 1-5 |
| ;; Issue Rate: 1 |
| |
| ;; cwb is used for the sequence ocbwb @%0; extu.w %0,%2; or %1,%2; mov.l %0,@%2 |
| ;; ocbwb on its own would be "d_lock,nothing,memory*5" |
| (define_insn_reservation "ocbwb" 6 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "cwb")) |
| "d_lock*2,(d_lock+memory)*3,issue+load_store+memory,memory*2") |
| |
| ;; LDS to PR,JSR |
| ;; Group: CO |
| ;; Latency: 3 |
| ;; Issue Rate: 2 |
| ;; The SX stage is blocked for last 2 cycles. |
| ;; OTOH, the only time that has an effect for insns generated by the compiler |
| ;; is when lds to PR is followed by sts from PR - and that is highly unlikely - |
| ;; or when we are doing a function call - and we don't do inter-function |
| ;; scheduling. For the function call case, it's really best that we end with |
| ;; something that models an rts. |
| |
| (define_insn_reservation "sh4_lds_to_pr" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "prset") ) |
| "d_lock*2") |
| |
| ;; calls introduce a longisch delay that is likely to flush the pipelines |
| ;; of the caller's instructions. Ordinary functions tend to end with a |
| ;; load to restore a register (in the delay slot of rts), while sfuncs |
| ;; tend to end with an EX or MT insn. But that is not actually relevant, |
| ;; since there are no instructions that contend for memory access early. |
| ;; We could, of course, provide exact scheduling information for specific |
| ;; sfuncs, if that should prove useful. |
| |
| (define_insn_reservation "sh4_call" 16 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "call,sfunc")) |
| "d_lock*16") |
| |
| ;; LDS.L to PR |
| ;; Group: CO |
| ;; Latency: 3 |
| ;; Issue Rate: 2 |
| ;; The SX unit is blocked for last 2 cycles. |
| |
| (define_insn_reservation "ldsmem_to_pr" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "pload")) |
| "d_lock*2") |
| |
| ;; STS from PR |
| ;; Group: CO |
| ;; Latency: 2 |
| ;; Issue Rate: 2 |
| ;; The SX unit in second and third cycles. |
| |
| (define_insn_reservation "sts_from_pr" 2 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "prget")) |
| "d_lock*2") |
| |
| ;; STS.L from PR |
| ;; Group: CO |
| ;; Latency: 2 |
| ;; Issue Rate: 2 |
| |
| (define_insn_reservation "sh4_prstore_mem" 2 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "pstore")) |
| "d_lock*2,nothing,memory") |
| |
| ;; LDS to FPSCR |
| ;; Group: CO |
| ;; Latency: 4 |
| ;; Issue Rate: 1 |
| ;; F1 is blocked for last three cycles. |
| |
| (define_insn_reservation "fpscr_load" 4 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "gp_fpscr")) |
| "d_lock,nothing,F1*3") |
| |
| ;; LDS.L to FPSCR |
| ;; Group: CO |
| ;; Latency: 1 / 4 |
| ;; Latency to update Rn is 1 and latency to update FPSCR is 4 |
| ;; Issue Rate: 1 |
| ;; F1 is blocked for last three cycles. |
| |
| (define_insn_reservation "fpscr_load_mem" 4 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "mem_fpscr")) |
| "d_lock,nothing,(F1+memory),F1*2") |
| |
| |
| ;; Fixed point multiplication (DMULS.L DMULU.L MUL.L MULS.W,MULU.W) |
| ;; Group: CO |
| ;; Latency: 4 / 4 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "multi" 4 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "smpy,dmpy")) |
| "d_lock,(d_lock+f1_1),(f1_1|f1_2)*3,F2") |
| |
| ;; Fixed STS from MACL / MACH |
| ;; Group: CO |
| ;; Latency: 3 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "sh4_mac_gp" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "mac_gp")) |
| "d_lock") |
| |
| |
| ;; Single precision floating point computation FCMP/EQ, |
| ;; FCMP/GT, FADD, FLOAT, FMAC, FMUL, FSUB, FTRC, FRVHG, FSCHG |
| ;; Group: FE |
| ;; Latency: 3/4 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "fp_arith" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "fp")) |
| "issue,F01,F2") |
| |
| (define_insn_reservation "fp_arith_ftrc" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "ftrc_s")) |
| "issue,F01,F2") |
| |
| (define_bypass 1 "fp_arith_ftrc" "sh4_fpul_gp") |
| |
| ;; Single Precision FDIV/SQRT |
| ;; Group: FE |
| ;; Latency: 12/13 (FDIV); 11/12 (FSQRT) |
| ;; Issue Rate: 1 |
| ;; We describe fdiv here; fsqrt is actually one cycle faster. |
| |
| (define_insn_reservation "fp_div" 12 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "fdiv")) |
| "issue,F01+F3,F2+F3,F3*7,F1+F3,F2") |
| |
| ;; Double Precision floating point computation |
| ;; (FCNVDS, FCNVSD, FLOAT, FTRC) |
| ;; Group: FE |
| ;; Latency: (3,4)/5 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "dp_float" 4 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "dfp_conv")) |
| "issue,F01,F1+F2,F2") |
| |
| ;; Double-precision floating-point (FADD,FMUL,FSUB) |
| ;; Group: FE |
| ;; Latency: (7,8)/9 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "fp_double_arith" 8 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "dfp_arith")) |
| "issue,F01,F1+F2,fpu*4,F2") |
| |
| ;; Double-precision FCMP (FCMP/EQ,FCMP/GT) |
| ;; Group: CO |
| ;; Latency: 3/5 |
| ;; Issue Rate: 2 |
| |
| (define_insn_reservation "fp_double_cmp" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "dfp_cmp")) |
| "d_lock,(d_lock+F01),F1+F2,F2") |
| |
| ;; Double precision FDIV/SQRT |
| ;; Group: FE |
| ;; Latency: (24,25)/26 |
| ;; Issue Rate: 1 |
| |
| (define_insn_reservation "dp_div" 25 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "dfdiv")) |
| "issue,F01+F3,F1+F2+F3,F2+F3,F3*16,F1+F3,(fpu+F3)*2,F2") |
| |
| |
| ;; Use the branch-not-taken case to model arith3 insns. For the branch taken |
| ;; case, we'd get a d_lock instead of issue at the end. |
| (define_insn_reservation "arith3" 3 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "arith3")) |
| "issue,d_lock+pcr_addrcalc,issue") |
| |
| ;; arith3b insns schedule the same no matter if the branch is taken or not. |
| (define_insn_reservation "arith3b" 2 |
| (and (eq_attr "pipe_model" "sh4") |
| (eq_attr "type" "arith3")) |
| "issue,d_lock+pcr_addrcalc") |