;;- Machine description for Renesas / SuperH SH. ;; Copyright (C) 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, ;; 2003, 2004 Free Software Foundation, Inc. ;; Contributed by Steve Chamberlain (sac@cygnus.com). ;; Improved by Jim Wilson (wilson@cygnus.com). ;; This file is part of GCC. ;; GCC is free software; you can redistribute it and/or modify ;; it under the terms of the GNU General Public License as published by ;; the Free Software Foundation; either version 2, or (at your option) ;; any later version. ;; GCC is distributed in the hope that it will be useful, ;; but WITHOUT ANY WARRANTY; without even the implied warranty of ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ;; GNU General Public License for more details. ;; You should have received a copy of the GNU General Public License ;; along with GCC; see the file COPYING. If not, write to ;; the Free Software Foundation, 59 Temple Place - Suite 330, ;; Boston, MA 02111-1307, USA. ;; ??? Should prepend a * to all pattern names which are not used. ;; This will make the compiler smaller, and rebuilds after changes faster. ;; ??? Should be enhanced to include support for many more GNU superoptimizer ;; sequences. Especially the sequences for arithmetic right shifts. ;; ??? Should check all DImode patterns for consistency and usefulness. ;; ??? The MAC.W and MAC.L instructions are not supported. There is no ;; way to generate them. ;; ??? The cmp/str instruction is not supported. Perhaps it can be used ;; for a str* inline function. ;; BSR is not generated by the compiler proper, but when relaxing, it ;; generates .uses pseudo-ops that allow linker relaxation to create ;; BSR. This is actually implemented in bfd/{coff,elf32}-sh.c ;; Special constraints for SH machine description: ;; ;; t -- T ;; x -- mac ;; l -- pr ;; z -- r0 ;; ;; Special formats used for outputting SH instructions: ;; ;; %. -- print a .s if insn needs delay slot ;; %@ -- print rte/rts if is/isn't an interrupt function ;; %# -- output a nop if there is nothing to put in the delay slot ;; %O -- print a constant without the # ;; %R -- print the lsw reg of a double ;; %S -- print the msw reg of a double ;; %T -- print next word of a double REG or MEM ;; ;; Special predicates: ;; ;; arith_operand -- operand is valid source for arithmetic op ;; arith_reg_operand -- operand is valid register for arithmetic op ;; general_movdst_operand -- operand is valid move destination ;; general_movsrc_operand -- operand is valid move source ;; logical_operand -- operand is valid source for logical op ;; ------------------------------------------------------------------------- ;; Constants ;; ------------------------------------------------------------------------- (define_constants [ (AP_REG 145) (PR_REG 146) (T_REG 147) (GBR_REG 144) (MACH_REG 148) (MACL_REG 149) (FPUL_REG 150) (RAP_REG 152) (FPSCR_REG 151) (PIC_REG 12) (FP_REG 14) (SP_REG 15) (PR_MEDIA_REG 18) (T_MEDIA_REG 19) (R0_REG 0) (R1_REG 1) (R2_REG 2) (R3_REG 3) (R4_REG 4) (R5_REG 5) (R6_REG 6) (R7_REG 7) (R8_REG 8) (R9_REG 9) (R10_REG 10) (R20_REG 20) (R21_REG 21) (R22_REG 22) (R23_REG 23) (DR0_REG 64) (DR2_REG 66) (DR4_REG 68) (FR23_REG 87) (TR0_REG 128) (TR1_REG 129) (TR2_REG 130) (XD0_REG 136) ;; These are used with unspec. (UNSPEC_COMPACT_ARGS 0) (UNSPEC_MOVA 1) (UNSPEC_CASESI 2) (UNSPEC_DATALABEL 3) (UNSPEC_BBR 4) (UNSPEC_SFUNC 5) (UNSPEC_PIC 6) (UNSPEC_GOT 7) (UNSPEC_GOTOFF 8) (UNSPEC_PLT 9) (UNSPEC_CALLER 10) (UNSPEC_GOTPLT 11) (UNSPEC_ICACHE 12) (UNSPEC_INIT_TRAMP 13) (UNSPEC_FCOSA 14) (UNSPEC_FSRRA 15) (UNSPEC_FSINA 16) (UNSPEC_NSB 17) (UNSPEC_ALLOCO 18) (UNSPEC_EH_RETURN 19) (UNSPEC_TLSGD 20) (UNSPEC_TLSLDM 21) (UNSPEC_TLSIE 22) (UNSPEC_DTPOFF 23) (UNSPEC_GOTTPOFF 24) (UNSPEC_TPOFF 25) (UNSPEC_RA 26) ;; These are used with unspec_volatile. (UNSPECV_BLOCKAGE 0) (UNSPECV_ALIGN 1) (UNSPECV_CONST2 2) (UNSPECV_CONST4 4) (UNSPECV_CONST8 6) (UNSPECV_WINDOW_END 10) (UNSPECV_CONST_END 11) ]) ;; ------------------------------------------------------------------------- ;; Attributes ;; ------------------------------------------------------------------------- ;; Target CPU. (define_attr "cpu" "sh1,sh2,sh2e,sh3,sh3e,sh4,sh5" (const (symbol_ref "sh_cpu_attr"))) (define_attr "endian" "big,little" (const (if_then_else (symbol_ref "TARGET_LITTLE_ENDIAN") (const_string "little") (const_string "big")))) ;; Indicate if the default fpu mode is single precision. (define_attr "fpu_single" "yes,no" (const (if_then_else (symbol_ref "TARGET_FPU_SINGLE") (const_string "yes") (const_string "no")))) (define_attr "fmovd" "yes,no" (const (if_then_else (symbol_ref "TARGET_FMOVD") (const_string "yes") (const_string "no")))) ;; pipeline model (define_attr "pipe_model" "sh1,sh4,sh5media" (const (cond [(symbol_ref "TARGET_SHMEDIA") (const_string "sh5media") (symbol_ref "TARGET_SUPERSCALAR") (const_string "sh4")] (const_string "sh1")))) ;; cbranch conditional branch instructions ;; jump unconditional jumps ;; arith ordinary arithmetic ;; arith3 a compound insn that behaves similarly to a sequence of ;; three insns of type arith ;; arith3b like above, but might end with a redirected branch ;; load from memory ;; load_si Likewise, SImode variant for general register. ;; fload Likewise, but load to fp register. ;; store to memory ;; move general purpose register to register ;; mt_group other sh4 mt instructions ;; fmove register to register, floating point ;; smpy word precision integer multiply ;; dmpy longword or doublelongword precision integer multiply ;; return rts ;; pload load of pr reg, which can't be put into delay slot of rts ;; prset copy register to pr reg, ditto ;; pstore store of pr reg, which can't be put into delay slot of jsr ;; prget copy pr to register, ditto ;; pcload pc relative load of constant value ;; pcfload Likewise, but load to fp register. ;; pcload_si Likewise, SImode variant for general register. ;; rte return from exception ;; sfunc special function call with known used registers ;; call function call ;; fp floating point ;; fdiv floating point divide (or square root) ;; gp_fpul move from general purpose register to fpul ;; fpul_gp move from fpul to general purpose register ;; mac_gp move from mac[lh] to general purpose register ;; dfp_arith, dfp_cmp,dfp_conv ;; ftrc_s fix_truncsfsi2_i4 ;; dfdiv double precision floating point divide (or square root) ;; cwb ic_invalidate_line_i ;; tls_load load TLS related address ;; arith_media SHmedia arithmetic, logical, and shift instructions ;; cbranch_media SHmedia conditional branch instructions ;; cmp_media SHmedia compare instructions ;; dfdiv_media SHmedia double precision divide and square root ;; dfmul_media SHmedia double precision multiply instruction ;; dfparith_media SHmedia double precision floating point arithmetic ;; dfpconv_media SHmedia double precision floating point conversions ;; dmpy_media SHmedia longword multiply ;; fcmp_media SHmedia floating point compare instructions ;; fdiv_media SHmedia single precision divide and square root ;; fload_media SHmedia floating point register load instructions ;; fmove_media SHmedia floating point register moves (inc. fabs and fneg) ;; fparith_media SHmedia single precision floating point arithmetic ;; fpconv_media SHmedia single precision floating point conversions ;; fstore_media SHmedia floating point register store instructions ;; gettr_media SHmedia gettr instruction ;; invalidate_line_media SHmedia invalidate_line sequence ;; jump_media SHmedia unconditional branch instructions ;; load_media SHmedia general register load instructions ;; pt_media SHmedia pt instruction (expanded by assembler) ;; ptabs_media SHmedia ptabs instruction ;; store_media SHmedia general register store instructions ;; mcmp_media SHmedia multimedia compare, absolute, saturating ops ;; mac_media SHmedia mac-style fixed point operations ;; d2mpy_media SHmedia: two 32 bit integer multiplies ;; atrans SHmedia approximate transcendental functions ;; ustore_media SHmedia unaligned stores ;; nil no-op move, will be deleted. (define_attr "type" "mt_group,cbranch,jump,jump_ind,arith,arith3,arith3b,dyn_shift,load,load_si,fload,store,move,fmove,smpy,dmpy,return,pload,prset,pstore,prget,pcload,pcload_si,pcfload,rte,sfunc,call,fp,fdiv,ftrc_s,dfp_arith,dfp_cmp,dfp_conv,dfdiv,gp_fpul,fpul_gp,mac_gp,mem_fpscr,gp_fpscr,cwb,tls_load,arith_media,cbranch_media,cmp_media,dfdiv_media,dfmul_media,dfparith_media,dfpconv_media,dmpy_media,fcmp_media,fdiv_media,fload_media,fmove_media,fparith_media,fpconv_media,fstore_media,gettr_media,invalidate_line_media,jump_media,load_media,pt_media,ptabs_media,store_media,mcmp_media,mac_media,d2mpy_media,atrans_media,ustore_media,nil,other" (const_string "other")) ;; We define a new attribute namely "insn_class".We use ;; this for the DFA based pipeline description. ;; ;; mt_group SH4 "mt" group instructions. ;; ;; ex_group SH4 "ex" group instructions. ;; ;; ls_group SH4 "ls" group instructions. ;; (define_attr "insn_class" "mt_group,ex_group,ls_group,br_group,fe_group,co_group,none" (cond [(eq_attr "type" "move,mt_group") (const_string "mt_group") (eq_attr "type" "arith,dyn_shift") (const_string "ex_group") (eq_attr "type" "fmove,load,pcload,load_si,pcload_si,fload,pcfload,store,gp_fpul,fpul_gp") (const_string "ls_group") (eq_attr "type" "cbranch,jump") (const_string "br_group") (eq_attr "type" "fp,fdiv,ftrc_s,dfp_arith,dfp_conv,dfdiv") (const_string "fe_group") (eq_attr "type" "jump_ind,smpy,dmpy,mac_gp,return,pload,prset,pstore,prget,rte,sfunc,call,dfp_cmp,mem_fpscr,gp_fpscr,cwb") (const_string "co_group")] (const_string "none"))) ;; nil are zero instructions, and arith3 / arith3b are multiple instructions, ;; so these do not belong in an insn group, although they are modeled ;; with their own define_insn_reservations. ;; Indicate what precision must be selected in fpscr for this insn, if any. (define_attr "fp_mode" "single,double,none" (const_string "none")) ;; Indicate if the fpu mode is set by this instruction ;; "unknown" must have the value as "none" in fp_mode, and means ;; that the instruction/abi has left the processor in an unknown ;; state. ;; "none" means that nothing has changed and no mode is set. ;; This attribute is only used for the Renesas ABI. (define_attr "fp_set" "single,double,unknown,none" (const_string "none")) ; If a conditional branch destination is within -252..258 bytes away ; from the instruction it can be 2 bytes long. Something in the ; range -4090..4100 bytes can be 6 bytes long. All other conditional ; branches are initially assumed to be 16 bytes long. ; In machine_dependent_reorg, we split all branches that are longer than ; 2 bytes. ;; The maximum range used for SImode constant pool entries is 1018. A final ;; instruction can add 8 bytes while only being 4 bytes in size, thus we ;; can have a total of 1022 bytes in the pool. Add 4 bytes for a branch ;; instruction around the pool table, 2 bytes of alignment before the table, ;; and 30 bytes of alignment after the table. That gives a maximum total ;; pool size of 1058 bytes. ;; Worst case code/pool content size ratio is 1:2 (using asms). ;; Thus, in the worst case, there is one instruction in front of a maximum ;; sized pool, and then there are 1052 bytes of pool for every 508 bytes of ;; code. For the last n bytes of code, there are 2n + 36 bytes of pool. ;; If we have a forward branch, the initial table will be put after the ;; unconditional branch. ;; ;; ??? We could do much better by keeping track of the actual pcloads within ;; the branch range and in the pcload range in front of the branch range. ;; ??? This looks ugly because genattrtab won't allow if_then_else or cond ;; inside an le. (define_attr "short_cbranch_p" "no,yes" (cond [(ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 252)) (const_int 506)) (const_string "yes") (ne (symbol_ref "NEXT_INSN (PREV_INSN (insn)) != insn") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 252)) (const_int 508)) (const_string "yes") ] (const_string "no"))) (define_attr "med_branch_p" "no,yes" (cond [(leu (plus (minus (match_dup 0) (pc)) (const_int 990)) (const_int 1988)) (const_string "yes") (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 4092)) (const_int 8186)) (const_string "yes") ] (const_string "no"))) (define_attr "med_cbranch_p" "no,yes" (cond [(leu (plus (minus (match_dup 0) (pc)) (const_int 988)) (const_int 1986)) (const_string "yes") (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 4090)) (const_int 8184)) (const_string "yes") ] (const_string "no"))) (define_attr "braf_branch_p" "no,yes" (cond [(ne (symbol_ref "! TARGET_SH2") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 10330)) (const_int 20660)) (const_string "yes") (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 32764)) (const_int 65530)) (const_string "yes") ] (const_string "no"))) (define_attr "braf_cbranch_p" "no,yes" (cond [(ne (symbol_ref "! TARGET_SH2") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 10328)) (const_int 20658)) (const_string "yes") (ne (symbol_ref "mdep_reorg_phase <= SH_FIXUP_PCLOAD") (const_int 0)) (const_string "no") (leu (plus (minus (match_dup 0) (pc)) (const_int 32762)) (const_int 65528)) (const_string "yes") ] (const_string "no"))) ; An unconditional jump in the range -4092..4098 can be 2 bytes long. ; For wider ranges, we need a combination of a code and a data part. ; If we can get a scratch register for a long range jump, the code ; part can be 4 bytes long; otherwise, it must be 8 bytes long. ; If the jump is in the range -32764..32770, the data part can be 2 bytes ; long; otherwise, it must be 6 bytes long. ; All other instructions are two bytes long by default. ;; ??? This should use something like *branch_p (minus (match_dup 0) (pc)), ;; but getattrtab doesn't understand this. (define_attr "length" "" (cond [(eq_attr "type" "cbranch") (cond [(eq_attr "short_cbranch_p" "yes") (const_int 2) (eq_attr "med_cbranch_p" "yes") (const_int 6) (eq_attr "braf_cbranch_p" "yes") (const_int 12) ;; ??? using pc is not computed transitively. (ne (match_dup 0) (match_dup 0)) (const_int 14) (ne (symbol_ref ("flag_pic")) (const_int 0)) (const_int 24) ] (const_int 16)) (eq_attr "type" "jump") (cond [(eq_attr "med_branch_p" "yes") (const_int 2) (and (eq (symbol_ref "GET_CODE (prev_nonnote_insn (insn))") (symbol_ref "INSN")) (eq (symbol_ref "INSN_CODE (prev_nonnote_insn (insn))") (symbol_ref "code_for_indirect_jump_scratch"))) (if_then_else (eq_attr "braf_branch_p" "yes") (const_int 6) (const_int 10)) (eq_attr "braf_branch_p" "yes") (const_int 10) ;; ??? using pc is not computed transitively. (ne (match_dup 0) (match_dup 0)) (const_int 12) (ne (symbol_ref ("flag_pic")) (const_int 0)) (const_int 22) ] (const_int 14)) (eq_attr "type" "pt_media") (if_then_else (ne (symbol_ref "TARGET_SHMEDIA64") (const_int 0)) (const_int 20) (const_int 12)) ] (if_then_else (ne (symbol_ref "TARGET_SHMEDIA") (const_int 0)) (const_int 4) (const_int 2)))) ;; (define_function_unit {name} {num-units} {n-users} {test} ;; {ready-delay} {issue-delay} [{conflict-list}]) ;; Load and store instructions save a cycle if they are aligned on a ;; four byte boundary. Using a function unit for stores encourages ;; gcc to separate load and store instructions by one instruction, ;; which makes it more likely that the linker will be able to word ;; align them when relaxing. ;; Loads have a latency of two. ;; However, call insns can have a delay slot, so that we want one more ;; insn to be scheduled between the load of the function address and the call. ;; This is equivalent to a latency of three. ;; We cannot use a conflict list for this, because we need to distinguish ;; between the actual call address and the function arguments. ;; ADJUST_COST can only properly handle reductions of the cost, so we ;; use a latency of three here. ;; We only do this for SImode loads of general registers, to make the work ;; for ADJUST_COST easier. (define_function_unit "memory" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "load_si,pcload_si")) 3 2) (define_function_unit "memory" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "load,pcload,pload,store,pstore")) 2 2) (define_function_unit "int" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "arith3,arith3b")) 3 3) (define_function_unit "int" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "dyn_shift")) 2 2) (define_function_unit "int" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "!arith3,arith3b,dyn_shift")) 1 1) ;; ??? These are approximations. (define_function_unit "mpy" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "smpy")) 2 2) (define_function_unit "mpy" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "dmpy")) 3 3) (define_function_unit "fp" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "fp,fmove")) 2 1) (define_function_unit "fp" 1 0 (and (eq_attr "pipe_model" "sh1") (eq_attr "type" "fdiv")) 13 12) ;; SH-5 SHmedia scheduling ;; When executing SHmedia code, the SH-5 is a fairly straightforward ;; single-issue machine. It has four pipelines, the branch unit (br), ;; the integer and multimedia unit (imu), the load/store unit (lsu), and ;; the floating point unit (fpu). ;; Here model the instructions with a latency greater than one cycle. ;; Every instruction on SH-5 occupies the issue resource for at least one ;; cycle. (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "!pt_media,ptabs_media,invalidate_line_media,dmpy_media,load_media,fload_media,fcmp_media,fmove_media,fparith_media,dfparith_media,fpconv_media,dfpconv_media,dfmul_media,store_media,fstore_media,mcmp_media,mac_media,d2mpy_media,atrans_media,ustore_media")) 1 1) ;; Specify the various types of instruction which have latency > 1 (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "mcmp_media")) 2 1) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "dmpy_media,load_media,fcmp_media,mac_media")) 3 1) ;; but see sh_adjust_cost for mac_media exception. (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "fload_media,fmove_media")) 4 1) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "d2mpy_media")) 4 2) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "pt_media,ptabs_media")) 5 1) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "fparith_media,dfparith_media,fpconv_media,dfpconv_media")) 6 1) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "invalidate_line_media")) 7 7) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "dfmul_media")) 9 4) (define_function_unit "sh5issue" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "atrans_media")) 10 5) ;; Floating-point divide and square-root occupy an additional resource, ;; which is not internally pipelined. However, other instructions ;; can continue to issue. (define_function_unit "sh5fds" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "fdiv_media")) 19 19) (define_function_unit "sh5fds" 1 0 (and (eq_attr "pipe_model" "sh5media") (eq_attr "type" "dfdiv_media")) 35 35) ; Definitions for filling branch delay slots. (define_attr "needs_delay_slot" "yes,no" (const_string "no")) ;; ??? This should be (nil) instead of (const_int 0) (define_attr "hit_stack" "yes,no" (cond [(eq (symbol_ref "find_regno_note (insn, REG_INC, SP_REG)") (const_int 0)) (const_string "no")] (const_string "yes"))) (define_attr "interrupt_function" "no,yes" (const (symbol_ref "current_function_interrupt"))) (define_attr "in_delay_slot" "yes,no" (cond [(eq_attr "type" "cbranch") (const_string "no") (eq_attr "type" "pcload,pcload_si") (const_string "no") (eq_attr "needs_delay_slot" "yes") (const_string "no") (eq_attr "length" "2") (const_string "yes") ] (const_string "no"))) (define_attr "cond_delay_slot" "yes,no" (cond [(eq_attr "in_delay_slot" "yes") (const_string "yes") ] (const_string "no"))) (define_attr "is_sfunc" "" (if_then_else (eq_attr "type" "sfunc") (const_int 1) (const_int 0))) (define_attr "is_mac_media" "" (if_then_else (eq_attr "type" "mac_media") (const_int 1) (const_int 0))) (define_attr "branch_zero" "yes,no" (cond [(eq_attr "type" "!cbranch") (const_string "no") (ne (symbol_ref "(next_active_insn (insn)\ == (prev_active_insn\ (XEXP (SET_SRC (PATTERN (insn)), 1))))\ && get_attr_length (next_active_insn (insn)) == 2") (const_int 0)) (const_string "yes")] (const_string "no"))) ;; SH4 Double-precision computation with double-precision result - ;; the two halves are ready at different times. (define_attr "dfp_comp" "yes,no" (cond [(eq_attr "type" "dfp_arith,dfp_conv,dfdiv") (const_string "yes")] (const_string "no"))) ;; Insns for which the latency of a preceding fp insn is decreased by one. (define_attr "late_fp_use" "yes,no" (const_string "no")) ;; And feeding insns for which this relevant. (define_attr "any_fp_comp" "yes,no" (cond [(eq_attr "type" "fp,fdiv,ftrc_s,dfp_arith,dfp_conv,dfdiv") (const_string "yes")] (const_string "no"))) (define_attr "any_int_load" "yes,no" (cond [(eq_attr "type" "load,load_si,pcload,pcload_si") (const_string "yes")] (const_string "no"))) (define_delay (eq_attr "needs_delay_slot" "yes") [(eq_attr "in_delay_slot" "yes") (nil) (nil)]) ;; On the SH and SH2, the rte instruction reads the return pc from the stack, ;; and thus we can't put a pop instruction in its delay slot. ;; ??? On the SH3, the rte instruction does not use the stack, so a pop ;; instruction can go in the delay slot. ;; Since a normal return (rts) implicitly uses the PR register, ;; we can't allow PR register loads in an rts delay slot. (define_delay (eq_attr "type" "return") [(and (eq_attr "in_delay_slot" "yes") (ior (and (eq_attr "interrupt_function" "no") (eq_attr "type" "!pload,prset")) (and (eq_attr "interrupt_function" "yes") (ior (ne (symbol_ref "TARGET_SH3") (const_int 0)) (eq_attr "hit_stack" "no"))))) (nil) (nil)]) ;; Since a call implicitly uses the PR register, we can't allow ;; a PR register store in a jsr delay slot. (define_delay (ior (eq_attr "type" "call") (eq_attr "type" "sfunc")) [(and (eq_attr "in_delay_slot" "yes") (eq_attr "type" "!pstore,prget")) (nil) (nil)]) ;; Say that we have annulled true branches, since this gives smaller and ;; faster code when branches are predicted as not taken. (define_delay (and (eq_attr "type" "cbranch") (ne (symbol_ref "TARGET_SH2") (const_int 0))) ;; SH2e has a hardware bug that pretty much prohibits the use of ;; annuled delay slots. [(eq_attr "in_delay_slot" "yes") (and (eq_attr "cond_delay_slot" "yes") (not (eq_attr "cpu" "sh2e"))) (nil)]) ;; ------------------------------------------------------------------------- ;; SImode signed integer comparisons ;; ------------------------------------------------------------------------- (define_insn "" [(set (reg:SI T_REG) (eq:SI (and:SI (match_operand:SI 0 "arith_reg_operand" "z,r") (match_operand:SI 1 "arith_operand" "K08,r")) (const_int 0)))] "TARGET_SH1" "tst %1,%0" [(set_attr "type" "mt_group")]) ;; ??? Perhaps should only accept reg/constant if the register is reg 0. ;; That would still allow reload to create cmpi instructions, but would ;; perhaps allow forcing the constant into a register when that is better. ;; Probably should use r0 for mem/imm compares, but force constant into a ;; register for pseudo/imm compares. (define_insn "cmpeqsi_t" [(set (reg:SI T_REG) (eq:SI (match_operand:SI 0 "arith_reg_operand" "r,z,r") (match_operand:SI 1 "arith_operand" "N,rI08,r")))] "TARGET_SH1" "@ tst %0,%0 cmp/eq %1,%0 cmp/eq %1,%0" [(set_attr "type" "mt_group")]) (define_insn "cmpgtsi_t" [(set (reg:SI T_REG) (gt:SI (match_operand:SI 0 "arith_reg_operand" "r,r") (match_operand:SI 1 "arith_reg_or_0_operand" "r,N")))] "TARGET_SH1" "@ cmp/gt %1,%0 cmp/pl %0" [(set_attr "type" "mt_group")]) (define_insn "cmpgesi_t" [(set (reg:SI T_REG) (ge:SI (match_operand:SI 0 "arith_reg_operand" "r,r") (match_operand:SI 1 "arith_reg_or_0_operand" "r,N")))] "TARGET_SH1" "@ cmp/ge %1,%0 cmp/pz %0" [(set_attr "type" "mt_group")]) ;; ------------------------------------------------------------------------- ;; SImode unsigned integer comparisons ;; ------------------------------------------------------------------------- (define_insn "cmpgeusi_t" [(set (reg:SI T_REG) (geu:SI (match_operand:SI 0 "arith_reg_operand" "r") (match_operand:SI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "cmp/hs %1,%0" [(set_attr "type" "mt_group")]) (define_insn "cmpgtusi_t" [(set (reg:SI T_REG) (gtu:SI (match_operand:SI 0 "arith_reg_operand" "r") (match_operand:SI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "cmp/hi %1,%0" [(set_attr "type" "mt_group")]) ;; We save the compare operands in the cmpxx patterns and use them when ;; we generate the branch. (define_expand "cmpsi" [(set (reg:SI T_REG) (compare (match_operand:SI 0 "cmpsi_operand" "") (match_operand:SI 1 "arith_operand" "")))] "TARGET_SH1" " { if (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == T_REG && GET_CODE (operands[1]) != CONST_INT) operands[0] = copy_to_mode_reg (SImode, operands[0]); sh_compare_op0 = operands[0]; sh_compare_op1 = operands[1]; DONE; }") ;; ------------------------------------------------------------------------- ;; DImode signed integer comparisons ;; ------------------------------------------------------------------------- ;; ??? Could get better scheduling by splitting the initial test from the ;; rest of the insn after reload. However, the gain would hardly justify ;; the sh.md size increase necessary to do that. (define_insn "" [(set (reg:SI T_REG) (eq:SI (and:DI (match_operand:DI 0 "arith_reg_operand" "r") (match_operand:DI 1 "arith_operand" "r")) (const_int 0)))] "TARGET_SH1" "* return output_branchy_insn (EQ, \"tst\\t%S1,%S0\;bf\\t%l9\;tst\\t%R1,%R0\", insn, operands);" [(set_attr "length" "6") (set_attr "type" "arith3b")]) (define_insn "cmpeqdi_t" [(set (reg:SI T_REG) (eq:SI (match_operand:DI 0 "arith_reg_operand" "r,r") (match_operand:DI 1 "arith_reg_or_0_operand" "N,r")))] "TARGET_SH1" "@ tst %S0,%S0\;bf %,Ldi%=\;tst %R0,%R0\\n%,Ldi%=: cmp/eq %S1,%S0\;bf %,Ldi%=\;cmp/eq %R1,%R0\\n%,Ldi%=:" [(set_attr "length" "6") (set_attr "type" "arith3b")]) (define_split [(set (reg:SI T_REG) (eq:SI (match_operand:DI 0 "arith_reg_operand" "") (match_operand:DI 1 "arith_reg_or_0_operand" "")))] ;; If we applied this split when not optimizing, it would only be ;; applied during the machine-dependent reorg, when no new basic blocks ;; may be created. "TARGET_SH1 && reload_completed && optimize" [(set (reg:SI T_REG) (eq:SI (match_dup 2) (match_dup 3))) (set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_dup 6)) (pc))) (set (reg:SI T_REG) (eq:SI (match_dup 4) (match_dup 5))) (match_dup 6)] " { operands[2] = gen_rtx_REG (SImode, true_regnum (operands[0]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); operands[3] = (operands[1] == const0_rtx ? const0_rtx : gen_rtx_REG (SImode, true_regnum (operands[1]) + (TARGET_LITTLE_ENDIAN ? 1 : 0))); operands[4] = gen_lowpart (SImode, operands[0]); operands[5] = gen_lowpart (SImode, operands[1]); operands[6] = gen_label_rtx (); }") (define_insn "cmpgtdi_t" [(set (reg:SI T_REG) (gt:SI (match_operand:DI 0 "arith_reg_operand" "r,r") (match_operand:DI 1 "arith_reg_or_0_operand" "r,N")))] "TARGET_SH2" "@ cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/gt\\t%S1,%S0\;cmp/hi\\t%R1,%R0\\n%,Ldi%=: tst\\t%S0,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/pl\\t%S0\;cmp/hi\\t%S0,%R0\\n%,Ldi%=:" [(set_attr "length" "8") (set_attr "type" "arith3")]) (define_insn "cmpgedi_t" [(set (reg:SI T_REG) (ge:SI (match_operand:DI 0 "arith_reg_operand" "r,r") (match_operand:DI 1 "arith_reg_or_0_operand" "r,N")))] "TARGET_SH2" "@ cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/ge\\t%S1,%S0\;cmp/hs\\t%R1,%R0\\n%,Ldi%=: cmp/pz\\t%S0" [(set_attr "length" "8,2") (set_attr "type" "arith3,mt_group")]) ;; ------------------------------------------------------------------------- ;; DImode unsigned integer comparisons ;; ------------------------------------------------------------------------- (define_insn "cmpgeudi_t" [(set (reg:SI T_REG) (geu:SI (match_operand:DI 0 "arith_reg_operand" "r") (match_operand:DI 1 "arith_reg_operand" "r")))] "TARGET_SH2" "cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/hs\\t%S1,%S0\;cmp/hs\\t%R1,%R0\\n%,Ldi%=:" [(set_attr "length" "8") (set_attr "type" "arith3")]) (define_insn "cmpgtudi_t" [(set (reg:SI T_REG) (gtu:SI (match_operand:DI 0 "arith_reg_operand" "r") (match_operand:DI 1 "arith_reg_operand" "r")))] "TARGET_SH2" "cmp/eq\\t%S1,%S0\;bf{.|/}s\\t%,Ldi%=\;cmp/hi\\t%S1,%S0\;cmp/hi\\t%R1,%R0\\n%,Ldi%=:" [(set_attr "length" "8") (set_attr "type" "arith3")]) (define_insn "cmpeqdi_media" [(set (match_operand:DI 0 "register_operand" "=r") (eq:DI (match_operand:DI 1 "register_operand" "%r") (match_operand:DI 2 "arith_reg_or_0_operand" "Nr")))] "TARGET_SHMEDIA" "cmpeq %1, %N2, %0" [(set_attr "type" "cmp_media")]) (define_insn "cmpgtdi_media" [(set (match_operand:DI 0 "register_operand" "=r") (gt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "Nr") (match_operand:DI 2 "arith_reg_or_0_operand" "rN")))] "TARGET_SHMEDIA" "cmpgt %N1, %N2, %0" [(set_attr "type" "cmp_media")]) (define_insn "cmpgtudi_media" [(set (match_operand:DI 0 "register_operand" "=r") (gtu:DI (match_operand:DI 1 "arith_reg_or_0_operand" "Nr") (match_operand:DI 2 "arith_reg_or_0_operand" "rN")))] "TARGET_SHMEDIA" "cmpgtu %N1, %N2, %0" [(set_attr "type" "cmp_media")]) ;; We save the compare operands in the cmpxx patterns and use them when ;; we generate the branch. (define_expand "cmpdi" [(set (reg:SI T_REG) (compare (match_operand:DI 0 "arith_operand" "") (match_operand:DI 1 "arith_operand" "")))] "TARGET_SH2 || TARGET_SHMEDIA" " { sh_compare_op0 = operands[0]; sh_compare_op1 = operands[1]; DONE; }") ;; ------------------------------------------------------------------------- ;; Conditional move instructions ;; ------------------------------------------------------------------------- ;; The insn names may seem reversed, but note that cmveq performs the move ;; if op1 == 0, and cmvne does it if op1 != 0. (define_insn "movdicc_false" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (if_then_else:DI (eq (match_operand:DI 1 "arith_reg_operand" "r") (const_int 0)) (match_operand:DI 2 "arith_reg_or_0_operand" "rN") (match_operand:DI 3 "arith_reg_operand" "0")))] "TARGET_SHMEDIA" "cmveq %1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn "movdicc_true" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (if_then_else:DI (ne (match_operand:DI 1 "arith_reg_operand" "r") (const_int 0)) (match_operand:DI 2 "arith_reg_or_0_operand" "rN") (match_operand:DI 3 "arith_reg_operand" "0")))] "TARGET_SHMEDIA" "cmvne %1, %N2, %0" [(set_attr "type" "arith_media")]) (define_expand "movdicc" [(set (match_operand:DI 0 "register_operand" "") (if_then_else:DI (match_operand 1 "comparison_operator" "") (match_operand:DI 2 "register_operand" "") (match_operand:DI 3 "register_operand" "")))] "TARGET_SHMEDIA" " { if ((GET_CODE (operands[1]) == EQ || GET_CODE (operands[1]) == NE) && GET_MODE (sh_compare_op0) == DImode && sh_compare_op1 == const0_rtx) operands[1] = gen_rtx (GET_CODE (operands[1]), VOIDmode, sh_compare_op0, sh_compare_op1); else { rtx tmp; if (no_new_pseudos) FAIL; tmp = gen_reg_rtx (DImode); switch (GET_CODE (operands[1])) { case EQ: emit_insn (gen_seq (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case NE: emit_insn (gen_seq (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case GT: emit_insn (gen_sgt (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case LT: emit_insn (gen_slt (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case GE: emit_insn (gen_slt (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case LE: emit_insn (gen_sgt (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case GTU: emit_insn (gen_sgtu (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case LTU: emit_insn (gen_sltu (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case GEU: emit_insn (gen_sltu (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case LEU: emit_insn (gen_sgtu (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case UNORDERED: emit_insn (gen_sunordered (tmp)); operands[1] = gen_rtx (NE, VOIDmode, tmp, const0_rtx); break; case ORDERED: emit_insn (gen_sunordered (tmp)); operands[1] = gen_rtx (EQ, VOIDmode, tmp, const0_rtx); break; case UNEQ: case UNGE: case UNGT: case UNLE: case UNLT: case LTGT: FAIL; default: abort (); } } }") ;; ------------------------------------------------------------------------- ;; Addition instructions ;; ------------------------------------------------------------------------- (define_expand "adddi3" [(set (match_operand:DI 0 "arith_reg_operand" "") (plus:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "arith_operand" "")))] "" " { if (TARGET_SH1) { if (no_new_pseudos && ! arith_reg_operand (operands[2], DImode)) FAIL; operands[2] = force_reg (DImode, operands[2]); emit_insn (gen_adddi3_compact (operands[0], operands[1], operands[2])); DONE; } }") (define_insn "*adddi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (plus:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") (match_operand:DI 2 "arith_operand" "r,I10")))] "TARGET_SHMEDIA" "@ add %1, %2, %0 addi %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "adddi3z_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (zero_extend:DI (plus:SI (match_operand:SI 1 "extend_reg_operand" "r") (match_operand:SI 2 "extend_reg_or_0_operand" "rN"))))] "TARGET_SHMEDIA" "addz.l %1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn "adddi3_compact" [(set (match_operand:DI 0 "arith_reg_operand" "=&r") (plus:DI (match_operand:DI 1 "arith_reg_operand" "%0") (match_operand:DI 2 "arith_reg_operand" "r"))) (clobber (reg:SI T_REG))] "TARGET_SH1" "#" [(set_attr "length" "6")]) (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (plus:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "arith_reg_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed" [(const_int 0)] " { rtx high0, high2, low0 = gen_lowpart (SImode, operands[0]); high0 = gen_rtx_REG (SImode, true_regnum (operands[0]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); high2 = gen_rtx_REG (SImode, true_regnum (operands[2]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); emit_insn (gen_clrt ()); emit_insn (gen_addc (low0, low0, gen_lowpart (SImode, operands[2]))); emit_insn (gen_addc1 (high0, high0, high2)); DONE; }") (define_insn "addc" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (plus:SI (plus:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "arith_reg_operand" "r")) (reg:SI T_REG))) (set (reg:SI T_REG) (ltu:SI (plus:SI (match_dup 1) (match_dup 2)) (match_dup 1)))] "TARGET_SH1" "addc %2,%0" [(set_attr "type" "arith")]) (define_insn "addc1" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (plus:SI (plus:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "arith_reg_operand" "r")) (reg:SI T_REG))) (clobber (reg:SI T_REG))] "TARGET_SH1" "addc %2,%0" [(set_attr "type" "arith")]) (define_expand "addsi3" [(set (match_operand:SI 0 "arith_reg_operand" "") (plus:SI (match_operand:SI 1 "arith_operand" "") (match_operand:SI 2 "arith_operand" "")))] "" " { if (TARGET_SHMEDIA) operands[1] = force_reg (SImode, operands[1]); }") (define_insn "addsi3_media" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (plus:SI (match_operand:SI 1 "extend_reg_operand" "%r,r") (match_operand:SI 2 "arith_operand" "r,I10")))] "TARGET_SHMEDIA" "@ add.l %1, %2, %0 addi.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "*addsi3_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (plus:SI (match_operand:SI 1 "arith_operand" "%0") (match_operand:SI 2 "arith_operand" "rI08")))] "TARGET_SH1" "add %2,%0" [(set_attr "type" "arith")]) ;; ------------------------------------------------------------------------- ;; Subtraction instructions ;; ------------------------------------------------------------------------- (define_expand "subdi3" [(set (match_operand:DI 0 "arith_reg_operand" "") (minus:DI (match_operand:DI 1 "arith_reg_or_0_operand" "") (match_operand:DI 2 "arith_reg_operand" "")))] "" " { if (TARGET_SH1) { operands[1] = force_reg (DImode, operands[1]); emit_insn (gen_subdi3_compact (operands[0], operands[1], operands[2])); DONE; } }") (define_insn "*subdi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (minus:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rN") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "sub %N1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "subdi3_compact" [(set (match_operand:DI 0 "arith_reg_operand" "=&r") (minus:DI (match_operand:DI 1 "arith_reg_operand" "0") (match_operand:DI 2 "arith_reg_operand" "r"))) (clobber (reg:SI T_REG))] "TARGET_SH1" "#" [(set_attr "length" "6")]) (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (minus:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "arith_reg_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed" [(const_int 0)] " { rtx high0, high2, low0 = gen_lowpart (SImode, operands[0]); high0 = gen_rtx_REG (SImode, true_regnum (operands[0]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); high2 = gen_rtx_REG (SImode, true_regnum (operands[2]) + (TARGET_LITTLE_ENDIAN ? 1 : 0)); emit_insn (gen_clrt ()); emit_insn (gen_subc (low0, low0, gen_lowpart (SImode, operands[2]))); emit_insn (gen_subc1 (high0, high0, high2)); DONE; }") (define_insn "subc" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (minus:SI (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "arith_reg_operand" "r")) (reg:SI T_REG))) (set (reg:SI T_REG) (gtu:SI (minus:SI (minus:SI (match_dup 1) (match_dup 2)) (reg:SI T_REG)) (match_dup 1)))] "TARGET_SH1" "subc %2,%0" [(set_attr "type" "arith")]) (define_insn "subc1" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (minus:SI (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "arith_reg_operand" "r")) (reg:SI T_REG))) (clobber (reg:SI T_REG))] "TARGET_SH1" "subc %2,%0" [(set_attr "type" "arith")]) (define_insn "*subsi3_internal" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (minus:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "arith_reg_operand" "r")))] "TARGET_SH1" "sub %2,%0" [(set_attr "type" "arith")]) (define_insn "*subsi3_media" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (minus:SI (match_operand:SI 1 "extend_reg_or_0_operand" "rN") (match_operand:SI 2 "extend_reg_operand" "r")))] "TARGET_SHMEDIA" "sub.l %N1, %2, %0" [(set_attr "type" "arith_media")]) ;; Convert `constant - reg' to `neg rX; add rX, #const' since this ;; will sometimes save one instruction. Otherwise we might get ;; `mov #const, rY; sub rY,rX; mov rX, rY' if the source and dest regs ;; are the same. (define_expand "subsi3" [(set (match_operand:SI 0 "arith_reg_operand" "") (minus:SI (match_operand:SI 1 "arith_operand" "") (match_operand:SI 2 "arith_reg_operand" "")))] "" " { if (TARGET_SH1 && GET_CODE (operands[1]) == CONST_INT) { emit_insn (gen_negsi2 (operands[0], operands[2])); emit_insn (gen_addsi3 (operands[0], operands[0], operands[1])); DONE; } if (TARGET_SHMEDIA) { if (no_new_pseudos && ! arith_reg_or_0_operand (operands[1], SImode)) FAIL; if (operands[1] != const0_rtx) operands[1] = force_reg (SImode, operands[1]); } }") ;; ------------------------------------------------------------------------- ;; Division instructions ;; ------------------------------------------------------------------------- ;; We take advantage of the library routines which don't clobber as many ;; registers as a normal function call would. ;; The INSN_REFERENCES_ARE_DELAYED in sh.h is problematic because it ;; also has an effect on the register that holds the address of the sfunc. ;; To make this work, we have an extra dummy insn that shows the use ;; of this register for reorg. (define_insn "use_sfunc_addr" [(set (reg:SI PR_REG) (unspec:SI [(match_operand:SI 0 "register_operand" "r")] UNSPEC_SFUNC))] "TARGET_SH1 && check_use_sfunc_addr (insn, operands[0])" "" [(set_attr "length" "0")]) ;; We must use a pseudo-reg forced to reg 0 in the SET_DEST rather than ;; hard register 0. If we used hard register 0, then the next instruction ;; would be a move from hard register 0 to a pseudo-reg. If the pseudo-reg ;; gets allocated to a stack slot that needs its address reloaded, then ;; there is nothing to prevent reload from using r0 to reload the address. ;; This reload would clobber the value in r0 we are trying to store. ;; If we let reload allocate r0, then this problem can never happen. (define_insn "udivsi3_i1" [(set (match_operand:SI 0 "register_operand" "=z") (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R4_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "TARGET_SH1 && ! TARGET_SH4" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) ; Since shmedia-nofpu code could be linked against shcompact code, and ; the udivsi3 libcall has the same name, we must consider all registers ; clobbered that are in the union of the registers clobbered by the ; shmedia and the shcompact implementation. Note, if the shcompact ; implementation actually used shcompact code, we'd need to clobber ; also r23 and fr23. (define_insn "udivsi3_i1_media" [(set (match_operand:SI 0 "register_operand" "=z") (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_MEDIA_REG)) (clobber (reg:SI PR_MEDIA_REG)) (clobber (reg:SI R20_REG)) (clobber (reg:SI R21_REG)) (clobber (reg:SI R22_REG)) (clobber (reg:DI TR0_REG)) (clobber (reg:DI TR1_REG)) (clobber (reg:DI TR2_REG)) (use (match_operand:DI 1 "target_operand" "b"))] "TARGET_SHMEDIA && ! TARGET_SHMEDIA_FPU" "blink %1, r18" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_expand "udivsi3_i4_media" [(set (match_dup 3) (zero_extend:DI (match_operand:SI 1 "register_operand" ""))) (set (match_dup 4) (zero_extend:DI (match_operand:SI 2 "register_operand" ""))) (set (match_dup 5) (float:DF (match_dup 3))) (set (match_dup 6) (float:DF (match_dup 4))) (set (match_dup 7) (div:DF (match_dup 5) (match_dup 6))) (set (match_dup 8) (fix:DI (match_dup 7))) (set (match_operand:SI 0 "register_operand" "") (truncate:SI (match_dup 8)))] "TARGET_SHMEDIA_FPU" " { operands[3] = gen_reg_rtx (DImode); operands[4] = gen_reg_rtx (DImode); operands[5] = gen_reg_rtx (DFmode); operands[6] = gen_reg_rtx (DFmode); operands[7] = gen_reg_rtx (DFmode); operands[8] = gen_reg_rtx (DImode); }") (define_insn "udivsi3_i4" [(set (match_operand:SI 0 "register_operand" "=y") (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:DF DR0_REG)) (clobber (reg:DF DR2_REG)) (clobber (reg:DF DR4_REG)) (clobber (reg:SI R0_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R4_REG)) (clobber (reg:SI R5_REG)) (use (reg:PSI FPSCR_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "TARGET_SH4 && ! TARGET_FPU_SINGLE" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "fp_mode" "double") (set_attr "needs_delay_slot" "yes")]) (define_insn "udivsi3_i4_single" [(set (match_operand:SI 0 "register_operand" "=y") (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:DF DR0_REG)) (clobber (reg:DF DR2_REG)) (clobber (reg:DF DR4_REG)) (clobber (reg:SI R0_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R4_REG)) (clobber (reg:SI R5_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "(TARGET_HARD_SH4 || TARGET_SHCOMPACT) && TARGET_FPU_SINGLE" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_expand "udivsi3" [(set (match_dup 3) (symbol_ref:SI "__udivsi3")) (set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) (parallel [(set (match_operand:SI 0 "register_operand" "") (udiv:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R4_REG)) (use (match_dup 3))])] "" " { rtx first, last; operands[3] = gen_reg_rtx (Pmode); /* Emit the move of the address to a pseudo outside of the libcall. */ if (TARGET_HARD_SH4 && TARGET_SH2E) { emit_move_insn (operands[3], function_symbol (\"__udivsi3_i4\")); if (TARGET_FPU_SINGLE) last = gen_udivsi3_i4_single (operands[0], operands[3]); else last = gen_udivsi3_i4 (operands[0], operands[3]); } else if (TARGET_SHMEDIA_FPU) { operands[1] = force_reg (SImode, operands[1]); operands[2] = force_reg (SImode, operands[2]); emit_insn (gen_udivsi3_i4_media (operands[0], operands[1], operands[2])); DONE; } else if (TARGET_SH5) { emit_move_insn (operands[3], function_symbol (TARGET_FPU_ANY ? \"__udivsi3_i4\" : \"__udivsi3\")); if (TARGET_SHMEDIA) last = gen_udivsi3_i1_media (operands[0], Pmode == DImode ? operands[3] : gen_rtx_SUBREG (DImode, operands[3], 0)); else if (TARGET_FPU_ANY) last = gen_udivsi3_i4_single (operands[0], operands[3]); else last = gen_udivsi3_i1 (operands[0], operands[3]); } else { emit_move_insn (operands[3], function_symbol (\"__udivsi3\")); last = gen_udivsi3_i1 (operands[0], operands[3]); } first = emit_move_insn (gen_rtx_REG (SImode, 4), operands[1]); emit_move_insn (gen_rtx_REG (SImode, 5), operands[2]); last = emit_insn (last); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); DONE; }") (define_insn "divsi3_i1" [(set (match_operand:SI 0 "register_operand" "=z") (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R3_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "TARGET_SH1 && ! TARGET_SH4" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) ; Since shmedia-nofpu code could be linked against shcompact code, and ; the sdivsi3 libcall has the same name, we must consider all registers ; clobbered that are in the union of the registers clobbered by the ; shmedia and the shcompact implementation. Note, if the shcompact ; implementation actually used shcompact code, we'd need to clobber ; also r22, r23 and fr23. (define_insn "divsi3_i1_media" [(set (match_operand:SI 0 "register_operand" "=z") (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_MEDIA_REG)) (clobber (reg:SI PR_MEDIA_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R3_REG)) (clobber (reg:SI R20_REG)) (clobber (reg:SI R21_REG)) (clobber (reg:DI TR0_REG)) (clobber (reg:DI TR1_REG)) (clobber (reg:DI TR2_REG)) (use (match_operand:DI 1 "target_operand" "b"))] "TARGET_SHMEDIA && ! TARGET_SHMEDIA_FPU" "blink %1, r18" [(set_attr "type" "sfunc")]) (define_expand "divsi3_i4_media" [(set (match_dup 3) (float:DF (match_operand:SI 1 "register_operand" "r"))) (set (match_dup 4) (float:DF (match_operand:SI 2 "register_operand" "r"))) (set (match_dup 5) (div:DF (match_dup 3) (match_dup 4))) (set (match_operand:SI 0 "register_operand" "=r") (fix:SI (match_dup 5)))] "TARGET_SHMEDIA_FPU" " { operands[3] = gen_reg_rtx (DFmode); operands[4] = gen_reg_rtx (DFmode); operands[5] = gen_reg_rtx (DFmode); }") (define_insn "divsi3_i4" [(set (match_operand:SI 0 "register_operand" "=y") (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI PR_REG)) (clobber (reg:DF DR0_REG)) (clobber (reg:DF DR2_REG)) (use (reg:PSI FPSCR_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "TARGET_SH4 && ! TARGET_FPU_SINGLE" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "fp_mode" "double") (set_attr "needs_delay_slot" "yes")]) (define_insn "divsi3_i4_single" [(set (match_operand:SI 0 "register_operand" "=y") (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI PR_REG)) (clobber (reg:DF DR0_REG)) (clobber (reg:DF DR2_REG)) (clobber (reg:SI R2_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "(TARGET_HARD_SH4 || TARGET_SHCOMPACT) && TARGET_FPU_SINGLE" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_expand "divsi3" [(set (match_dup 3) (symbol_ref:SI "__sdivsi3")) (set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) (parallel [(set (match_operand:SI 0 "register_operand" "") (div:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R3_REG)) (use (match_dup 3))])] "" " { rtx first, last; operands[3] = gen_reg_rtx (Pmode); /* Emit the move of the address to a pseudo outside of the libcall. */ if (TARGET_HARD_SH4 && TARGET_SH2E) { emit_move_insn (operands[3], function_symbol (\"__sdivsi3_i4\")); if (TARGET_FPU_SINGLE) last = gen_divsi3_i4_single (operands[0], operands[3]); else last = gen_divsi3_i4 (operands[0], operands[3]); } else if (TARGET_SHMEDIA_FPU) { operands[1] = force_reg (SImode, operands[1]); operands[2] = force_reg (SImode, operands[2]); emit_insn (gen_divsi3_i4_media (operands[0], operands[1], operands[2])); DONE; } else if (TARGET_SH5) { emit_move_insn (operands[3], function_symbol (TARGET_FPU_ANY ? \"__sdivsi3_i4\" : \"__sdivsi3\")); if (TARGET_SHMEDIA) last = gen_divsi3_i1_media (operands[0], Pmode == DImode ? operands[3] : gen_rtx_SUBREG (DImode, operands[3], 0)); else if (TARGET_FPU_ANY) last = gen_divsi3_i4_single (operands[0], operands[3]); else last = gen_divsi3_i1 (operands[0], operands[3]); } else { emit_move_insn (operands[3], function_symbol (\"__sdivsi3\")); last = gen_divsi3_i1 (operands[0], operands[3]); } first = emit_move_insn (gen_rtx_REG (SImode, 4), operands[1]); emit_move_insn (gen_rtx_REG (SImode, 5), operands[2]); last = emit_insn (last); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); DONE; }") ;; ------------------------------------------------------------------------- ;; Multiplication instructions ;; ------------------------------------------------------------------------- (define_insn "umulhisi3_i" [(set (reg:SI MACL_REG) (mult:SI (zero_extend:SI (match_operand:HI 0 "arith_reg_operand" "r")) (zero_extend:SI (match_operand:HI 1 "arith_reg_operand" "r"))))] "TARGET_SH1" "mulu.w %1,%0" [(set_attr "type" "smpy")]) (define_insn "mulhisi3_i" [(set (reg:SI MACL_REG) (mult:SI (sign_extend:SI (match_operand:HI 0 "arith_reg_operand" "r")) (sign_extend:SI (match_operand:HI 1 "arith_reg_operand" "r"))))] "TARGET_SH1" "muls.w %1,%0" [(set_attr "type" "smpy")]) (define_expand "mulhisi3" [(set (reg:SI MACL_REG) (mult:SI (sign_extend:SI (match_operand:HI 1 "arith_reg_operand" "")) (sign_extend:SI (match_operand:HI 2 "arith_reg_operand" "")))) (set (match_operand:SI 0 "arith_reg_operand" "") (reg:SI MACL_REG))] "TARGET_SH1" " { rtx first, last; first = emit_insn (gen_mulhisi3_i (operands[1], operands[2])); last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACL_REG)); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); /* expand_binop can't find a suitable code in umul_widen_optab to make a REG_EQUAL note from, so make one here. See also smulsi3_highpart. ??? Alternatively, we could put this at the calling site of expand_binop, i.e. expand_expr. */ REG_NOTES (last) = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), REG_NOTES (last)); DONE; }") (define_expand "umulhisi3" [(set (reg:SI MACL_REG) (mult:SI (zero_extend:SI (match_operand:HI 1 "arith_reg_operand" "")) (zero_extend:SI (match_operand:HI 2 "arith_reg_operand" "")))) (set (match_operand:SI 0 "arith_reg_operand" "") (reg:SI MACL_REG))] "TARGET_SH1" " { rtx first, last; first = emit_insn (gen_umulhisi3_i (operands[1], operands[2])); last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACL_REG)); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); /* expand_binop can't find a suitable code in umul_widen_optab to make a REG_EQUAL note from, so make one here. See also smulsi3_highpart. ??? Alternatively, we could put this at the calling site of expand_binop, i.e. expand_expr. */ REG_NOTES (last) = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), REG_NOTES (last)); DONE; }") ;; mulsi3 on the SH2 can be done in one instruction, on the SH1 we generate ;; a call to a routine which clobbers known registers. (define_insn "" [(set (match_operand:SI 1 "register_operand" "=z") (mult:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI MACL_REG)) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R3_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R1_REG)) (use (match_operand:SI 0 "arith_reg_operand" "r"))] "TARGET_SH1" "jsr @%0%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_expand "mulsi3_call" [(set (reg:SI R4_REG) (match_operand:SI 1 "general_operand" "")) (set (reg:SI R5_REG) (match_operand:SI 2 "general_operand" "")) (parallel[(set (match_operand:SI 0 "register_operand" "") (mult:SI (reg:SI R4_REG) (reg:SI R5_REG))) (clobber (reg:SI MACL_REG)) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI R3_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R1_REG)) (use (match_operand:SI 3 "register_operand" ""))])] "TARGET_SH1" "") (define_insn "mul_l" [(set (reg:SI MACL_REG) (mult:SI (match_operand:SI 0 "arith_reg_operand" "r") (match_operand:SI 1 "arith_reg_operand" "r")))] "TARGET_SH2" "mul.l %1,%0" [(set_attr "type" "dmpy")]) (define_expand "mulsi3" [(set (reg:SI MACL_REG) (mult:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "arith_reg_operand" ""))) (set (match_operand:SI 0 "arith_reg_operand" "") (reg:SI MACL_REG))] "TARGET_SH1" " { rtx first, last; if (!TARGET_SH2) { /* The address must be set outside the libcall, since it goes into a pseudo. */ rtx sym = function_symbol (\"__mulsi3\"); rtx addr = force_reg (SImode, sym); rtx insns = gen_mulsi3_call (operands[0], operands[1], operands[2], addr); first = insns; last = emit_insn (insns); } else { rtx macl = gen_rtx_REG (SImode, MACL_REG); first = emit_insn (gen_mul_l (operands[1], operands[2])); /* consec_sets_giv can only recognize the first insn that sets a giv as the giv insn. So we must tag this also with a REG_EQUAL note. */ last = emit_insn (gen_movsi_i ((operands[0]), macl)); } /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); DONE; }") (define_insn "mulsidi3_i" [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (sign_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) (const_int 32)))) (set (reg:SI MACL_REG) (mult:SI (match_dup 0) (match_dup 1)))] "TARGET_SH2" "dmuls.l %1,%0" [(set_attr "type" "dmpy")]) (define_expand "mulsidi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "r"))))] "TARGET_SH2 || TARGET_SHMEDIA" " { if (TARGET_SH2) { emit_insn (gen_mulsidi3_compact (operands[0], operands[1], operands[2])); DONE; } }") (define_insn "mulsidi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (sign_extend:DI (match_operand:SI 1 "extend_reg_operand" "%r")) (sign_extend:DI (match_operand:SI 2 "extend_reg_operand" "r"))))] "TARGET_SHMEDIA" "muls.l %1, %2, %0" [(set_attr "type" "dmpy_media")]) (define_insn "mulsidi3_compact" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "r")))) (clobber (reg:SI MACH_REG)) (clobber (reg:SI MACL_REG))] "TARGET_SH2" "#") (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (mult:DI (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" "")))) (clobber (reg:SI MACH_REG)) (clobber (reg:SI MACL_REG))] "TARGET_SH2" [(const_int 0)] " { rtx low_dst = gen_lowpart (SImode, operands[0]); rtx high_dst = gen_highpart (SImode, operands[0]); emit_insn (gen_mulsidi3_i (operands[1], operands[2])); emit_move_insn (low_dst, gen_rtx_REG (SImode, MACL_REG)); emit_move_insn (high_dst, gen_rtx_REG (SImode, MACH_REG)); /* We need something to tag the possible REG_EQUAL notes on to. */ emit_move_insn (operands[0], operands[0]); DONE; }") (define_insn "umulsidi3_i" [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (zero_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) (const_int 32)))) (set (reg:SI MACL_REG) (mult:SI (match_dup 0) (match_dup 1)))] "TARGET_SH2" "dmulu.l %1,%0" [(set_attr "type" "dmpy")]) (define_expand "umulsidi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "r"))))] "TARGET_SH2 || TARGET_SHMEDIA" " { if (TARGET_SH2) { emit_insn (gen_umulsidi3_compact (operands[0], operands[1], operands[2])); DONE; } }") (define_insn "umulsidi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (zero_extend:DI (match_operand:SI 1 "extend_reg_operand" "%r")) (zero_extend:DI (match_operand:SI 2 "extend_reg_operand" "r"))))] "TARGET_SHMEDIA" "mulu.l %1, %2, %0" [(set_attr "type" "dmpy_media")]) (define_insn "umulsidi3_compact" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r")) (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "r")))) (clobber (reg:SI MACH_REG)) (clobber (reg:SI MACL_REG))] "TARGET_SH2" "#") (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" "")))) (clobber (reg:SI MACH_REG)) (clobber (reg:SI MACL_REG))] "TARGET_SH2" [(const_int 0)] " { rtx low_dst = gen_lowpart (SImode, operands[0]); rtx high_dst = gen_highpart (SImode, operands[0]); emit_insn (gen_umulsidi3_i (operands[1], operands[2])); emit_move_insn (low_dst, gen_rtx_REG (SImode, MACL_REG)); emit_move_insn (high_dst, gen_rtx_REG (SImode, MACH_REG)); /* We need something to tag the possible REG_EQUAL notes on to. */ emit_move_insn (operands[0], operands[0]); DONE; }") (define_insn "smulsi3_highpart_i" [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (sign_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) (const_int 32)))) (clobber (reg:SI MACL_REG))] "TARGET_SH2" "dmuls.l %1,%0" [(set_attr "type" "dmpy")]) (define_expand "smulsi3_highpart" [(parallel [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (sign_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) (sign_extend:DI (match_operand:SI 2 "arith_reg_operand" ""))) (const_int 32)))) (clobber (reg:SI MACL_REG))]) (set (match_operand:SI 0 "arith_reg_operand" "") (reg:SI MACH_REG))] "TARGET_SH2" " { rtx first, last; first = emit_insn (gen_smulsi3_highpart_i (operands[1], operands[2])); last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACH_REG)); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); /* expand_binop can't find a suitable code in mul_highpart_optab to make a REG_EQUAL note from, so make one here. See also {,u}mulhisi. ??? Alternatively, we could put this at the calling site of expand_binop, i.e. expand_mult_highpart. */ REG_NOTES (last) = gen_rtx_EXPR_LIST (REG_EQUAL, copy_rtx (SET_SRC (single_set (first))), REG_NOTES (last)); DONE; }") (define_insn "umulsi3_highpart_i" [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (zero_extend:DI (match_operand:SI 0 "arith_reg_operand" "r")) (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "r"))) (const_int 32)))) (clobber (reg:SI MACL_REG))] "TARGET_SH2" "dmulu.l %1,%0" [(set_attr "type" "dmpy")]) (define_expand "umulsi3_highpart" [(parallel [(set (reg:SI MACH_REG) (truncate:SI (lshiftrt:DI (mult:DI (zero_extend:DI (match_operand:SI 1 "arith_reg_operand" "")) (zero_extend:DI (match_operand:SI 2 "arith_reg_operand" ""))) (const_int 32)))) (clobber (reg:SI MACL_REG))]) (set (match_operand:SI 0 "arith_reg_operand" "") (reg:SI MACH_REG))] "TARGET_SH2" " { rtx first, last; first = emit_insn (gen_umulsi3_highpart_i (operands[1], operands[2])); last = emit_move_insn (operands[0], gen_rtx_REG (SImode, MACH_REG)); /* Wrap the sequence in REG_LIBCALL / REG_RETVAL notes so that loop invariant code motion can move it. */ REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last, REG_NOTES (first)); REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last)); DONE; }") ;; ------------------------------------------------------------------------- ;; Logical operations ;; ------------------------------------------------------------------------- (define_insn "*andsi3_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r,z") (and:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") (match_operand:SI 2 "logical_operand" "r,K08")))] "TARGET_SH1" "and %2,%0" [(set_attr "type" "arith")]) ;; If the constant is 255, then emit an extu.b instruction instead of an ;; and, since that will give better code. (define_expand "andsi3" [(set (match_operand:SI 0 "arith_reg_operand" "") (and:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "logical_operand" "")))] "TARGET_SH1" " { if (GET_CODE (operands[2]) == CONST_INT && INTVAL (operands[2]) == 255) { emit_insn (gen_zero_extendqisi2 (operands[0], gen_lowpart (QImode, operands[1]))); DONE; } }") (define_insn_and_split "anddi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r,r") (and:DI (match_operand:DI 1 "arith_reg_operand" "%r,r,r") (match_operand:DI 2 "and_operand" "r,I10,J16")))] "TARGET_SHMEDIA" "@ and %1, %2, %0 andi %1, %2, %0 #" "reload_completed && ! logical_operand (operands[2], DImode)" [(const_int 0)] " { if (INTVAL (operands[2]) == (unsigned) 0xffffffff) emit_insn (gen_mshflo_l_di (operands[0], operands[1], CONST0_RTX (DImode))); else emit_insn (gen_mshfhi_l_di (operands[0], CONST0_RTX (DImode), operands[1])); DONE; }" [(set_attr "type" "arith_media")]) (define_insn "andcdi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (and:DI (match_operand:DI 1 "arith_reg_operand" "r") (not:DI (match_operand:DI 2 "arith_reg_operand" "r"))))] "TARGET_SHMEDIA" "andc %1,%2,%0" [(set_attr "type" "arith_media")]) (define_insn "iorsi3" [(set (match_operand:SI 0 "arith_reg_operand" "=r,z") (ior:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") (match_operand:SI 2 "logical_operand" "r,K08")))] "TARGET_SH1" "or %2,%0" [(set_attr "type" "arith")]) (define_insn "iordi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (ior:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") (match_operand:DI 2 "logical_operand" "r,I10")))] "TARGET_SHMEDIA" "@ or %1, %2, %0 ori %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "xorsi3" [(set (match_operand:SI 0 "arith_reg_operand" "=z,r") (xor:SI (match_operand:SI 1 "arith_reg_operand" "%0,0") (match_operand:SI 2 "logical_operand" "K08,r")))] "TARGET_SH1" "xor %2,%0" [(set_attr "type" "arith")]) (define_insn "xordi3" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (xor:DI (match_operand:DI 1 "arith_reg_operand" "%r,r") (match_operand:DI 2 "shmedia_6bit_operand" "r,I06")))] "TARGET_SHMEDIA" "@ xor %1, %2, %0 xori %1, %2, %0" [(set_attr "type" "arith_media")]) ;; Combiner bridge pattern for 2 * sign extend -> logical op -> truncate. ;; converts 2 * sign extend -> logical op into logical op -> sign extend (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (sign_extend:DI (match_operator 4 "binary_logical_operator" [(match_operand 1 "any_register_operand" "") (match_operand 2 "any_register_operand" "")])))] "TARGET_SHMEDIA" [(set (match_dup 5) (match_dup 4)) (set (match_dup 0) (sign_extend:DI (match_dup 5)))] " { enum machine_mode inmode = GET_MODE (operands[1]); int offset = 0; if (GET_CODE (operands[0]) == SUBREG) { offset = SUBREG_BYTE (operands[0]); operands[0] = SUBREG_REG (operands[0]); } if (GET_CODE (operands[0]) != REG) abort (); if (! TARGET_LITTLE_ENDIAN) offset += 8 - GET_MODE_SIZE (inmode); operands[5] = gen_rtx_SUBREG (inmode, operands[0], offset); }") ;; ------------------------------------------------------------------------- ;; Shifts and rotates ;; ------------------------------------------------------------------------- (define_expand "rotldi3" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (rotate:DI (match_operand:DI 1 "arith_reg_operand" "r") (match_operand:HI 2 "mextr_bit_offset" "i")))] "TARGET_SHMEDIA" "if (! mextr_bit_offset (operands[2], HImode)) FAIL;") (define_insn "rotldi3_mextr" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (rotate:DI (match_operand:DI 1 "arith_reg_operand" "r") (match_operand:HI 2 "mextr_bit_offset" "i")))] "TARGET_SHMEDIA" "* { static char templ[16]; sprintf (templ, \"mextr%d\\t%%1,%%1,%%0\", 8 - (int) (INTVAL (operands[2]) >> 3)); return templ; }" [(set_attr "type" "arith_media")]) (define_expand "rotrdi3" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (rotatert:DI (match_operand:DI 1 "arith_reg_operand" "r") (match_operand:HI 2 "mextr_bit_offset" "i")))] "TARGET_SHMEDIA" "if (! mextr_bit_offset (operands[2], HImode)) FAIL;") (define_insn "rotrdi3_mextr" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (rotatert:DI (match_operand:DI 1 "arith_reg_operand" "r") (match_operand:HI 2 "mextr_bit_offset" "i")))] "TARGET_SHMEDIA" "* { static char templ[16]; sprintf (templ, \"mextr%d\\t%%1,%%1,%%0\", (int) INTVAL (operands[2]) >> 3); return templ; }" [(set_attr "type" "arith_media")]) (define_insn "rotlsi3_1" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (rotate:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 1))) (set (reg:SI T_REG) (lshiftrt:SI (match_dup 1) (const_int 31)))] "TARGET_SH1" "rotl %0" [(set_attr "type" "arith")]) (define_insn "rotlsi3_31" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (rotate:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 31))) (clobber (reg:SI T_REG))] "TARGET_SH1" "rotr %0" [(set_attr "type" "arith")]) (define_insn "rotlsi3_16" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (rotate:SI (match_operand:SI 1 "arith_reg_operand" "r") (const_int 16)))] "TARGET_SH1" "swap.w %1,%0" [(set_attr "type" "arith")]) (define_expand "rotlsi3" [(set (match_operand:SI 0 "arith_reg_operand" "") (rotate:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "immediate_operand" "")))] "TARGET_SH1" " { static const char rot_tab[] = { 000, 000, 000, 000, 000, 000, 010, 001, 001, 001, 011, 013, 003, 003, 003, 003, 003, 003, 003, 003, 003, 013, 012, 002, 002, 002, 010, 000, 000, 000, 000, 000, }; int count, choice; if (GET_CODE (operands[2]) != CONST_INT) FAIL; count = INTVAL (operands[2]); choice = rot_tab[count]; if (choice & 010 && SH_DYNAMIC_SHIFT_COST <= 1) FAIL; choice &= 7; switch (choice) { case 0: emit_move_insn (operands[0], operands[1]); count -= (count & 16) * 2; break; case 3: emit_insn (gen_rotlsi3_16 (operands[0], operands[1])); count -= 16; break; case 1: case 2: { rtx parts[2]; parts[0] = gen_reg_rtx (SImode); parts[1] = gen_reg_rtx (SImode); emit_insn (gen_rotlsi3_16 (parts[2-choice], operands[1])); parts[choice-1] = operands[1]; emit_insn (gen_ashlsi3 (parts[0], parts[0], GEN_INT (8))); emit_insn (gen_lshrsi3 (parts[1], parts[1], GEN_INT (8))); emit_insn (gen_iorsi3 (operands[0], parts[0], parts[1])); count = (count & ~16) - 8; } } for (; count > 0; count--) emit_insn (gen_rotlsi3_1 (operands[0], operands[0])); for (; count < 0; count++) emit_insn (gen_rotlsi3_31 (operands[0], operands[0])); DONE; }") (define_insn "*rotlhi3_8" [(set (match_operand:HI 0 "arith_reg_operand" "=r") (rotate:HI (match_operand:HI 1 "arith_reg_operand" "r") (const_int 8)))] "TARGET_SH1" "swap.b %1,%0" [(set_attr "type" "arith")]) (define_expand "rotlhi3" [(set (match_operand:HI 0 "arith_reg_operand" "") (rotate:HI (match_operand:HI 1 "arith_reg_operand" "") (match_operand:HI 2 "immediate_operand" "")))] "TARGET_SH1" " { if (GET_CODE (operands[2]) != CONST_INT || INTVAL (operands[2]) != 8) FAIL; }") ;; ;; shift left ;; This pattern is used by init_expmed for computing the costs of shift ;; insns. (define_insn_and_split "ashlsi3_std" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r,r,r") (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0,0,0,0") (match_operand:SI 2 "nonmemory_operand" "r,M,P27,?ri"))) (clobber (match_scratch:SI 3 "=X,X,X,&r"))] "TARGET_SH3 || (TARGET_SH1 && GET_CODE (operands[2]) == CONST_INT && CONST_OK_FOR_P27 (INTVAL (operands[2])))" "@ shld %2,%0 add %0,%0 shll%O2 %0 #" "TARGET_SH3 && reload_completed && GET_CODE (operands[2]) == CONST_INT && ! CONST_OK_FOR_P27 (INTVAL (operands[2]))" [(set (match_dup 3) (match_dup 2)) (parallel [(set (match_dup 0) (ashift:SI (match_dup 1) (match_dup 3))) (clobber (match_dup 4))])] "operands[4] = gen_rtx_SCRATCH (SImode);" [(set_attr "length" "*,*,*,4") (set_attr "type" "dyn_shift,arith,arith,arith")]) (define_insn "ashlhi3_k" [(set (match_operand:HI 0 "arith_reg_operand" "=r,r") (ashift:HI (match_operand:HI 1 "arith_reg_operand" "0,0") (match_operand:HI 2 "const_int_operand" "M,P27")))] "TARGET_SH1 && CONST_OK_FOR_P27 (INTVAL (operands[2]))" "@ add %0,%0 shll%O2 %0" [(set_attr "type" "arith")]) (define_insn "ashlsi3_n" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "const_int_operand" "n"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && ! sh_dynamicalize_shift_p (operands[2])" "#" [(set (attr "length") (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) (const_string "2") (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 3)) (const_string "6")] (const_string "8"))) (set_attr "type" "arith")]) (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (ashift:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "const_int_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed" [(use (reg:SI R0_REG))] " { gen_shifty_op (ASHIFT, operands); DONE; }") (define_insn "ashlsi3_media" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (ashift:SI (match_operand:SI 1 "extend_reg_operand" "r,r") (match_operand:SI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shlld.l %1, %2, %0 shlli.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "ashlsi3" [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") (ashift:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "nonmemory_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_ashlsi3_media (operands[0], operands[1], operands[2])); DONE; } if (GET_CODE (operands[2]) == CONST_INT && sh_dynamicalize_shift_p (operands[2])) operands[2] = force_reg (SImode, operands[2]); if (TARGET_SH3) { emit_insn (gen_ashlsi3_std (operands[0], operands[1], operands[2])); DONE; } if (! immediate_operand (operands[2], GET_MODE (operands[2]))) FAIL; }") (define_insn "ashlhi3" [(set (match_operand:HI 0 "arith_reg_operand" "=r") (ashift:HI (match_operand:HI 1 "arith_reg_operand" "0") (match_operand:HI 2 "const_int_operand" "n"))) (clobber (reg:SI T_REG))] "TARGET_SH1" "#" [(set (attr "length") (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) (const_string "2") (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) (const_string "4")] (const_string "6"))) (set_attr "type" "arith")]) (define_split [(set (match_operand:HI 0 "arith_reg_operand" "") (ashift:HI (match_operand:HI 1 "arith_reg_operand" "") (match_operand:HI 2 "const_int_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed" [(use (reg:SI R0_REG))] " { gen_shifty_hi_op (ASHIFT, operands); DONE; }") ; ; arithmetic shift right ; (define_insn "ashrsi3_k" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "const_int_operand" "M"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && INTVAL (operands[2]) == 1" "shar %0" [(set_attr "type" "arith")]) ;; We can't do HImode right shifts correctly unless we start out with an ;; explicit zero / sign extension; doing that would result in worse overall ;; code, so just let the machine independent code widen the mode. ;; That's why we don't have ashrhi3_k / lshrhi3_k / lshrhi3_m / lshrhi3 . ;; ??? This should be a define expand. (define_insn "ashrsi2_16" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "r") (const_int 16)))] "TARGET_SH1" "#" [(set_attr "length" "4")]) (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") (const_int 16)))] "TARGET_SH1" [(set (match_dup 0) (rotate:SI (match_dup 1) (const_int 16))) (set (match_dup 0) (sign_extend:SI (match_dup 2)))] "operands[2] = gen_lowpart (HImode, operands[0]);") ;; ??? This should be a define expand. (define_insn "ashrsi2_31" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 31))) (clobber (reg:SI T_REG))] "TARGET_SH1" "#" [(set_attr "length" "4")]) (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") (const_int 31))) (clobber (reg:SI T_REG))] "TARGET_SH1" [(const_int 0)] " { emit_insn (gen_ashlsi_c (operands[0], operands[1])); emit_insn (gen_subc1 (operands[0], operands[0], operands[0])); DONE; }") (define_insn "ashlsi_c" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashift:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 1))) (set (reg:SI T_REG) (lt:SI (match_dup 1) (const_int 0)))] "TARGET_SH1" "shll %0" [(set_attr "type" "arith")]) (define_insn "ashrsi3_d" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (neg:SI (match_operand:SI 2 "arith_reg_operand" "r"))))] "TARGET_SH3" "shad %2,%0" [(set_attr "type" "dyn_shift")]) (define_insn "ashrsi3_n" [(set (reg:SI R4_REG) (ashiftrt:SI (reg:SI R4_REG) (match_operand:SI 0 "const_int_operand" "i"))) (clobber (reg:SI T_REG)) (clobber (reg:SI PR_REG)) (use (match_operand:SI 1 "arith_reg_operand" "r"))] "TARGET_SH1" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_insn "ashrsi3_media" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (ashiftrt:SI (match_operand:SI 1 "extend_reg_operand" "r,r") (match_operand:SI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shard.l %1, %2, %0 shari.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "ashrsi3" [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") (ashiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "nonmemory_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_ashrsi3_media (operands[0], operands[1], operands[2])); DONE; } if (expand_ashiftrt (operands)) DONE; else FAIL; }") ;; logical shift right (define_insn "lshrsi3_d" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (neg:SI (match_operand:SI 2 "arith_reg_operand" "r"))))] "TARGET_SH3" "shld %2,%0" [(set_attr "type" "dyn_shift")]) ;; Only the single bit shift clobbers the T bit. (define_insn "lshrsi3_m" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "const_int_operand" "M"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && CONST_OK_FOR_M (INTVAL (operands[2]))" "shlr %0" [(set_attr "type" "arith")]) (define_insn "lshrsi3_k" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "const_int_operand" "P27")))] "TARGET_SH1 && CONST_OK_FOR_P27 (INTVAL (operands[2])) && ! CONST_OK_FOR_M (INTVAL (operands[2]))" "shlr%O2 %0" [(set_attr "type" "arith")]) (define_insn "lshrsi3_n" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (match_operand:SI 2 "const_int_operand" "n"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && ! sh_dynamicalize_shift_p (operands[2])" "#" [(set (attr "length") (cond [(eq (symbol_ref "shift_insns_rtx (insn)") (const_int 1)) (const_string "2") (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shift_insns_rtx (insn)") (const_int 3)) (const_string "6")] (const_string "8"))) (set_attr "type" "arith")]) (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "const_int_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed" [(use (reg:SI R0_REG))] " { gen_shifty_op (LSHIFTRT, operands); DONE; }") (define_insn "lshrsi3_media" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (lshiftrt:SI (match_operand:SI 1 "extend_reg_operand" "r,r") (match_operand:SI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shlrd.l %1, %2, %0 shlri.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "lshrsi3" [(parallel [(set (match_operand:SI 0 "arith_reg_operand" "") (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "nonmemory_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_lshrsi3_media (operands[0], operands[1], operands[2])); DONE; } if (GET_CODE (operands[2]) == CONST_INT && sh_dynamicalize_shift_p (operands[2])) operands[2] = force_reg (SImode, operands[2]); if (TARGET_SH3 && arith_reg_operand (operands[2], GET_MODE (operands[2]))) { rtx count = copy_to_mode_reg (SImode, operands[2]); emit_insn (gen_negsi2 (count, count)); emit_insn (gen_lshrsi3_d (operands[0], operands[1], count)); DONE; } if (! immediate_operand (operands[2], GET_MODE (operands[2]))) FAIL; }") ;; ??? This should be a define expand. (define_insn "ashldi3_k" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0") (const_int 1))) (clobber (reg:SI T_REG))] "TARGET_SH1" "shll %R0\;rotcl %S0" [(set_attr "length" "4") (set_attr "type" "arith")]) (define_insn "ashldi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (ashift:DI (match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shlld %1, %2, %0 shlli %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "ashldi3" [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") (ashift:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "immediate_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_ashldi3_media (operands[0], operands[1], operands[2])); DONE; } if (GET_CODE (operands[2]) != CONST_INT || INTVAL (operands[2]) != 1) FAIL; }") ;; ??? This should be a define expand. (define_insn "lshrdi3_k" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "0") (const_int 1))) (clobber (reg:SI T_REG))] "TARGET_SH1" "shlr %S0\;rotcr %R0" [(set_attr "length" "4") (set_attr "type" "arith")]) (define_insn "lshrdi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shlrd %1, %2, %0 shlri %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "lshrdi3" [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") (lshiftrt:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "immediate_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_lshrdi3_media (operands[0], operands[1], operands[2])); DONE; } if (GET_CODE (operands[2]) != CONST_INT || INTVAL (operands[2]) != 1) FAIL; }") ;; ??? This should be a define expand. (define_insn "ashrdi3_k" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "0") (const_int 1))) (clobber (reg:SI T_REG))] "TARGET_SH1" "shar %S0\;rotcr %R0" [(set_attr "length" "4") (set_attr "type" "arith")]) (define_insn "ashrdi3_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "nonmemory_operand" "r,n")))] "TARGET_SHMEDIA" "@ shard %1, %2, %0 shari %1, %2, %0" [(set_attr "type" "arith_media")]) (define_expand "ashrdi3" [(parallel [(set (match_operand:DI 0 "arith_reg_operand" "") (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "") (match_operand:DI 2 "immediate_operand" ""))) (clobber (reg:SI T_REG))])] "" " { if (TARGET_SHMEDIA) { emit_insn (gen_ashrdi3_media (operands[0], operands[1], operands[2])); DONE; } if (GET_CODE (operands[2]) != CONST_INT || INTVAL (operands[2]) != 1) FAIL; }") ;; combined left/right shift (define_split [(set (match_operand:SI 0 "register_operand" "") (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "") (match_operand:SI 2 "const_int_operand" "")) (match_operand:SI 3 "const_int_operand" "")))] "TARGET_SH1 && reload_completed && (unsigned)INTVAL (operands[2]) < 32" [(use (reg:SI R0_REG))] "if (gen_shl_and (operands[0], operands[2], operands[3], operands[1])) FAIL; DONE;") (define_split [(set (match_operand:SI 0 "register_operand" "") (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "") (match_operand:SI 2 "const_int_operand" "")) (match_operand:SI 3 "const_int_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1 && reload_completed && (unsigned)INTVAL (operands[2]) < 32" [(use (reg:SI R0_REG))] "if (gen_shl_and (operands[0], operands[2], operands[3], operands[1])) FAIL; DONE;") (define_insn "" [(set (match_operand:SI 0 "register_operand" "=r") (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") (match_operand:SI 2 "const_int_operand" "n")) (match_operand:SI 3 "const_int_operand" "n"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && shl_and_kind (operands[2], operands[3], 0) == 1" "#" [(set (attr "length") (cond [(eq (symbol_ref "shl_and_length (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shl_and_length (insn)") (const_int 3)) (const_string "6") (eq (symbol_ref "shl_and_length (insn)") (const_int 4)) (const_string "8") (eq (symbol_ref "shl_and_length (insn)") (const_int 5)) (const_string "10") (eq (symbol_ref "shl_and_length (insn)") (const_int 6)) (const_string "12") (eq (symbol_ref "shl_and_length (insn)") (const_int 7)) (const_string "14") (eq (symbol_ref "shl_and_length (insn)") (const_int 8)) (const_string "16")] (const_string "18"))) (set_attr "type" "arith")]) (define_insn "" [(set (match_operand:SI 0 "register_operand" "=z") (and:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") (match_operand:SI 2 "const_int_operand" "n")) (match_operand:SI 3 "const_int_operand" "n"))) (clobber (reg:SI T_REG))] "TARGET_SH1 && shl_and_kind (operands[2], operands[3], 0) == 2" "#" [(set (attr "length") (cond [(eq (symbol_ref "shl_and_length (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shl_and_length (insn)") (const_int 3)) (const_string "6") (eq (symbol_ref "shl_and_length (insn)") (const_int 4)) (const_string "8")] (const_string "10"))) (set_attr "type" "arith")]) ;; shift left / and combination with a scratch register: The combine pass ;; does not accept the individual instructions, even though they are ;; cheap. But it needs a precise description so that it is usable after ;; reload. (define_insn "and_shl_scratch" [(set (match_operand:SI 0 "register_operand" "=r,&r") (lshiftrt:SI (ashift:SI (and:SI (lshiftrt:SI (match_operand:SI 1 "register_operand" "r,0") (match_operand:SI 2 "const_int_operand" "N,n")) (match_operand:SI 3 "" "0,r")) (match_operand:SI 4 "const_int_operand" "n,n")) (match_operand:SI 5 "const_int_operand" "n,n"))) (clobber (reg:SI T_REG))] "TARGET_SH1" "#" [(set (attr "length") (cond [(eq (symbol_ref "shl_and_scr_length (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 3)) (const_string "6") (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 4)) (const_string "8") (eq (symbol_ref "shl_and_scr_length (insn)") (const_int 5)) (const_string "10")] (const_string "12"))) (set_attr "type" "arith")]) (define_split [(set (match_operand:SI 0 "register_operand" "") (lshiftrt:SI (ashift:SI (and:SI (lshiftrt:SI (match_operand:SI 1 "register_operand" "") (match_operand:SI 2 "const_int_operand" "")) (match_operand:SI 3 "register_operand" "")) (match_operand:SI 4 "const_int_operand" "")) (match_operand:SI 5 "const_int_operand" ""))) (clobber (reg:SI T_REG))] "TARGET_SH1" [(use (reg:SI R0_REG))] " { rtx and_source = operands[rtx_equal_p (operands[0], operands[1]) ? 3 : 1]; if (INTVAL (operands[2])) { gen_shifty_op (LSHIFTRT, operands); } emit_insn (gen_andsi3 (operands[0], operands[0], and_source)); operands[2] = operands[4]; gen_shifty_op (ASHIFT, operands); if (INTVAL (operands[5])) { operands[2] = operands[5]; gen_shifty_op (LSHIFTRT, operands); } DONE; }") ;; signed left/right shift combination. (define_split [(set (match_operand:SI 0 "register_operand" "") (sign_extract:SI (ashift:SI (match_operand:SI 1 "register_operand" "") (match_operand:SI 2 "const_int_operand" "")) (match_operand:SI 3 "const_int_operand" "") (const_int 0))) (clobber (reg:SI T_REG))] "TARGET_SH1" [(use (reg:SI R0_REG))] "if (gen_shl_sext (operands[0], operands[2], operands[3], operands[1])) FAIL; DONE;") (define_insn "shl_sext_ext" [(set (match_operand:SI 0 "register_operand" "=r") (sign_extract:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") (match_operand:SI 2 "const_int_operand" "n")) (match_operand:SI 3 "const_int_operand" "n") (const_int 0))) (clobber (reg:SI T_REG))] "TARGET_SH1 && (unsigned)shl_sext_kind (operands[2], operands[3], 0) - 1 < 5" "#" [(set (attr "length") (cond [(eq (symbol_ref "shl_sext_length (insn)") (const_int 1)) (const_string "2") (eq (symbol_ref "shl_sext_length (insn)") (const_int 2)) (const_string "4") (eq (symbol_ref "shl_sext_length (insn)") (const_int 3)) (const_string "6") (eq (symbol_ref "shl_sext_length (insn)") (const_int 4)) (const_string "8") (eq (symbol_ref "shl_sext_length (insn)") (const_int 5)) (const_string "10") (eq (symbol_ref "shl_sext_length (insn)") (const_int 6)) (const_string "12") (eq (symbol_ref "shl_sext_length (insn)") (const_int 7)) (const_string "14") (eq (symbol_ref "shl_sext_length (insn)") (const_int 8)) (const_string "16")] (const_string "18"))) (set_attr "type" "arith")]) (define_insn "shl_sext_sub" [(set (match_operand:SI 0 "register_operand" "=z") (sign_extract:SI (ashift:SI (match_operand:SI 1 "register_operand" "0") (match_operand:SI 2 "const_int_operand" "n")) (match_operand:SI 3 "const_int_operand" "n") (const_int 0))) (clobber (reg:SI T_REG))] "TARGET_SH1 && (shl_sext_kind (operands[2], operands[3], 0) & ~1) == 6" "#" [(set (attr "length") (cond [(eq (symbol_ref "shl_sext_length (insn)") (const_int 3)) (const_string "6") (eq (symbol_ref "shl_sext_length (insn)") (const_int 4)) (const_string "8") (eq (symbol_ref "shl_sext_length (insn)") (const_int 5)) (const_string "10") (eq (symbol_ref "shl_sext_length (insn)") (const_int 6)) (const_string "12")] (const_string "14"))) (set_attr "type" "arith")]) ;; These patterns are found in expansions of DImode shifts by 16, and ;; allow the xtrct instruction to be generated from C source. (define_insn "xtrct_left" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ior:SI (ashift:SI (match_operand:SI 1 "arith_reg_operand" "r") (const_int 16)) (lshiftrt:SI (match_operand:SI 2 "arith_reg_operand" "0") (const_int 16))))] "TARGET_SH1" "xtrct %1,%0" [(set_attr "type" "arith")]) (define_insn "xtrct_right" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (ior:SI (lshiftrt:SI (match_operand:SI 1 "arith_reg_operand" "0") (const_int 16)) (ashift:SI (match_operand:SI 2 "arith_reg_operand" "r") (const_int 16))))] "TARGET_SH1" "xtrct %2,%0" [(set_attr "type" "arith")]) ;; ------------------------------------------------------------------------- ;; Unary arithmetic ;; ------------------------------------------------------------------------- (define_insn "negc" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (neg:SI (plus:SI (reg:SI T_REG) (match_operand:SI 1 "arith_reg_operand" "r")))) (set (reg:SI T_REG) (ne:SI (ior:SI (reg:SI T_REG) (match_dup 1)) (const_int 0)))] "TARGET_SH1" "negc %1,%0" [(set_attr "type" "arith")]) (define_insn "*negdi_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (neg:DI (match_operand:DI 1 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "sub r63, %1, %0" [(set_attr "type" "arith_media")]) (define_expand "negdi2" [(set (match_operand:DI 0 "arith_reg_operand" "") (neg:DI (match_operand:DI 1 "arith_reg_operand" "")))] "" " { if (TARGET_SH1) { int low_word = (TARGET_LITTLE_ENDIAN ? 0 : 1); int high_word = (TARGET_LITTLE_ENDIAN ? 1 : 0); rtx low_src = operand_subword (operands[1], low_word, 0, DImode); rtx high_src = operand_subword (operands[1], high_word, 0, DImode); rtx low_dst = operand_subword (operands[0], low_word, 1, DImode); rtx high_dst = operand_subword (operands[0], high_word, 1, DImode); emit_insn (gen_clrt ()); emit_insn (gen_negc (low_dst, low_src)); emit_insn (gen_negc (high_dst, high_src)); DONE; } }") (define_insn "negsi2" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (neg:SI (match_operand:SI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "neg %1,%0" [(set_attr "type" "arith")]) (define_insn "one_cmplsi2" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (not:SI (match_operand:SI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "not %1,%0" [(set_attr "type" "arith")]) (define_expand "one_cmpldi2" [(set (match_operand:DI 0 "arith_reg_operand" "") (xor:DI (match_operand:DI 1 "arith_reg_operand" "") (const_int -1)))] "TARGET_SHMEDIA" "") ;; ------------------------------------------------------------------------- ;; Zero extension instructions ;; ------------------------------------------------------------------------- (define_insn "zero_extendsidi2" [(set (match_operand:DI 0 "register_operand" "=r") (zero_extend:DI (match_operand:SI 1 "extend_reg_operand" "r")))] "TARGET_SHMEDIA" "addz.l %1, r63, %0" [(set_attr "type" "arith_media")]) (define_insn "zero_extendhidi2" [(set (match_operand:DI 0 "register_operand" "=r,r") (zero_extend:DI (match_operand:HI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.uw %m1, %0" [(set_attr "type" "*,load_media")]) (define_split [(set (match_operand:DI 0 "register_operand" "") (zero_extend:DI (match_operand:HI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 48))) (set (match_dup 0) (lshiftrt:DI (match_dup 0) (const_int 48)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") ;; ??? when a truncated input to a zero_extend is reloaded, reload will ;; reload the entire truncate expression. (define_insn_and_split "*loaddi_trunc" [(set (match_operand 0 "int_gpr_dest" "=r") (truncate (match_operand:DI 1 "memory_operand" "m")))] "TARGET_SHMEDIA && reload_completed" "#" "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (match_dup 1))] "operands[0] = gen_rtx_REG (DImode, true_regnum (operands[0]));") (define_insn "zero_extendqidi2" [(set (match_operand:DI 0 "register_operand" "=r,r") (zero_extend:DI (match_operand:QI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ andi %1, 255, %0 ld%M1.ub %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_expand "zero_extendhisi2" [(set (match_operand:SI 0 "arith_reg_operand" "") (zero_extend:SI (match_operand:HI 1 "general_extend_operand" "")))] "" " { if (! TARGET_SHMEDIA && ! arith_reg_operand (operands[1], HImode)) operands[1] = copy_to_mode_reg (HImode, operands[1]); }") (define_insn "*zero_extendhisi2_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (zero_extend:SI (match_operand:HI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "extu.w %1,%0" [(set_attr "type" "arith")]) (define_insn "*zero_extendhisi2_media" [(set (match_operand:SI 0 "register_operand" "=r,r") (zero_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.uw %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_split [(set (match_operand:SI 0 "register_operand" "") (zero_extend:SI (match_operand:HI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 16))) (set (match_dup 0) (lshiftrt:SI (match_dup 0) (const_int 16)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") (define_expand "zero_extendqisi2" [(set (match_operand:SI 0 "arith_reg_operand" "") (zero_extend:SI (match_operand:QI 1 "general_extend_operand" "")))] "" " { if (! TARGET_SHMEDIA && ! arith_reg_operand (operands[1], QImode)) operands[1] = copy_to_mode_reg (QImode, operands[1]); }") (define_insn "*zero_extendqisi2_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (zero_extend:SI (match_operand:QI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "extu.b %1,%0" [(set_attr "type" "arith")]) (define_insn "*zero_extendqisi2_media" [(set (match_operand:SI 0 "register_operand" "=r,r") (zero_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ andi %1, 255, %0 ld%M1.ub %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_insn "zero_extendqihi2" [(set (match_operand:HI 0 "arith_reg_operand" "=r") (zero_extend:HI (match_operand:QI 1 "arith_reg_operand" "r")))] "TARGET_SH1" "extu.b %1,%0" [(set_attr "type" "arith")]) ;; ------------------------------------------------------------------------- ;; Sign extension instructions ;; ------------------------------------------------------------------------- ;; ??? This should be a define expand. ;; ??? Or perhaps it should be dropped? ;; convert_move generates good code for SH[1-4]. (define_insn "extendsidi2" [(set (match_operand:DI 0 "register_operand" "=r,r") (sign_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m")))] "TARGET_SHMEDIA" "@ add.l %1, r63, %0 ld%M1.l %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_insn "extendhidi2" [(set (match_operand:DI 0 "register_operand" "=r,r") (sign_extend:DI (match_operand:HI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.w %m1, %0" [(set_attr "type" "*,load_media")]) (define_split [(set (match_operand:DI 0 "register_operand" "") (sign_extend:DI (match_operand:HI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 48))) (set (match_dup 0) (ashiftrt:DI (match_dup 0) (const_int 48)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") (define_insn "extendqidi2" [(set (match_operand:DI 0 "register_operand" "=r,r") (sign_extend:DI (match_operand:QI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.b %m1, %0" [(set_attr "type" "*,load_media")]) (define_split [(set (match_operand:DI 0 "register_operand" "") (sign_extend:DI (match_operand:QI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:DI (subreg:DI (match_dup 1) 0) (const_int 56))) (set (match_dup 0) (ashiftrt:DI (match_dup 0) (const_int 56)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") (define_expand "extendhisi2" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (sign_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] "" "") (define_insn "*extendhisi2_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (sign_extend:SI (match_operand:HI 1 "general_movsrc_operand" "r,m")))] "TARGET_SH1" "@ exts.w %1,%0 mov.w %1,%0" [(set_attr "type" "arith,load")]) (define_insn "*extendhisi2_media" [(set (match_operand:SI 0 "register_operand" "=r,r") (sign_extend:SI (match_operand:HI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.w %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_split [(set (match_operand:SI 0 "register_operand" "") (sign_extend:SI (match_operand:HI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 16))) (set (match_dup 0) (ashiftrt:SI (match_dup 0) (const_int 16)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") (define_expand "extendqisi2" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (sign_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] "" "") (define_insn "*extendqisi2_compact" [(set (match_operand:SI 0 "arith_reg_operand" "=r,r") (sign_extend:SI (match_operand:QI 1 "general_movsrc_operand" "r,m")))] "TARGET_SH1" "@ exts.b %1,%0 mov.b %1,%0" [(set_attr "type" "arith,load")]) (define_insn "*extendqisi2_media" [(set (match_operand:SI 0 "register_operand" "=r,r") (sign_extend:SI (match_operand:QI 1 "general_extend_operand" "r,m")))] "TARGET_SHMEDIA" "@ # ld%M1.b %m1, %0" [(set_attr "type" "arith_media,load_media")]) (define_split [(set (match_operand:SI 0 "register_operand" "") (sign_extend:SI (match_operand:QI 1 "extend_reg_operand" "")))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 0) (ashift:SI (subreg:SI (match_dup 1) 0) (const_int 24))) (set (match_dup 0) (ashiftrt:SI (match_dup 0) (const_int 24)))] " { if (GET_CODE (operands[1]) == TRUNCATE) operands[1] = XEXP (operands[1], 0); }") (define_insn "extendqihi2" [(set (match_operand:HI 0 "arith_reg_operand" "=r,r") (sign_extend:HI (match_operand:QI 1 "general_movsrc_operand" "r,m")))] "TARGET_SH1" "@ exts.b %1,%0 mov.b %1,%0" [(set_attr "type" "arith,load")]) /* It would seem useful to combine the truncXi patterns into the movXi patterns, but unary operators are ignored when matching constraints, so we need separate patterns. */ (define_insn "truncdisi2" [(set (match_operand:SI 0 "general_movdst_operand" "=r,m,m,f,r,f") (truncate:SI (match_operand:DI 1 "register_operand" "r,r,f,r,f,f")))] "TARGET_SHMEDIA" "@ add.l %1, r63, %0 st%M0.l %m0, %1 fst%M0.s %m0, %T1 fmov.ls %1, %0 fmov.sl %T1, %0 fmov.s %T1, %0" [(set_attr "type" "arith_media,store_media,fstore_media,fload_media,fpconv_media,fmove_media")]) (define_insn "truncdihi2" [(set (match_operand:HI 0 "general_movdst_operand" "=?r,m") (truncate:HI (match_operand:DI 1 "register_operand" "r,r")))] "TARGET_SHMEDIA" "@ shlli\\t%1,48,%0\;shlri\\t%0,48,%0 st%M0.w %m0, %1" [(set_attr "type" "arith_media,store_media") (set_attr "length" "8,4")]) ; N.B. This should agree with LOAD_EXTEND_OP and movqi. ; Because we use zero extension, we can't provide signed QImode compares ; using a simple compare or conditional banch insn. (define_insn "truncdiqi2" [(set (match_operand:QI 0 "general_movdst_operand" "=r,m") (truncate:QI (match_operand:DI 1 "register_operand" "r,r")))] "TARGET_SHMEDIA" "@ andi %1, 255, %0 st%M0.b %m0, %1" [(set_attr "type" "arith_media,store")]) ;; ------------------------------------------------------------------------- ;; Move instructions ;; ------------------------------------------------------------------------- ;; define push and pop so it is easy for sh.c ;; We can't use push and pop on SHcompact because the stack must always ;; be 8-byte aligned. (define_expand "push" [(set (mem:SI (pre_dec:SI (reg:SI SP_REG))) (match_operand:SI 0 "register_operand" "r,l,x"))] "TARGET_SH1 && ! TARGET_SH5" "") (define_expand "pop" [(set (match_operand:SI 0 "register_operand" "=r,l,x") (mem:SI (post_inc:SI (reg:SI SP_REG))))] "TARGET_SH1 && ! TARGET_SH5" "") (define_expand "push_e" [(parallel [(set (mem:SF (pre_dec:SI (reg:SI SP_REG))) (match_operand:SF 0 "" "")) (use (reg:PSI FPSCR_REG)) (clobber (scratch:SI))])] "TARGET_SH1 && ! TARGET_SH5" "") (define_insn "push_fpul" [(set (mem:SF (pre_dec:SI (reg:SI SP_REG))) (reg:SF FPUL_REG))] "TARGET_SH2E && ! TARGET_SH5" "sts.l fpul,@-r15" [(set_attr "type" "store") (set_attr "late_fp_use" "yes") (set_attr "hit_stack" "yes")]) ;; DFmode pushes for sh4 require a lot of what is defined for movdf_i4, ;; so use that. (define_expand "push_4" [(parallel [(set (mem:DF (pre_dec:SI (reg:SI SP_REG))) (match_operand:DF 0 "" "")) (use (reg:PSI FPSCR_REG)) (clobber (scratch:SI))])] "TARGET_SH1 && ! TARGET_SH5" "") (define_expand "pop_e" [(parallel [(set (match_operand:SF 0 "" "") (mem:SF (post_inc:SI (reg:SI SP_REG)))) (use (reg:PSI FPSCR_REG)) (clobber (scratch:SI))])] "TARGET_SH1 && ! TARGET_SH5" "") (define_insn "pop_fpul" [(set (reg:SF FPUL_REG) (mem:SF (post_inc:SI (reg:SI SP_REG))))] "TARGET_SH2E && ! TARGET_SH5" "lds.l @r15+,fpul" [(set_attr "type" "load") (set_attr "hit_stack" "yes")]) (define_expand "pop_4" [(parallel [(set (match_operand:DF 0 "" "") (mem:DF (post_inc:SI (reg:SI SP_REG)))) (use (reg:PSI FPSCR_REG)) (clobber (scratch:SI))])] "TARGET_SH1 && ! TARGET_SH5" "") (define_expand "push_fpscr" [(const_int 0)] "TARGET_SH2E" " { rtx insn = emit_insn (gen_fpu_switch (gen_rtx (MEM, PSImode, gen_rtx (PRE_DEC, Pmode, stack_pointer_rtx)), get_fpscr_rtx ())); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); DONE; }") (define_expand "pop_fpscr" [(const_int 0)] "TARGET_SH2E" " { rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), gen_rtx (MEM, PSImode, gen_rtx (POST_INC, Pmode, stack_pointer_rtx)))); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); DONE; }") ;; These two patterns can happen as the result of optimization, when ;; comparisons get simplified to a move of zero or 1 into the T reg. ;; They don't disappear completely, because the T reg is a fixed hard reg. (define_insn "clrt" [(set (reg:SI T_REG) (const_int 0))] "TARGET_SH1" "clrt") (define_insn "sett" [(set (reg:SI T_REG) (const_int 1))] "TARGET_SH1" "sett") ;; t/r must come after r/r, lest reload will try to reload stuff like ;; (set (subreg:SI (mem:QI (plus:SI (reg:SI SP_REG) (const_int 12)) 0) 0) ;; (made from (set (subreg:SI (reg:QI ###) 0) ) into T. (define_insn "movsi_i" [(set (match_operand:SI 0 "general_movdst_operand" "=r,r,t,r,r,r,r,m,<,<,x,l,x,l,r") (match_operand:SI 1 "general_movsrc_operand" "Q,rI08,r,mr,x,l,t,r,x,l,r,r,>,>,i"))] "TARGET_SH1 && ! TARGET_SH2E && (register_operand (operands[0], SImode) || register_operand (operands[1], SImode))" "@ mov.l %1,%0 mov %1,%0 cmp/pl %1 mov.l %1,%0 sts %1,%0 sts %1,%0 movt %0 mov.l %1,%0 sts.l %1,%0 sts.l %1,%0 lds %1,%0 lds %1,%0 lds.l %1,%0 lds.l %1,%0 fake %1,%0" [(set_attr "type" "pcload_si,move,mt_group,load_si,mac_gp,prget,move,store,store,pstore,move,prset,load,pload,pcload_si") (set_attr "length" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*")]) ;; t/r must come after r/r, lest reload will try to reload stuff like ;; (subreg:SI (reg:SF FR14_REG) 0) into T (compiling stdlib/strtod.c -m3e -O2) ;; ??? This allows moves from macl to fpul to be recognized, but these moves ;; will require a reload. ;; ??? We can't include f/f because we need the proper FPSCR setting when ;; TARGET_FMOVD is in effect, and mode switching is done before reload. (define_insn "movsi_ie" [(set (match_operand:SI 0 "general_movdst_operand" "=r,r,t,r,r,r,r,m,<,<,x,l,x,l,y,<,r,y,r,*f,y,*f,y") (match_operand:SI 1 "general_movsrc_operand" "Q,rI08,r,mr,x,l,t,r,x,l,r,r,>,>,>,y,i,r,y,y,*f,*f,y"))] "TARGET_SH2E && (register_operand (operands[0], SImode) || register_operand (operands[1], SImode))" "@ mov.l %1,%0 mov %1,%0 cmp/pl %1 mov.l %1,%0 sts %1,%0 sts %1,%0 movt %0 mov.l %1,%0 sts.l %1,%0 sts.l %1,%0 lds %1,%0 lds %1,%0 lds.l %1,%0 lds.l %1,%0 lds.l %1,%0 sts.l %1,%0 fake %1,%0 lds %1,%0 sts %1,%0 fsts fpul,%0 flds %1,fpul fmov %1,%0 ! move optimized away" [(set_attr "type" "pcload_si,move,*,load_si,mac_gp,prget,move,store,store,pstore,move,prset,load,pload,load,store,pcload_si,gp_fpul,fpul_gp,fmove,fmove,fmove,nil") (set_attr "late_fp_use" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,yes,*,*,yes,*,*,*,*") (set_attr "length" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,*,0")]) (define_insn "movsi_i_lowpart" [(set (strict_low_part (match_operand:SI 0 "general_movdst_operand" "+r,r,r,r,r,r,m,r")) (match_operand:SI 1 "general_movsrc_operand" "Q,rI08,mr,x,l,t,r,i"))] "TARGET_SH1 && (register_operand (operands[0], SImode) || register_operand (operands[1], SImode))" "@ mov.l %1,%0 mov %1,%0 mov.l %1,%0 sts %1,%0 sts %1,%0 movt %0 mov.l %1,%0 fake %1,%0" [(set_attr "type" "pcload,move,load,move,prget,move,store,pcload")]) (define_insn_and_split "load_ra" [(set (match_operand:SI 0 "general_movdst_operand" "") (unspec:SI [(match_operand 1 "register_operand" "")] UNSPEC_RA))] "TARGET_SH1" "#" "&& ! rtx_equal_function_value_matters" [(set (match_dup 0) (match_dup 1))] " { if (TARGET_SHCOMPACT && current_function_has_nonlocal_label) operands[1] = gen_rtx_MEM (SImode, return_address_pointer_rtx); }") (define_insn "*movsi_media" [(set (match_operand:SI 0 "general_movdst_operand" "=r,r,r,r,m,f,m,f,r,f,*b,r,b") (match_operand:SI 1 "general_movsrc_operand" "r,I16C16,nCpg,m,rZ,m,f,rZ,f,f,r,*b,Csy"))] "TARGET_SHMEDIA_FPU && (register_operand (operands[0], SImode) || sh_register_operand (operands[1], SImode))" "@ add.l %1, r63, %0 movi %1, %0 # ld%M1.l %m1, %0 st%M0.l %m0, %N1 fld%M1.s %m1, %0 fst%M0.s %m0, %1 fmov.ls %N1, %0 fmov.sl %1, %0 fmov.s %1, %0 ptabs %1, %0 gettr %1, %0 pt %1, %0" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,fload_media,fstore_media,fload_media,fpconv_media,fmove_media,ptabs_media,gettr_media,pt_media") (set_attr "length" "4,4,8,4,4,4,4,4,4,4,4,4,12")]) (define_insn "*movsi_media_nofpu" [(set (match_operand:SI 0 "general_movdst_operand" "=r,r,r,r,m,*b,r,b") (match_operand:SI 1 "general_movsrc_operand" "r,I16C16,nCpg,m,rZ,r,*b,Csy"))] "TARGET_SHMEDIA && (register_operand (operands[0], SImode) || sh_register_operand (operands[1], SImode))" "@ add.l %1, r63, %0 movi %1, %0 # ld%M1.l %m1, %0 st%M0.l %m0, %N1 ptabs %1, %0 gettr %1, %0 pt %1, %0" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,ptabs_media,gettr_media,pt_media") (set_attr "length" "4,4,8,4,4,4,4,12")]) (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (match_operand:SI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && MOVI_SHORI_BASE_OPERAND_P (operands[1])" [(set (subreg:DI (match_dup 0) 0) (match_dup 2))] " { operands[2] = shallow_copy_rtx (operands[1]); PUT_MODE (operands[2], DImode); }") (define_split [(set (match_operand:SI 0 "register_operand" "") (match_operand:SI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && ((GET_CODE (operands[1]) == CONST_INT && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))) || GET_CODE (operands[1]) == CONST_DOUBLE)" [(set (subreg:DI (match_dup 0) 0) (match_dup 1))]) (define_expand "movsi" [(set (match_operand:SI 0 "general_movdst_operand" "") (match_operand:SI 1 "general_movsrc_operand" ""))] "" "{ if (prepare_move_operands (operands, SImode)) DONE; }") (define_expand "ic_invalidate_line" [(parallel [(unspec_volatile [(match_operand:SI 0 "register_operand" "+r") (match_dup 1)] UNSPEC_ICACHE) (clobber (scratch:SI))])] "TARGET_HARD_SH4 || TARGET_SH5" " { if (TARGET_SHMEDIA) { emit_insn (gen_ic_invalidate_line_media (operands[0])); DONE; } else if (TARGET_SHCOMPACT) { operands[1] = function_symbol (\"__ic_invalidate\"); operands[1] = force_reg (Pmode, operands[1]); emit_insn (gen_ic_invalidate_line_compact (operands[0], operands[1])); DONE; } operands[0] = force_reg (Pmode, operands[0]); operands[1] = force_reg (Pmode, GEN_INT (trunc_int_for_mode (0xf0000008, Pmode))); }") ;; The address %0 is assumed to be 4-aligned at least. Thus, by ORing ;; 0xf0000008, we get the low-oder bits *1*00 (binary), which fits ;; the requirement *1*00 for associative address writes. The alignment of ;; %0 implies that its least significant bit is cleared, ;; thus we clear the V bit of a matching entry if there is one. (define_insn "ic_invalidate_line_i" [(unspec_volatile [(match_operand:SI 0 "register_operand" "r") (match_operand:SI 1 "register_operand" "r")] UNSPEC_ICACHE) (clobber (match_scratch:SI 2 "=&r"))] "TARGET_HARD_SH4" "ocbwb\\t@%0\;extu.w\\t%0,%2\;or\\t%1,%2\;mov.l\\t%0,@%2" [(set_attr "length" "8") (set_attr "type" "cwb")]) ;; ??? could make arg 0 an offsettable memory operand to allow to save ;; an add in the code that calculates the address. (define_insn "ic_invalidate_line_media" [(unspec_volatile [(match_operand 0 "register_operand" "r")] UNSPEC_ICACHE)] "TARGET_SHMEDIA" "ocbwb %0,0\;synco\;icbi %0, 0\;synci" [(set_attr "length" "16") (set_attr "type" "invalidate_line_media")]) (define_insn "ic_invalidate_line_compact" [(unspec_volatile [(match_operand:SI 0 "register_operand" "z") (match_operand:SI 1 "register_operand" "r")] UNSPEC_ICACHE) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_expand "initialize_trampoline" [(match_operand:SI 0 "" "") (match_operand:SI 1 "" "") (match_operand:SI 2 "" "")] "TARGET_SHCOMPACT" " { rtx sfun, tramp; tramp = force_reg (Pmode, operands[0]); sfun = force_reg (Pmode, function_symbol (\"__init_trampoline\")); emit_move_insn (gen_rtx_REG (SImode, R2_REG), operands[1]); emit_move_insn (gen_rtx_REG (SImode, R3_REG), operands[2]); emit_insn (gen_initialize_trampoline_compact (tramp, sfun)); DONE; }") (define_insn "initialize_trampoline_compact" [(unspec_volatile [(match_operand:SI 0 "register_operand" "z") (match_operand:SI 1 "register_operand" "r") (reg:SI R2_REG) (reg:SI R3_REG)] UNSPEC_INIT_TRAMP) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT" "jsr @%1%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_insn "movqi_i" [(set (match_operand:QI 0 "general_movdst_operand" "=r,r,m,r,r,l") (match_operand:QI 1 "general_movsrc_operand" "ri,m,r,t,l,r"))] "TARGET_SH1 && (arith_reg_operand (operands[0], QImode) || arith_reg_operand (operands[1], QImode))" "@ mov %1,%0 mov.b %1,%0 mov.b %1,%0 movt %0 sts %1,%0 lds %1,%0" [(set_attr "type" "move,load,store,move,move,move")]) (define_insn "*movqi_media" [(set (match_operand:QI 0 "general_movdst_operand" "=r,r,r,m") (match_operand:QI 1 "general_movsrc_operand" "r,I16C16,m,rZ"))] "TARGET_SHMEDIA && (arith_reg_operand (operands[0], QImode) || arith_reg_or_0_operand (operands[1], QImode))" "@ add.l %1, r63, %0 movi %1, %0 ld%M1.ub %m1, %0 st%M0.b %m0, %N1" [(set_attr "type" "arith_media,arith_media,load_media,store_media")]) (define_expand "movqi" [(set (match_operand:QI 0 "general_operand" "") (match_operand:QI 1 "general_operand" ""))] "" "{ if (prepare_move_operands (operands, QImode)) DONE; }") (define_expand "reload_inqi" [(set (match_operand:SI 2 "" "=&r") (match_operand:QI 1 "inqhi_operand" "")) (set (match_operand:QI 0 "arith_reg_operand" "=r") (truncate:QI (match_dup 3)))] "TARGET_SHMEDIA" " { rtx inner = XEXP (operands[1], 0); int regno = REGNO (inner); regno += HARD_REGNO_NREGS (regno, GET_MODE (inner)) - 1; operands[1] = gen_rtx_REG (SImode, regno); operands[3] = gen_rtx_REG (DImode, REGNO (operands[2])); }") /* When storing r0, we have to avoid reg+reg addressing. */ (define_insn "movhi_i" [(set (match_operand:HI 0 "general_movdst_operand" "=r,r,r,r,m,r,l,r") (match_operand:HI 1 "general_movsrc_operand" "Q,rI08,m,t,r,l,r,i"))] "TARGET_SH1 && (arith_reg_operand (operands[0], HImode) || arith_reg_operand (operands[1], HImode)) && (GET_CODE (operands[0]) != MEM || GET_CODE (XEXP (operands[0], 0)) != PLUS || GET_CODE (XEXP (XEXP (operands[0], 0), 1)) != REG || ! refers_to_regno_p (R0_REG, R0_REG + 1, operands[1], (rtx *)0))" "@ mov.w %1,%0 mov %1,%0 mov.w %1,%0 movt %0 mov.w %1,%0 sts %1,%0 lds %1,%0 fake %1,%0" [(set_attr "type" "pcload,move,load,move,store,move,move,pcload")]) (define_insn "*movhi_media" [(set (match_operand:HI 0 "general_movdst_operand" "=r,r,r,r,m") (match_operand:HI 1 "general_movsrc_operand" "r,I16C16,n,m,rZ"))] "TARGET_SHMEDIA && (arith_reg_operand (operands[0], HImode) || arith_reg_or_0_operand (operands[1], HImode))" "@ add.l %1, r63, %0 movi %1, %0 # ld%M1.w %m1, %0 st%M0.w %m0, %N1" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media")]) (define_split [(set (match_operand:HI 0 "register_operand" "") (match_operand:HI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))" [(set (subreg:DI (match_dup 0) 0) (match_dup 1))]) (define_expand "movhi" [(set (match_operand:HI 0 "general_movdst_operand" "") (match_operand:HI 1 "general_movsrc_operand" ""))] "" "{ if (prepare_move_operands (operands, HImode)) DONE; }") (define_expand "reload_inhi" [(set (match_operand:SI 2 "" "=&r") (match_operand:HI 1 "inqhi_operand" "")) (set (match_operand:HI 0 "arith_reg_operand" "=r") (truncate:HI (match_dup 3)))] "TARGET_SHMEDIA" " { rtx inner = XEXP (operands[1], 0); int regno = REGNO (inner); regno += HARD_REGNO_NREGS (regno, GET_MODE (inner)) - 1; operands[1] = gen_rtx_REG (SImode, regno); operands[3] = gen_rtx_REG (DImode, REGNO (operands[2])); }") ;; x/r can be created by inlining/cse, e.g. for execute/961213-1.c ;; compiled with -m2 -ml -O3 -funroll-loops (define_insn "*movdi_i" [(set (match_operand:DI 0 "general_movdst_operand" "=r,r,r,m,r,r,r,*!x") (match_operand:DI 1 "general_movsrc_operand" "Q,r,m,r,I08,i,x,r"))] "TARGET_SH1 && (arith_reg_operand (operands[0], DImode) || arith_reg_operand (operands[1], DImode))" "* return output_movedouble (insn, operands, DImode);" [(set_attr "length" "4") (set_attr "type" "pcload,move,load,store,move,pcload,move,move")]) ;; If the output is a register and the input is memory or a register, we have ;; to be careful and see which word needs to be loaded first. (define_split [(set (match_operand:DI 0 "general_movdst_operand" "") (match_operand:DI 1 "general_movsrc_operand" ""))] "TARGET_SH1 && reload_completed" [(set (match_dup 2) (match_dup 3)) (set (match_dup 4) (match_dup 5))] " { int regno; if ((GET_CODE (operands[0]) == MEM && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC) || (GET_CODE (operands[1]) == MEM && GET_CODE (XEXP (operands[1], 0)) == POST_INC)) FAIL; if (GET_CODE (operands[0]) == REG) regno = REGNO (operands[0]); else if (GET_CODE (operands[0]) == SUBREG) regno = subreg_regno (operands[0]); else if (GET_CODE (operands[0]) == MEM) regno = -1; else abort (); if (regno == -1 || ! refers_to_regno_p (regno, regno + 1, operands[1], 0)) { operands[2] = operand_subword (operands[0], 0, 0, DImode); operands[3] = operand_subword (operands[1], 0, 0, DImode); operands[4] = operand_subword (operands[0], 1, 0, DImode); operands[5] = operand_subword (operands[1], 1, 0, DImode); } else { operands[2] = operand_subword (operands[0], 1, 0, DImode); operands[3] = operand_subword (operands[1], 1, 0, DImode); operands[4] = operand_subword (operands[0], 0, 0, DImode); operands[5] = operand_subword (operands[1], 0, 0, DImode); } if (operands[2] == 0 || operands[3] == 0 || operands[4] == 0 || operands[5] == 0) FAIL; }") (define_insn "*movdi_media" [(set (match_operand:DI 0 "general_movdst_operand" "=r,r,r,rl,m,f,m,f,r,f,*b,r,b") (match_operand:DI 1 "general_movsrc_operand" "r,I16C16,nCpgF,m,rlZ,m,f,rZ,f,f,r,*b,Csy"))] "TARGET_SHMEDIA_FPU && (register_operand (operands[0], DImode) || sh_register_operand (operands[1], DImode))" "@ add %1, r63, %0 movi %1, %0 # ld%M1.q %m1, %0 st%M0.q %m0, %N1 fld%M1.d %m1, %0 fst%M0.d %m0, %1 fmov.qd %N1, %0 fmov.dq %1, %0 fmov.d %1, %0 ptabs %1, %0 gettr %1, %0 pt %1, %0" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,fload_media,fstore_media,fload_media,dfpconv_media,fmove_media,ptabs_media,gettr_media,pt_media") (set_attr "length" "4,4,16,4,4,4,4,4,4,4,4,4,*")]) (define_insn "*movdi_media_nofpu" [(set (match_operand:DI 0 "general_movdst_operand" "=r,r,r,rl,m,*b,r,b") (match_operand:DI 1 "general_movsrc_operand" "r,I16C16,nCpgF,m,rlZ,r,*b,Csy"))] "TARGET_SHMEDIA && (register_operand (operands[0], DImode) || sh_register_operand (operands[1], DImode))" "@ add %1, r63, %0 movi %1, %0 # ld%M1.q %m1, %0 st%M0.q %m0, %N1 ptabs %1, %0 gettr %1, %0 pt %1, %0" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media,ptabs_media,gettr_media,pt_media") (set_attr "length" "4,4,16,4,4,4,4,*")]) (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (match_operand:DI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && MOVI_SHORI_BASE_OPERAND_P (operands[1])" [(set (match_dup 0) (match_dup 1))] " { rtx insn; if (TARGET_SHMEDIA64) insn = emit_insn (gen_movdi_const (operands[0], operands[1])); else insn = emit_insn (gen_movdi_const_32bit (operands[0], operands[1])); REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, operands[1], REG_NOTES (insn)); DONE; }") (define_expand "movdi_const" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (const:DI (sign_extend:DI (truncate:HI (ashiftrt:DI (match_operand:DI 1 "immediate_operand" "s") (const_int 48)))))) (set (match_dup 0) (ior:DI (ashift:DI (match_dup 0) (const_int 16)) (zero_extend:DI (truncate:HI (const:DI (sign_extend:DI (truncate:HI (ashiftrt:SI (match_dup 1) (const_int 32))))))))) (set (match_dup 0) (ior:DI (ashift:DI (match_dup 0) (const_int 16)) (zero_extend:DI (truncate:HI (const:DI (sign_extend:DI (truncate:HI (ashiftrt:SI (match_dup 1) (const_int 16))))))))) (set (match_dup 0) (ior:DI (ashift:DI (match_dup 0) (const_int 16)) (zero_extend:DI (truncate:HI (const:DI (sign_extend:DI (truncate:HI (match_dup 1))))))))] "TARGET_SHMEDIA64 && reload_completed && MOVI_SHORI_BASE_OPERAND_P (operands[1])" " { sh_mark_label (operands[1], 4); }") (define_expand "movdi_const_32bit" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (const:DI (sign_extend:DI (truncate:HI (ashiftrt:DI (match_operand:DI 1 "immediate_operand" "s") (const_int 16)))))) (set (match_dup 0) (ior:DI (ashift:DI (match_dup 0) (const_int 16)) (zero_extend:DI (truncate:HI (const:DI (sign_extend:DI (truncate:HI (match_dup 1))))))))] "TARGET_SHMEDIA32 && reload_completed && MOVI_SHORI_BASE_OPERAND_P (operands[1])" " { sh_mark_label (operands[1], 2); }") (define_expand "movdi_const_16bit" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (const:DI (sign_extend:DI (truncate:HI (match_operand:DI 1 "immediate_operand" "s")))))] "TARGET_SHMEDIA && flag_pic && reload_completed && GET_CODE (operands[1]) == SYMBOL_REF" "") (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (match_operand:DI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && GET_CODE (operands[1]) == CONST_INT && ! CONST_OK_FOR_I16 (INTVAL (operands[1]))" [(set (match_dup 0) (match_dup 2)) (match_dup 1)] " { unsigned HOST_WIDE_INT val = INTVAL (operands[1]); unsigned HOST_WIDE_INT low = val; unsigned HOST_WIDE_INT high = val; unsigned HOST_WIDE_INT sign; unsigned HOST_WIDE_INT val2 = val ^ (val-1); /* Sign-extend the 16 least-significant bits. */ low &= 0xffff; low ^= 0x8000; low -= 0x8000; /* Arithmetic shift right the word by 16 bits. */ high >>= 16; sign = 1; sign <<= (HOST_BITS_PER_WIDE_INT - 16 - 1); high ^= sign; high -= sign; do { /* If we can't generate the constant with a two-insn movi / shori sequence, try some other strategies. */ if (! CONST_OK_FOR_I16 (high)) { /* Try constant load / left shift. We know VAL != 0. */ val2 = val ^ (val-1); if (val2 > 0x1ffff) { int trailing_zeroes = exact_log2 ((val2 >> 16) + 1) + 15; if (CONST_OK_FOR_I16 (val >> trailing_zeroes) || (! CONST_OK_FOR_I16 (high >> 16) && CONST_OK_FOR_I16 (val >> (trailing_zeroes + 16)))) { val2 = (HOST_WIDE_INT) val >> trailing_zeroes; operands[1] = gen_ashldi3_media (operands[0], operands[0], GEN_INT (trailing_zeroes)); break; } } /* Try constant load / right shift. */ val2 = (val >> 15) + 1; if (val2 == (val2 & -val2)) { int shift = 49 - exact_log2 (val2); val2 = trunc_int_for_mode (val << shift, DImode); if (CONST_OK_FOR_I16 (val2)) { operands[1] = gen_lshrdi3_media (operands[0], operands[0], GEN_INT (shift)); break; } } /* Try mperm.w . */ val2 = val & 0xffff; if ((val >> 16 & 0xffff) == val2 && (val >> 32 & 0xffff) == val2 && (val >> 48 & 0xffff) == val2) { val2 = (HOST_WIDE_INT) val >> 48; operands[1] = gen_rtx_REG (V4HImode, true_regnum (operands[0])); operands[1] = gen_mperm_w0 (operands[1], operands[1]); break; } /* Try movi / mshflo.l */ val2 = (HOST_WIDE_INT) val >> 32; if (val2 == trunc_int_for_mode (val, SImode)) { operands[1] = gen_mshflo_l_di (operands[0], operands[0], operands[0]); break; } /* Try movi / mshflo.l w/ r63. */ val2 = val + ((HOST_WIDE_INT) -1 << 32); if ((HOST_WIDE_INT) val2 < 0 && CONST_OK_FOR_I16 (val2)) { operands[1] = gen_mshflo_l_di (operands[0], operands[0], GEN_INT (0)); break; } } val2 = high; operands[1] = gen_shori_media (operands[0], operands[0], GEN_INT (low)); } while (0); operands[2] = GEN_INT (val2); }") (define_split [(set (match_operand:DI 0 "arith_reg_operand" "") (match_operand:DI 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && GET_CODE (operands[1]) == CONST_DOUBLE" [(set (match_dup 0) (match_dup 2)) (set (match_dup 0) (ior:DI (ashift:DI (match_dup 0) (const_int 16)) (zero_extend:DI (truncate:HI (match_dup 1)))))] " { unsigned HOST_WIDE_INT low = CONST_DOUBLE_LOW (operands[1]); unsigned HOST_WIDE_INT high = CONST_DOUBLE_HIGH (operands[1]); unsigned HOST_WIDE_INT val = low; unsigned HOST_WIDE_INT sign; /* Sign-extend the 16 least-significant bits. */ val &= 0xffff; val ^= 0x8000; val -= 0x8000; operands[1] = GEN_INT (val); /* Arithmetic shift right the double-word by 16 bits. */ low >>= 16; low |= (high & 0xffff) << (HOST_BITS_PER_WIDE_INT - 16); high >>= 16; sign = 1; sign <<= (HOST_BITS_PER_WIDE_INT - 16 - 1); high ^= sign; high -= sign; /* This will only be true if high is a sign-extension of low, i.e., it must be either 0 or (unsigned)-1, and be zero iff the most-significant bit of low is set. */ if (high + (low >> (HOST_BITS_PER_WIDE_INT - 1)) == 0) operands[2] = GEN_INT (low); else operands[2] = immed_double_const (low, high, DImode); }") (define_insn "shori_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r,r") (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0,0") (const_int 16)) (zero_extend:DI (truncate:HI (match_operand:DI 2 "immediate_operand" "I16C16,nF")))))] "TARGET_SHMEDIA" "@ shori %u2, %0 #" [(set_attr "type" "arith_media,*")]) (define_expand "movdi" [(set (match_operand:DI 0 "general_movdst_operand" "") (match_operand:DI 1 "general_movsrc_operand" ""))] "" "{ if (prepare_move_operands (operands, DImode)) DONE; }") (define_insn "movdf_media" [(set (match_operand:DF 0 "general_movdst_operand" "=f,f,r,r,r,f,m,r,m") (match_operand:DF 1 "general_movsrc_operand" "f,rZ,f,r,F,m,f,m,rZ"))] "TARGET_SHMEDIA_FPU && (register_operand (operands[0], DFmode) || sh_register_operand (operands[1], DFmode))" "@ fmov.d %1, %0 fmov.qd %N1, %0 fmov.dq %1, %0 add %1, r63, %0 # fld%M1.d %m1, %0 fst%M0.d %m0, %1 ld%M1.q %m1, %0 st%M0.q %m0, %N1" [(set_attr "type" "fmove_media,fload_media,dfpconv_media,arith_media,*,fload_media,fstore_media,load_media,store_media")]) (define_insn "movdf_media_nofpu" [(set (match_operand:DF 0 "general_movdst_operand" "=r,r,r,m") (match_operand:DF 1 "general_movsrc_operand" "r,F,m,rZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], DFmode) || sh_register_operand (operands[1], DFmode))" "@ add %1, r63, %0 # ld%M1.q %m1, %0 st%M0.q %m0, %N1" [(set_attr "type" "arith_media,*,load_media,store_media")]) (define_split [(set (match_operand:DF 0 "arith_reg_operand" "") (match_operand:DF 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed" [(set (match_dup 3) (match_dup 2))] " { int endian = WORDS_BIG_ENDIAN ? 1 : 0; long values[2]; REAL_VALUE_TYPE value; REAL_VALUE_FROM_CONST_DOUBLE (value, operands[1]); REAL_VALUE_TO_TARGET_DOUBLE (value, values); if (HOST_BITS_PER_WIDE_INT >= 64) operands[2] = immed_double_const ((unsigned long) values[endian] | ((HOST_WIDE_INT) values[1 - endian] << 32), 0, DImode); else if (HOST_BITS_PER_WIDE_INT == 32) operands[2] = immed_double_const (values[endian], values[1 - endian], DImode); else abort (); operands[3] = gen_rtx_REG (DImode, true_regnum (operands[0])); }") ;; ??? This should be a define expand. (define_insn "movdf_k" [(set (match_operand:DF 0 "general_movdst_operand" "=r,r,r,m") (match_operand:DF 1 "general_movsrc_operand" "r,FQ,m,r"))] "TARGET_SH1 && (! TARGET_SH4 || reload_completed /* ??? We provide some insn so that direct_{load,store}[DFmode] get set */ || (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == 3) || (GET_CODE (operands[1]) == REG && REGNO (operands[1]) == 3)) && (arith_reg_operand (operands[0], DFmode) || arith_reg_operand (operands[1], DFmode))" "* return output_movedouble (insn, operands, DFmode);" [(set_attr "length" "4") (set_attr "type" "move,pcload,load,store")]) ;; All alternatives of movdf_i4 are split for ! TARGET_FMOVD. ;; However, the d/F/c/z alternative cannot be split directly; it is converted ;; with special code in machine_dependent_reorg into a load of the R0_REG and ;; the d/m/c/X alternative, which is split later into single-precision ;; instructions. And when not optimizing, no splits are done before fixing ;; up pcloads, so we need usable length information for that. (define_insn "movdf_i4" [(set (match_operand:DF 0 "general_movdst_operand" "=d,r,d,d,m,r,r,m,!??r,!???d") (match_operand:DF 1 "general_movsrc_operand" "d,r,F,m,d,FQ,m,r,d,r")) (use (match_operand:PSI 2 "fpscr_operand" "c,c,c,c,c,c,c,c,c,c")) (clobber (match_scratch:SI 3 "=X,X,&z,X,X,X,X,X,X,X"))] "TARGET_SH4 && (arith_reg_operand (operands[0], DFmode) || arith_reg_operand (operands[1], DFmode))" "@ fmov %1,%0 # # fmov.d %1,%0 fmov.d %1,%0 # # # # #" [(set_attr_alternative "length" [(if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 4)) (const_int 4) (if_then_else (eq_attr "fmovd" "yes") (const_int 4) (const_int 6)) (if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 6)) (if_then_else (eq_attr "fmovd" "yes") (const_int 2) (const_int 6)) (const_int 4) (const_int 8) (const_int 8) ;; these need only 8 bytes for @(r0,rn) ;; We can't use 4-byte push/pop on SHcompact, so we have to ;; increment or decrement r15 explicitly. (if_then_else (ne (symbol_ref "TARGET_SHCOMPACT") (const_int 0)) (const_int 10) (const_int 8)) (if_then_else (ne (symbol_ref "TARGET_SHCOMPACT") (const_int 0)) (const_int 10) (const_int 8))]) (set_attr "type" "fmove,move,pcfload,fload,store,pcload,load,store,load,fload") (set_attr "late_fp_use" "*,*,*,*,yes,*,*,*,*,*") (set (attr "fp_mode") (if_then_else (eq_attr "fmovd" "yes") (const_string "double") (const_string "none")))]) ;; Moving DFmode between fp/general registers through memory ;; (the top of the stack) is faster than moving through fpul even for ;; little endian. Because the type of an instruction is important for its ;; scheduling, it is beneficial to split these operations, rather than ;; emitting them in one single chunk, even if this will expose a stack ;; use that will prevent scheduling of other stack accesses beyond this ;; instruction. (define_split [(set (match_operand:DF 0 "register_operand" "") (match_operand:DF 1 "register_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 "=X"))] "TARGET_SH4 && reload_completed && (true_regnum (operands[0]) < 16) != (true_regnum (operands[1]) < 16)" [(const_int 0)] " { rtx insn, tos; if (TARGET_SH5 && true_regnum (operands[1]) < 16) { emit_move_insn (stack_pointer_rtx, plus_constant (stack_pointer_rtx, -8)); tos = gen_rtx_MEM (DFmode, stack_pointer_rtx); } else tos = gen_rtx (MEM, DFmode, gen_rtx (PRE_DEC, Pmode, stack_pointer_rtx)); insn = emit_insn (gen_movdf_i4 (tos, operands[1], operands[2])); if (! (TARGET_SH5 && true_regnum (operands[1]) < 16)) REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); if (TARGET_SH5 && true_regnum (operands[0]) < 16) tos = gen_rtx_MEM (DFmode, stack_pointer_rtx); else tos = gen_rtx (MEM, DFmode, gen_rtx (POST_INC, Pmode, stack_pointer_rtx)); insn = emit_insn (gen_movdf_i4 (operands[0], tos, operands[2])); if (TARGET_SH5 && true_regnum (operands[0]) < 16) emit_move_insn (stack_pointer_rtx, plus_constant (stack_pointer_rtx, 8)); else REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, stack_pointer_rtx, NULL_RTX); DONE; }") ;; local-alloc sometimes allocates scratch registers even when not required, ;; so we must be prepared to handle these. ;; Remove the use and clobber from a movdf_i4 so that we can use movdf_k. (define_split [(set (match_operand:DF 0 "general_movdst_operand" "") (match_operand:DF 1 "general_movsrc_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH4 && reload_completed && true_regnum (operands[0]) < 16 && true_regnum (operands[1]) < 16" [(set (match_dup 0) (match_dup 1))] " { /* If this was a reg <-> mem operation with base + index reg addressing, we have to handle this in a special way. */ rtx mem = operands[0]; int store_p = 1; if (! memory_operand (mem, DFmode)) { mem = operands[1]; store_p = 0; } if (GET_CODE (mem) == SUBREG && SUBREG_BYTE (mem) == 0) mem = SUBREG_REG (mem); if (GET_CODE (mem) == MEM) { rtx addr = XEXP (mem, 0); if (GET_CODE (addr) == PLUS && GET_CODE (XEXP (addr, 0)) == REG && GET_CODE (XEXP (addr, 1)) == REG) { int offset; rtx reg0 = gen_rtx (REG, Pmode, 0); rtx regop = operands[store_p], word0 ,word1; if (GET_CODE (regop) == SUBREG) alter_subreg (®op); if (REGNO (XEXP (addr, 0)) == REGNO (XEXP (addr, 1))) offset = 2; else offset = 4; mem = copy_rtx (mem); PUT_MODE (mem, SImode); word0 = gen_rtx (SUBREG, SImode, regop, 0); alter_subreg (&word0); word1 = gen_rtx (SUBREG, SImode, regop, 4); alter_subreg (&word1); if (store_p || ! refers_to_regno_p (REGNO (word0), REGNO (word0) + 1, addr, 0)) { emit_insn (store_p ? gen_movsi_ie (mem, word0) : gen_movsi_ie (word0, mem)); emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (offset))); mem = copy_rtx (mem); emit_insn (store_p ? gen_movsi_ie (mem, word1) : gen_movsi_ie (word1, mem)); emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (-offset))); } else { emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (offset))); emit_insn (gen_movsi_ie (word1, mem)); emit_insn (gen_addsi3 (reg0, reg0, GEN_INT (-offset))); mem = copy_rtx (mem); emit_insn (gen_movsi_ie (word0, mem)); } DONE; } } }") ;; Split away the clobber of r0 after machine_dependent_reorg has fixed pcloads. (define_split [(set (match_operand:DF 0 "register_operand" "") (match_operand:DF 1 "memory_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (reg:SI R0_REG))] "TARGET_SH4 && reload_completed" [(parallel [(set (match_dup 0) (match_dup 1)) (use (match_dup 2)) (clobber (scratch:SI))])] "") (define_expand "reload_indf" [(parallel [(set (match_operand:DF 0 "register_operand" "=f") (match_operand:DF 1 "immediate_operand" "FQ")) (use (reg:PSI FPSCR_REG)) (clobber (match_operand:SI 2 "register_operand" "=&z"))])] "TARGET_SH1" "") (define_expand "reload_outdf" [(parallel [(set (match_operand:DF 0 "register_operand" "=r,f") (match_operand:DF 1 "register_operand" "af,r")) (clobber (match_operand:SI 2 "register_operand" "=&y,y"))])] "TARGET_SH1" "") ;; Simplify no-op moves. (define_split [(set (match_operand:SF 0 "register_operand" "") (match_operand:SF 1 "register_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH2E && reload_completed && true_regnum (operands[0]) == true_regnum (operands[1])" [(set (match_dup 0) (match_dup 0))] "") ;; fmovd substitute post-reload splits (define_split [(set (match_operand:DF 0 "register_operand" "") (match_operand:DF 1 "register_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH4 && ! TARGET_FMOVD && reload_completed && FP_OR_XD_REGISTER_P (true_regnum (operands[0])) && FP_OR_XD_REGISTER_P (true_regnum (operands[1]))" [(const_int 0)] " { int dst = true_regnum (operands[0]), src = true_regnum (operands[1]); emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, dst), gen_rtx (REG, SFmode, src), operands[2])); emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, dst + 1), gen_rtx (REG, SFmode, src + 1), operands[2])); DONE; }") (define_split [(set (match_operand:DF 0 "register_operand" "") (mem:DF (match_operand:SI 1 "register_operand" ""))) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH4 && ! TARGET_FMOVD && reload_completed && FP_OR_XD_REGISTER_P (true_regnum (operands[0])) && find_regno_note (insn, REG_DEAD, true_regnum (operands[1]))" [(const_int 0)] " { int regno = true_regnum (operands[0]); rtx insn; rtx mem2 = gen_rtx (MEM, SFmode, gen_rtx (POST_INC, Pmode, operands[1])); insn = emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, regno + !! TARGET_LITTLE_ENDIAN), mem2, operands[2])); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[1], NULL_RTX); insn = emit_insn (gen_movsf_ie (gen_rtx (REG, SFmode, regno + ! TARGET_LITTLE_ENDIAN), gen_rtx (MEM, SFmode, operands[1]), operands[2])); DONE; }") (define_split [(set (match_operand:DF 0 "register_operand" "") (match_operand:DF 1 "memory_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH4 && ! TARGET_FMOVD && reload_completed && FP_OR_XD_REGISTER_P (true_regnum (operands[0]))" [(const_int 0)] " { int regno = true_regnum (operands[0]); rtx addr, insn, adjust = NULL_RTX; rtx mem2 = copy_rtx (operands[1]); rtx reg0 = gen_rtx_REG (SFmode, regno + !! TARGET_LITTLE_ENDIAN); rtx reg1 = gen_rtx_REG (SFmode, regno + ! TARGET_LITTLE_ENDIAN); PUT_MODE (mem2, SFmode); operands[1] = copy_rtx (mem2); addr = XEXP (mem2, 0); if (GET_CODE (addr) != POST_INC) { /* If we have to modify the stack pointer, the value that we have read with post-increment might be modified by an interrupt, so write it back. */ if (REGNO (addr) == STACK_POINTER_REGNUM) adjust = gen_push_e (reg0); else adjust = gen_addsi3 (addr, addr, GEN_INT (-4)); XEXP (mem2, 0) = addr = gen_rtx_POST_INC (SImode, addr); } addr = XEXP (addr, 0); insn = emit_insn (gen_movsf_ie (reg0, mem2, operands[2])); REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_INC, addr, NULL_RTX); insn = emit_insn (gen_movsf_ie (reg1, operands[1], operands[2])); if (adjust) emit_insn (adjust); else REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_INC, addr, NULL_RTX); DONE; }") (define_split [(set (match_operand:DF 0 "memory_operand" "") (match_operand:DF 1 "register_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (match_scratch:SI 3 ""))] "TARGET_SH4 && ! TARGET_FMOVD && reload_completed && FP_OR_XD_REGISTER_P (true_regnum (operands[1]))" [(const_int 0)] " { int regno = true_regnum (operands[1]); rtx insn, addr, adjust = NULL_RTX; operands[0] = copy_rtx (operands[0]); PUT_MODE (operands[0], SFmode); insn = emit_insn (gen_movsf_ie (operands[0], gen_rtx (REG, SFmode, regno + ! TARGET_LITTLE_ENDIAN), operands[2])); operands[0] = copy_rtx (operands[0]); addr = XEXP (operands[0], 0); if (GET_CODE (addr) != PRE_DEC) { adjust = gen_addsi3 (addr, addr, GEN_INT (4)); emit_insn_before (adjust, insn); XEXP (operands[0], 0) = addr = gen_rtx (PRE_DEC, SImode, addr); } addr = XEXP (addr, 0); if (! adjust) REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, addr, NULL_RTX); insn = emit_insn (gen_movsf_ie (operands[0], gen_rtx (REG, SFmode, regno + !! TARGET_LITTLE_ENDIAN), operands[2])); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, addr, NULL_RTX); DONE; }") ;; If the output is a register and the input is memory or a register, we have ;; to be careful and see which word needs to be loaded first. (define_split [(set (match_operand:DF 0 "general_movdst_operand" "") (match_operand:DF 1 "general_movsrc_operand" ""))] "TARGET_SH1 && reload_completed" [(set (match_dup 2) (match_dup 3)) (set (match_dup 4) (match_dup 5))] " { int regno; if ((GET_CODE (operands[0]) == MEM && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC) || (GET_CODE (operands[1]) == MEM && GET_CODE (XEXP (operands[1], 0)) == POST_INC)) FAIL; if (GET_CODE (operands[0]) == REG) regno = REGNO (operands[0]); else if (GET_CODE (operands[0]) == SUBREG) regno = subreg_regno (operands[0]); else if (GET_CODE (operands[0]) == MEM) regno = -1; else abort (); if (regno == -1 || ! refers_to_regno_p (regno, regno + 1, operands[1], 0)) { operands[2] = operand_subword (operands[0], 0, 0, DFmode); operands[3] = operand_subword (operands[1], 0, 0, DFmode); operands[4] = operand_subword (operands[0], 1, 0, DFmode); operands[5] = operand_subword (operands[1], 1, 0, DFmode); } else { operands[2] = operand_subword (operands[0], 1, 0, DFmode); operands[3] = operand_subword (operands[1], 1, 0, DFmode); operands[4] = operand_subword (operands[0], 0, 0, DFmode); operands[5] = operand_subword (operands[1], 0, 0, DFmode); } if (operands[2] == 0 || operands[3] == 0 || operands[4] == 0 || operands[5] == 0) FAIL; }") ;; If a base address generated by LEGITIMIZE_ADDRESS for SImode is ;; used only once, let combine add in the index again. (define_split [(set (match_operand:SI 0 "register_operand" "") (match_operand:SI 1 "" "")) (clobber (match_operand 2 "register_operand" ""))] "TARGET_SH1 && ! reload_in_progress && ! reload_completed" [(use (reg:SI R0_REG))] " { rtx addr, reg, const_int; if (GET_CODE (operands[1]) != MEM) FAIL; addr = XEXP (operands[1], 0); if (GET_CODE (addr) != PLUS) FAIL; reg = XEXP (addr, 0); const_int = XEXP (addr, 1); if (! (BASE_REGISTER_RTX_P (reg) && INDEX_REGISTER_RTX_P (operands[2]) && GET_CODE (const_int) == CONST_INT)) FAIL; emit_move_insn (operands[2], const_int); emit_move_insn (operands[0], change_address (operands[1], VOIDmode, gen_rtx_PLUS (SImode, reg, operands[2]))); DONE; }") (define_split [(set (match_operand:SI 1 "" "") (match_operand:SI 0 "register_operand" "")) (clobber (match_operand 2 "register_operand" ""))] "TARGET_SH1 && ! reload_in_progress && ! reload_completed" [(use (reg:SI R0_REG))] " { rtx addr, reg, const_int; if (GET_CODE (operands[1]) != MEM) FAIL; addr = XEXP (operands[1], 0); if (GET_CODE (addr) != PLUS) FAIL; reg = XEXP (addr, 0); const_int = XEXP (addr, 1); if (! (BASE_REGISTER_RTX_P (reg) && INDEX_REGISTER_RTX_P (operands[2]) && GET_CODE (const_int) == CONST_INT)) FAIL; emit_move_insn (operands[2], const_int); emit_move_insn (change_address (operands[1], VOIDmode, gen_rtx_PLUS (SImode, reg, operands[2])), operands[0]); DONE; }") (define_expand "movdf" [(set (match_operand:DF 0 "general_movdst_operand" "") (match_operand:DF 1 "general_movsrc_operand" ""))] "" " { if (prepare_move_operands (operands, DFmode)) DONE; if (TARGET_SHMEDIA) { if (TARGET_SHMEDIA_FPU) emit_insn (gen_movdf_media (operands[0], operands[1])); else emit_insn (gen_movdf_media_nofpu (operands[0], operands[1])); DONE; } if (TARGET_SH4) { emit_df_insn (gen_movdf_i4 (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") ;;This is incompatible with the way gcc uses subregs. ;;(define_insn "movv2sf_i" ;; [(set (match_operand:V2SF 0 "nonimmediate_operand" "=f,f,m") ;; (match_operand:V2SF 1 "nonimmediate_operand" "f,m,f"))] ;; "TARGET_SHMEDIA_FPU ;; && (fp_arith_reg_operand (operands[0], V2SFmode) ;; || fp_arith_reg_operand (operands[1], V2SFmode))" ;; "@ ;; # ;; fld%M1.p %m1, %0 ;; fst%M0.p %m0, %1" ;; [(set_attr "type" "*,fload_media,fstore_media")]) (define_insn_and_split "movv2sf_i" [(set (match_operand:V2SF 0 "general_movdst_operand" "=f,rf,r,m,mf") (match_operand:V2SF 1 "general_operand" "fm,rfm?,F?,f,rfZ?"))] "TARGET_SHMEDIA_FPU" "#" "TARGET_SHMEDIA_FPU && reload_completed" [(set (match_dup 0) (match_dup 1))] " { operands[0] = simplify_gen_subreg (DFmode, operands[0], V2SFmode, 0); operands[1] = simplify_gen_subreg (DFmode, operands[1], V2SFmode, 0); }") (define_expand "movv2sf" [(set (match_operand:V2SF 0 "general_movdst_operand" "") (match_operand:V2SF 1 "nonimmediate_operand" ""))] "TARGET_SHMEDIA_FPU" " { if (prepare_move_operands (operands, V2SFmode)) DONE; }") (define_expand "addv2sf3" [(match_operand:V2SF 0 "fp_arith_reg_operand" "") (match_operand:V2SF 1 "fp_arith_reg_operand" "") (match_operand:V2SF 2 "fp_arith_reg_operand" "")] "TARGET_SHMEDIA_FPU" " { sh_expand_binop_v2sf (PLUS, operands[0], operands[1], operands[2]); DONE; }") (define_expand "subv2sf3" [(match_operand:V2SF 0 "fp_arith_reg_operand" "") (match_operand:V2SF 1 "fp_arith_reg_operand" "") (match_operand:V2SF 2 "fp_arith_reg_operand" "")] "TARGET_SHMEDIA_FPU" " { sh_expand_binop_v2sf (MINUS, operands[0], operands[1], operands[2]); DONE; }") (define_expand "mulv2sf3" [(match_operand:V2SF 0 "fp_arith_reg_operand" "") (match_operand:V2SF 1 "fp_arith_reg_operand" "") (match_operand:V2SF 2 "fp_arith_reg_operand" "")] "TARGET_SHMEDIA_FPU" " { sh_expand_binop_v2sf (MULT, operands[0], operands[1], operands[2]); DONE; }") (define_expand "divv2sf3" [(match_operand:V2SF 0 "fp_arith_reg_operand" "") (match_operand:V2SF 1 "fp_arith_reg_operand" "") (match_operand:V2SF 2 "fp_arith_reg_operand" "")] "TARGET_SHMEDIA_FPU" " { sh_expand_binop_v2sf (DIV, operands[0], operands[1], operands[2]); DONE; }") (define_insn_and_split "*movv4sf_i" [(set (match_operand:V4SF 0 "nonimmediate_operand" "=f,f,m") (match_operand:V4SF 1 "general_operand" "fZ,m,fZ"))] "TARGET_SHMEDIA_FPU" "#" "&& reload_completed" [(const_int 0)] " { int i; for (i = 0; i < 4/2; i++) { rtx x, y; if (GET_CODE (operands[0]) == MEM) x = gen_rtx_MEM (V2SFmode, plus_constant (XEXP (operands[0], 0), i * GET_MODE_SIZE (V2SFmode))); else x = simplify_gen_subreg (V2SFmode, operands[0], V4SFmode, i * 8); if (GET_CODE (operands[1]) == MEM) y = gen_rtx_MEM (V2SFmode, plus_constant (XEXP (operands[1], 0), i * GET_MODE_SIZE (V2SFmode))); else y = simplify_gen_subreg (V2SFmode, operands[1], V4SFmode, i * 8); emit_insn (gen_movv2sf_i (x, y)); } DONE; }" [(set_attr "length" "8")]) (define_expand "movv4sf" [(set (match_operand:V4SF 0 "nonimmediate_operand" "") (match_operand:V4SF 1 "general_operand" ""))] "TARGET_SHMEDIA_FPU" " { if (prepare_move_operands (operands, V4SFmode)) DONE; }") (define_insn_and_split "*movv16sf_i" [(set (match_operand:V16SF 0 "nonimmediate_operand" "=f,f,m") (match_operand:V16SF 1 "nonimmediate_operand" "f,m,f"))] "TARGET_SHMEDIA_FPU" "#" "&& reload_completed" [(const_int 0)] " { int i; for (i = 0; i < 16/2; i++) { rtx x,y; if (GET_CODE (operands[0]) == MEM) x = gen_rtx_MEM (V2SFmode, plus_constant (XEXP (operands[0], 0), i * GET_MODE_SIZE (V2SFmode))); else { x = gen_rtx_SUBREG (V2SFmode, operands[0], i * 8); alter_subreg (&x); } if (GET_CODE (operands[1]) == MEM) y = gen_rtx_MEM (V2SFmode, plus_constant (XEXP (operands[1], 0), i * GET_MODE_SIZE (V2SFmode))); else { y = gen_rtx_SUBREG (V2SFmode, operands[1], i * 8); alter_subreg (&y); } emit_insn (gen_movv2sf_i (x, y)); } DONE; }" [(set_attr "length" "32")]) (define_expand "movv16sf" [(set (match_operand:V16SF 0 "nonimmediate_operand" "=f,f,m") (match_operand:V16SF 1 "nonimmediate_operand" "f,m,f"))] "TARGET_SHMEDIA_FPU" " { if (prepare_move_operands (operands, V16SFmode)) DONE; }") (define_insn "movsf_media" [(set (match_operand:SF 0 "general_movdst_operand" "=f,f,r,r,r,f,m,r,m") (match_operand:SF 1 "general_movsrc_operand" "f,rZ,f,r,F,m,f,m,rZ"))] "TARGET_SHMEDIA_FPU && (register_operand (operands[0], SFmode) || sh_register_operand (operands[1], SFmode))" "@ fmov.s %1, %0 fmov.ls %N1, %0 fmov.sl %1, %0 add.l %1, r63, %0 # fld%M1.s %m1, %0 fst%M0.s %m0, %1 ld%M1.l %m1, %0 st%M0.l %m0, %N1" [(set_attr "type" "fmove_media,fload_media,fpconv_media,arith_media,*,fload_media,fstore_media,load_media,store_media")]) (define_insn "movsf_media_nofpu" [(set (match_operand:SF 0 "general_movdst_operand" "=r,r,r,m") (match_operand:SF 1 "general_movsrc_operand" "r,F,m,rZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], SFmode) || sh_register_operand (operands[1], SFmode))" "@ add.l %1, r63, %0 # ld%M1.l %m1, %0 st%M0.l %m0, %N1" [(set_attr "type" "arith_media,*,load_media,store_media")]) (define_split [(set (match_operand:SF 0 "arith_reg_operand" "") (match_operand:SF 1 "immediate_operand" ""))] "TARGET_SHMEDIA && reload_completed && ! FP_REGISTER_P (true_regnum (operands[0]))" [(set (match_dup 3) (match_dup 2))] " { long values; REAL_VALUE_TYPE value; REAL_VALUE_FROM_CONST_DOUBLE (value, operands[1]); REAL_VALUE_TO_TARGET_SINGLE (value, values); operands[2] = GEN_INT (values); operands[3] = gen_rtx_REG (DImode, true_regnum (operands[0])); }") (define_insn "movsf_i" [(set (match_operand:SF 0 "general_movdst_operand" "=r,r,r,r,m,l,r") (match_operand:SF 1 "general_movsrc_operand" "r,G,FQ,mr,r,r,l"))] "TARGET_SH1 && (! TARGET_SH2E /* ??? We provide some insn so that direct_{load,store}[SFmode] get set */ || (GET_CODE (operands[0]) == REG && REGNO (operands[0]) == 3) || (GET_CODE (operands[1]) == REG && REGNO (operands[1]) == 3)) && (arith_reg_operand (operands[0], SFmode) || arith_reg_operand (operands[1], SFmode))" "@ mov %1,%0 mov #0,%0 mov.l %1,%0 mov.l %1,%0 mov.l %1,%0 lds %1,%0 sts %1,%0" [(set_attr "type" "move,move,pcload,load,store,move,move")]) ;; We may not split the ry/yr/XX alternatives to movsi_ie, since ;; update_flow_info would not know where to put REG_EQUAL notes ;; when the destination changes mode. (define_insn "movsf_ie" [(set (match_operand:SF 0 "general_movdst_operand" "=f,r,f,f,fy,f,m,r,r,m,f,y,y,rf,r,y,<,y,y") (match_operand:SF 1 "general_movsrc_operand" "f,r,G,H,FQ,mf,f,FQ,mr,r,y,f,>,fr,y,r,y,>,y")) (use (match_operand:PSI 2 "fpscr_operand" "c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c,c")) (clobber (match_scratch:SI 3 "=X,X,Bsc,Bsc,&z,X,X,X,X,X,X,X,X,y,X,X,X,X,X"))] "TARGET_SH2E && (arith_reg_operand (operands[0], SFmode) || arith_reg_operand (operands[1], SFmode) || arith_reg_operand (operands[3], SImode) || (fpul_operand (operands[0], SFmode) && memory_operand (operands[1], SFmode) && GET_CODE (XEXP (operands[1], 0)) == POST_INC) || (fpul_operand (operands[1], SFmode) && memory_operand (operands[0], SFmode) && GET_CODE (XEXP (operands[0], 0)) == PRE_DEC))" "@ fmov %1,%0 mov %1,%0 fldi0 %0 fldi1 %0 # fmov.s %1,%0 fmov.s %1,%0 mov.l %1,%0 mov.l %1,%0 mov.l %1,%0 fsts fpul,%0 flds %1,fpul lds.l %1,%0 # sts %1,%0 lds %1,%0 sts.l %1,%0 lds.l %1,%0 ! move optimized away" [(set_attr "type" "fmove,move,fmove,fmove,pcfload,fload,store,pcload,load,store,fmove,fmove,load,*,fpul_gp,gp_fpul,store,load,nil") (set_attr "late_fp_use" "*,*,*,*,*,*,yes,*,*,*,*,*,*,*,yes,*,yes,*,*") (set_attr "length" "*,*,*,*,4,*,*,*,*,*,2,2,2,4,2,2,2,2,0") (set (attr "fp_mode") (if_then_else (eq_attr "fmovd" "yes") (const_string "single") (const_string "none")))]) (define_split [(set (match_operand:SF 0 "register_operand" "") (match_operand:SF 1 "register_operand" "")) (use (match_operand:PSI 2 "fpscr_operand" "")) (clobber (reg:SI FPUL_REG))] "TARGET_SH1" [(parallel [(set (reg:SF FPUL_REG) (match_dup 1)) (use (match_dup 2)) (clobber (scratch:SI))]) (parallel [(set (match_dup 0) (reg:SF FPUL_REG)) (use (match_dup 2)) (clobber (scratch:SI))])] "") (define_expand "movsf" [(set (match_operand:SF 0 "general_movdst_operand" "") (match_operand:SF 1 "general_movsrc_operand" ""))] "" " { if (prepare_move_operands (operands, SFmode)) DONE; if (TARGET_SHMEDIA) { if (TARGET_SHMEDIA_FPU) emit_insn (gen_movsf_media (operands[0], operands[1])); else emit_insn (gen_movsf_media_nofpu (operands[0], operands[1])); DONE; } if (TARGET_SH2E) { emit_sf_insn (gen_movsf_ie (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "mov_nop" [(set (match_operand 0 "any_register_operand" "") (match_dup 0))] "TARGET_SH2E" "" [(set_attr "length" "0") (set_attr "type" "nil")]) (define_expand "reload_insf" [(parallel [(set (match_operand:SF 0 "register_operand" "=a") (match_operand:SF 1 "immediate_operand" "FQ")) (use (reg:PSI FPSCR_REG)) (clobber (match_operand:SI 2 "register_operand" "=&z"))])] "TARGET_SH1" "") (define_expand "reload_insi" [(parallel [(set (match_operand:SF 0 "register_operand" "=y") (match_operand:SF 1 "immediate_operand" "FQ")) (clobber (match_operand:SI 2 "register_operand" "=&z"))])] "TARGET_SH1" "") (define_insn "*movsi_y" [(set (match_operand:SI 0 "register_operand" "=y,y") (match_operand:SI 1 "immediate_operand" "Qi,I08")) (clobber (match_scratch:SI 2 "=&z,r"))] "TARGET_SH2E && (reload_in_progress || reload_completed)" "#" [(set_attr "length" "4") (set_attr "type" "pcload,move")]) (define_split [(set (match_operand:SI 0 "register_operand" "") (match_operand:SI 1 "immediate_operand" "")) (clobber (match_operand:SI 2 "register_operand" ""))] "TARGET_SH1" [(set (match_dup 2) (match_dup 1)) (set (match_dup 0) (match_dup 2))] "") (define_split [(set (match_operand:SI 0 "register_operand" "") (match_operand:SI 1 "memory_operand" "")) (clobber (reg:SI R0_REG))] "TARGET_SH1" [(set (match_dup 0) (match_dup 1))] "") ;; ------------------------------------------------------------------------ ;; Define the real conditional branch instructions. ;; ------------------------------------------------------------------------ (define_insn "branch_true" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "TARGET_SH1" "* return output_branch (1, insn, operands);" [(set_attr "type" "cbranch")]) (define_insn "branch_false" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "TARGET_SH1" "* return output_branch (0, insn, operands);" [(set_attr "type" "cbranch")]) ;; Patterns to prevent reorg from re-combining a condbranch with a branch ;; which destination is too far away. ;; The const_int_operand is distinct for each branch target; it avoids ;; unwanted matches with redundant_insn. (define_insn "block_branch_redirect" [(set (pc) (unspec [(match_operand 0 "const_int_operand" "")] UNSPEC_BBR))] "TARGET_SH1" "" [(set_attr "length" "0")]) ;; This one has the additional purpose to record a possible scratch register ;; for the following branch. ;; ??? Unfortunately, just setting the scratch register is not good enough, ;; because the insn then might be deemed dead and deleted. And we can't ;; make the use in the jump insn explicit because that would disable ;; delay slot scheduling from the target. (define_insn "indirect_jump_scratch" [(set (match_operand:SI 0 "register_operand" "=r") (unspec:SI [(match_operand 1 "const_int_operand" "")] UNSPEC_BBR)) (set (pc) (unspec [(const_int 0)] UNSPEC_BBR))] "TARGET_SH1" "" [(set_attr "length" "0")]) ;; This one is used to preemt an insn from beyond the bra / braf / jmp ;; being pulled into the delay slot of a condbranch that has been made to ;; jump around the unconditional jump because it was out of range. (define_insn "stuff_delay_slot" [(set (pc) (unspec [(match_operand 0 "const_int_operand" "") (pc)] UNSPEC_BBR)) (set (reg:SI T_REG) (match_operand 1 "const_int_operand" ""))] "TARGET_SH1" "" [(set_attr "length" "0") (set_attr "cond_delay_slot" "yes")]) ;; Conditional branch insns (define_expand "beq_media" [(set (pc) (if_then_else (eq (match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "arith_operand" "r,I06")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_insn "*beq_media_i" [(set (pc) (if_then_else (match_operator 3 "equality_comparison_operator" [(match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "arith_operand" "r,I06")]) (match_operand:DI 0 "target_operand" "b,b") (pc)))] "TARGET_SHMEDIA" "@ b%o3%' %1, %2, %0 b%o3i%' %1, %2, %0" [(set_attr "type" "cbranch_media")]) (define_expand "bne_media" [(set (pc) (if_then_else (ne (match_operand:DI 1 "arith_reg_operand" "r,r") (match_operand:DI 2 "arith_operand" "r,I06")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_expand "bgt_media" [(set (pc) (if_then_else (gt (match_operand:DI 1 "arith_reg_or_0_operand" "r") (match_operand:DI 2 "arith_reg_or_0_operand" "r")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_expand "bge_media" [(set (pc) (if_then_else (ge (match_operand:DI 1 "arith_reg_or_0_operand" "r") (match_operand:DI 2 "arith_reg_or_0_operand" "r")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_expand "bgtu_media" [(set (pc) (if_then_else (gtu (match_operand:DI 1 "arith_reg_or_0_operand" "r") (match_operand:DI 2 "arith_reg_or_0_operand" "r")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_expand "bgeu_media" [(set (pc) (if_then_else (geu (match_operand:DI 1 "arith_reg_or_0_operand" "r") (match_operand:DI 2 "arith_reg_or_0_operand" "r")) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" "") (define_insn "*bgt_media_i" [(set (pc) (if_then_else (match_operator 3 "greater_comparison_operator" [(match_operand:DI 1 "arith_reg_or_0_operand" "rN") (match_operand:DI 2 "arith_reg_or_0_operand" "rN")]) (match_operand:DI 0 "target_operand" "b") (pc)))] "TARGET_SHMEDIA" "b%o3%' %N1, %N2, %0" [(set_attr "type" "cbranch_media")]) ;; These are only needed to make invert_jump() happy. (define_insn "*blt_media_i" [(set (pc) (if_then_else (match_operator 3 "less_comparison_operator" [(match_operand:DI 1 "arith_reg_or_0_operand" "rN") (match_operand:DI 2 "arith_reg_or_0_operand" "rN")]) (match_operand:DI 0 "target_operand" "b") (pc)))] "TARGET_SHMEDIA" "b%o3%' %N2, %N1, %0" [(set_attr "type" "cbranch_media")]) (define_expand "beq" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_seq (tmp)); emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); DONE; } sh_compare_op0 = force_reg (DImode, sh_compare_op0); emit_jump_insn (gen_beq_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } from_compare (operands, EQ); }") (define_expand "bne" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_seq (tmp)); emit_jump_insn (gen_beq_media (operands[0], tmp, const0_rtx)); DONE; } sh_compare_op0 = force_reg (DImode, sh_compare_op0); emit_jump_insn (gen_bne_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } from_compare (operands, EQ); }") (define_expand "bgt" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_sgt (tmp)); emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); DONE; } if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgt_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } from_compare (operands, GT); }") (define_expand "blt" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_slt (tmp)); emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); DONE; } if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgt_media (operands[0], sh_compare_op1, sh_compare_op0)); DONE; } if (GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) { rtx tmp = sh_compare_op0; sh_compare_op0 = sh_compare_op1; sh_compare_op1 = tmp; emit_insn (gen_bgt (operands[0])); DONE; } from_compare (operands, GE); }") (define_expand "ble" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_sle (tmp)); emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); DONE; } if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bge_media (operands[0], sh_compare_op1, sh_compare_op0)); DONE; } if (TARGET_SH2E && TARGET_IEEE && GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) { rtx tmp = sh_compare_op0; sh_compare_op0 = sh_compare_op1; sh_compare_op1 = tmp; emit_insn (gen_bge (operands[0])); DONE; } from_compare (operands, GT); }") (define_expand "bge" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (sh_compare_op0) != DImode) { rtx tmp = gen_reg_rtx (DImode); emit_insn (gen_sge (tmp)); emit_jump_insn (gen_bne_media (operands[0], tmp, const0_rtx)); DONE; } if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bge_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } if (TARGET_SH2E && ! TARGET_IEEE && GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) { rtx tmp = sh_compare_op0; sh_compare_op0 = sh_compare_op1; sh_compare_op1 = tmp; emit_insn (gen_ble (operands[0])); DONE; } from_compare (operands, GE); }") (define_expand "bgtu" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgtu_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } from_compare (operands, GTU); }") (define_expand "bltu" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgtu_media (operands[0], sh_compare_op1, sh_compare_op0)); DONE; } from_compare (operands, GEU); }") (define_expand "bgeu" [(set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgeu_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } from_compare (operands, GEU); }") (define_expand "bleu" [(set (pc) (if_then_else (eq (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 0 "" "")) (pc)))] "" " { if (TARGET_SHMEDIA) { if (sh_compare_op0 != const0_rtx) sh_compare_op0 = force_reg (DImode, sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (DImode, sh_compare_op1); emit_jump_insn (gen_bgeu_media (operands[0], sh_compare_op1, sh_compare_op0)); DONE; } from_compare (operands, GTU); }") (define_expand "bunordered" [(set (match_dup 1) (unordered:DI (match_dup 2) (match_dup 3))) (set (pc) (if_then_else (ne (match_dup 1) (const_int 0)) (label_ref:DI (match_operand 0 "" "")) (pc)))] "TARGET_SHMEDIA" " { operands[1] = gen_reg_rtx (DImode); operands[2] = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); operands[3] = force_reg (GET_MODE (sh_compare_op1), sh_compare_op1); }") ;; ------------------------------------------------------------------------ ;; Jump and linkage insns ;; ------------------------------------------------------------------------ (define_insn "jump_compact" [(set (pc) (label_ref (match_operand 0 "" "")))] "TARGET_SH1" "* { /* The length is 16 if the delay slot is unfilled. */ if (get_attr_length(insn) > 4) return output_far_jump(insn, operands[0]); else return \"bra %l0%#\"; }" [(set_attr "type" "jump") (set_attr "needs_delay_slot" "yes")]) ;; ??? It would be much saner to explicitly use the scratch register ;; in the jump insn, and have indirect_jump_scratch only set it, ;; but fill_simple_delay_slots would refuse to do delay slot filling ;; from the target then, as it uses simplejump_p. ;;(define_insn "jump_compact_far" ;; [(set (pc) ;; (label_ref (match_operand 0 "" ""))) ;; (use (match_operand 1 "register_operand" "r")] ;; "TARGET_SH1" ;; "* return output_far_jump(insn, operands[0], operands[1]);" ;; [(set_attr "type" "jump") ;; (set_attr "needs_delay_slot" "yes")]) (define_insn "jump_media" [(set (pc) (match_operand:DI 0 "target_operand" "b"))] "TARGET_SHMEDIA" "blink %0, r63" [(set_attr "type" "jump_media")]) (define_expand "jump" [(set (pc) (label_ref (match_operand 0 "" "")))] "" " { if (TARGET_SH1) emit_jump_insn (gen_jump_compact (operands[0])); else if (TARGET_SHMEDIA) { if (reload_in_progress || reload_completed) FAIL; emit_jump_insn (gen_jump_media (gen_rtx_LABEL_REF (DImode, operands[0]))); } DONE; }") (define_insn "force_mode_for_call" [(use (reg:PSI FPSCR_REG))] "TARGET_SHCOMPACT" "" [(set_attr "length" "0") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double")))]) (define_insn "calli" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SH1" "jsr @%0%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) ;; This is a pc-rel call, using bsrf, for use with PIC. (define_insn "calli_pcrel" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (use (match_operand 2 "" "")) (clobber (reg:SI PR_REG))] "TARGET_SH2" "bsrf %0\\n%O2:%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) (define_insn_and_split "call_pcrel" [(call (mem:SI (match_operand:SI 0 "symbol_ref_operand" "")) (match_operand 1 "" "")) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (clobber (reg:SI PR_REG)) (clobber (match_scratch:SI 2 "=r"))] "TARGET_SH2" "#" "reload_completed" [(const_int 0)] " { rtx lab = PATTERN (gen_call_site ()); if (SYMBOL_REF_LOCAL_P (operands[0])) emit_insn (gen_sym_label2reg (operands[2], operands[0], lab)); else emit_insn (gen_symPLT_label2reg (operands[2], operands[0], lab)); emit_call_insn (gen_calli_pcrel (operands[2], operands[1], lab)); DONE; }" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) (define_insn "call_compact" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (match_operand 2 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && ! (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%0%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_compact_rettramp" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (match_operand 2 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI R10_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%0%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_media" [(call (mem:DI (match_operand:DI 0 "target_reg_operand" "b")) (match_operand 1 "" "")) (clobber (reg:DI PR_MEDIA_REG))] "TARGET_SHMEDIA" "blink %0, r18" [(set_attr "type" "jump_media")]) (define_insn "call_valuei" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SH1" "jsr @%1%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) (define_insn "call_valuei_pcrel" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (use (match_operand 3 "" "")) (clobber (reg:SI PR_REG))] "TARGET_SH2" "bsrf %1\\n%O3:%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) (define_insn_and_split "call_value_pcrel" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "symbol_ref_operand" "")) (match_operand 2 "" ""))) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (clobber (reg:SI PR_REG)) (clobber (match_scratch:SI 3 "=r"))] "TARGET_SH2" "#" "reload_completed" [(const_int 0)] " { rtx lab = PATTERN (gen_call_site ()); if (SYMBOL_REF_LOCAL_P (operands[1])) emit_insn (gen_sym_label2reg (operands[3], operands[1], lab)); else emit_insn (gen_symPLT_label2reg (operands[3], operands[1], lab)); emit_call_insn (gen_call_valuei_pcrel (operands[0], operands[3], operands[2], lab)); DONE; }" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes") (set_attr "fp_set" "unknown")]) (define_insn "call_value_compact" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (match_operand 3 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && ! (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%1%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_value_compact_rettramp" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (match_operand 3 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI R10_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%1%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_value_media" [(set (match_operand 0 "" "=rf") (call (mem:DI (match_operand:DI 1 "target_reg_operand" "b")) (match_operand 2 "" ""))) (clobber (reg:DI PR_MEDIA_REG))] "TARGET_SHMEDIA" "blink %1, r18" [(set_attr "type" "jump_media")]) (define_expand "call" [(parallel [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) (match_operand 1 "" "")) (match_operand 2 "" "") (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))])] "" " { if (TARGET_SHMEDIA) { operands[0] = XEXP (operands[0], 0); if (flag_pic && GET_CODE (operands[0]) == SYMBOL_REF) { if (! SYMBOL_REF_LOCAL_P (operands[0])) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[0])); operands[0] = reg; } else { operands[0] = gen_sym2PIC (operands[0]); PUT_MODE (operands[0], Pmode); } } if (GET_MODE (operands[0]) == SImode) { if (GET_CODE (operands[0]) == REG) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); else if (GET_CODE (operands[0]) == SUBREG) { operands[0] = SUBREG_REG (operands[0]); if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); } else { operands[0] = shallow_copy_rtx (operands[0]); PUT_MODE (operands[0], DImode); } } if (! target_reg_operand (operands[0], DImode)) operands[0] = copy_to_mode_reg (DImode, operands[0]); emit_call_insn (gen_call_media (operands[0], operands[1])); DONE; } else if (TARGET_SHCOMPACT && operands[2] && INTVAL (operands[2])) { rtx cookie_rtx = operands[2]; long cookie = INTVAL (cookie_rtx); rtx func = XEXP (operands[0], 0); rtx r0, r1; if (flag_pic) { if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, func)); func = reg; } else func = legitimize_pic_address (func, Pmode, 0); } r0 = gen_rtx_REG (SImode, R0_REG); r1 = gen_rtx_REG (SImode, R1_REG); /* Since such a call function may use all call-clobbered registers, we force a mode switch earlier, so that we don't run out of registers when adjusting fpscr for the call. */ emit_insn (gen_force_mode_for_call ()); operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); if (flag_pic) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[0])); operands[0] = reg; } operands[0] = force_reg (SImode, operands[0]); emit_move_insn (r0, func); emit_move_insn (r1, cookie_rtx); if (cookie & CALL_COOKIE_RET_TRAMP (1)) emit_call_insn (gen_call_compact_rettramp (operands[0], operands[1], operands[2])); else emit_call_insn (gen_call_compact (operands[0], operands[1], operands[2])); DONE; } else if (TARGET_SHCOMPACT && flag_pic && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, XEXP (operands[0], 0))); XEXP (operands[0], 0) = reg; } if (flag_pic && TARGET_SH2 && GET_CODE (operands[0]) == MEM && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF) { emit_call_insn (gen_call_pcrel (XEXP (operands[0], 0), operands[1])); DONE; } else { operands[0] = force_reg (SImode, XEXP (operands[0], 0)); operands[1] = operands[2]; } emit_call_insn (gen_calli (operands[0], operands[1])); DONE; }") (define_insn "call_pop_compact" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (match_operand 2 "immediate_operand" "n") (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 3 "immediate_operand" "n"))) (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && ! (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%0%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_pop_compact_rettramp" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "r")) (match_operand 1 "" "")) (match_operand 2 "immediate_operand" "n") (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 3 "immediate_operand" "n"))) (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI R10_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && (INTVAL (operands[2]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%0%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_expand "call_pop" [(parallel [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) (match_operand 1 "" "")) (match_operand 2 "" "") (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 3 "" "")))])] "TARGET_SHCOMPACT" " { if (operands[2] && INTVAL (operands[2])) { rtx cookie_rtx = operands[2]; long cookie = INTVAL (cookie_rtx); rtx func = XEXP (operands[0], 0); rtx r0, r1; if (flag_pic) { if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, func)); func = reg; } else func = legitimize_pic_address (func, Pmode, 0); } r0 = gen_rtx_REG (SImode, R0_REG); r1 = gen_rtx_REG (SImode, R1_REG); /* Since such a call function may use all call-clobbered registers, we force a mode switch earlier, so that we don't run out of registers when adjusting fpscr for the call. */ emit_insn (gen_force_mode_for_call ()); operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); if (flag_pic) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[0])); operands[0] = reg; } operands[0] = force_reg (SImode, operands[0]); emit_move_insn (r0, func); emit_move_insn (r1, cookie_rtx); if (cookie & CALL_COOKIE_RET_TRAMP (1)) emit_call_insn (gen_call_pop_compact_rettramp (operands[0], operands[1], operands[2], operands[3])); else emit_call_insn (gen_call_pop_compact (operands[0], operands[1], operands[2], operands[3])); DONE; } abort (); }") (define_expand "call_value" [(parallel [(set (match_operand 0 "arith_reg_operand" "") (call (mem:SI (match_operand 1 "arith_reg_operand" "")) (match_operand 2 "" ""))) (match_operand 3 "" "") (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))])] "" " { if (TARGET_SHMEDIA) { operands[1] = XEXP (operands[1], 0); if (flag_pic && GET_CODE (operands[1]) == SYMBOL_REF) { if (! SYMBOL_REF_LOCAL_P (operands[1])) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[1])); operands[1] = reg; } else { operands[1] = gen_sym2PIC (operands[1]); PUT_MODE (operands[1], Pmode); } } if (GET_MODE (operands[1]) == SImode) { if (GET_CODE (operands[1]) == REG) operands[1] = gen_rtx_SUBREG (DImode, operands[1], 0); else if (GET_CODE (operands[1]) == SUBREG) { operands[1] = SUBREG_REG (operands[1]); if (GET_MODE (operands[1]) != DImode) operands[1] = gen_rtx_SUBREG (DImode, operands[1], 0); } else { operands[1] = shallow_copy_rtx (operands[1]); PUT_MODE (operands[1], DImode); } } if (! target_reg_operand (operands[1], DImode)) operands[1] = copy_to_mode_reg (DImode, operands[1]); emit_call_insn (gen_call_value_media (operands[0], operands[1], operands[2])); DONE; } else if (TARGET_SHCOMPACT && operands[3] && INTVAL (operands[3])) { rtx cookie_rtx = operands[3]; long cookie = INTVAL (cookie_rtx); rtx func = XEXP (operands[1], 0); rtx r0, r1; if (flag_pic) { if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, func)); func = reg; } else func = legitimize_pic_address (func, Pmode, 0); } r0 = gen_rtx_REG (SImode, R0_REG); r1 = gen_rtx_REG (SImode, R1_REG); /* Since such a call function may use all call-clobbered registers, we force a mode switch earlier, so that we don't run out of registers when adjusting fpscr for the call. */ emit_insn (gen_force_mode_for_call ()); operands[1] = function_symbol (\"__GCC_shcompact_call_trampoline\"); if (flag_pic) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[1])); operands[1] = reg; } operands[1] = force_reg (SImode, operands[1]); emit_move_insn (r0, func); emit_move_insn (r1, cookie_rtx); if (cookie & CALL_COOKIE_RET_TRAMP (1)) emit_call_insn (gen_call_value_compact_rettramp (operands[0], operands[1], operands[2], operands[3])); else emit_call_insn (gen_call_value_compact (operands[0], operands[1], operands[2], operands[3])); DONE; } else if (TARGET_SHCOMPACT && flag_pic && GET_CODE (XEXP (operands[1], 0)) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (XEXP (operands[1], 0))) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, XEXP (operands[1], 0))); XEXP (operands[1], 0) = reg; } if (flag_pic && TARGET_SH2 && GET_CODE (operands[1]) == MEM && GET_CODE (XEXP (operands[1], 0)) == SYMBOL_REF) { emit_call_insn (gen_call_value_pcrel (operands[0], XEXP (operands[1], 0), operands[2])); DONE; } else operands[1] = force_reg (SImode, XEXP (operands[1], 0)); emit_call_insn (gen_call_valuei (operands[0], operands[1], operands[2])); DONE; }") (define_insn "sibcalli" [(call (mem:SI (match_operand:SI 0 "register_operand" "k")) (match_operand 1 "" "")) (use (reg:PSI FPSCR_REG)) (return)] "TARGET_SH1" "jmp @%0%#" [(set_attr "needs_delay_slot" "yes") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "type" "jump_ind")]) (define_insn "sibcalli_pcrel" [(call (mem:SI (match_operand:SI 0 "arith_reg_operand" "k")) (match_operand 1 "" "")) (use (match_operand 2 "" "")) (use (reg:PSI FPSCR_REG)) (return)] "TARGET_SH2" "braf %0\\n%O2:%#" [(set_attr "needs_delay_slot" "yes") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "type" "jump_ind")]) (define_insn_and_split "sibcall_pcrel" [(call (mem:SI (match_operand:SI 0 "symbol_ref_operand" "")) (match_operand 1 "" "")) (use (reg:PSI FPSCR_REG)) (clobber (match_scratch:SI 2 "=k")) (return)] "TARGET_SH2" "#" "reload_completed" [(const_int 0)] " { rtx lab = PATTERN (gen_call_site ()); rtx call_insn; emit_insn (gen_sym_label2reg (operands[2], operands[0], lab)); call_insn = emit_call_insn (gen_sibcalli_pcrel (operands[2], operands[1], lab)); SIBLING_CALL_P (call_insn) = 1; DONE; }" [(set_attr "needs_delay_slot" "yes") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "type" "jump_ind")]) (define_insn "sibcall_compact" [(call (mem:SI (match_operand:SI 0 "register_operand" "k,k")) (match_operand 1 "" "")) (return) (use (match_operand:SI 2 "register_operand" "z,x")) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) ;; We want to make sure the `x' above will only match MACH_REG ;; because sibcall_epilogue may clobber MACL_REG. (clobber (reg:SI MACL_REG))] "TARGET_SHCOMPACT" "@ jmp @%0%# jmp @%0\\n sts %2, r0" [(set_attr "needs_delay_slot" "yes,no") (set_attr "length" "2,4") (set (attr "fp_mode") (const_string "single")) (set_attr "type" "jump_ind")]) (define_insn "sibcall_media" [(call (mem:DI (match_operand:DI 0 "target_reg_operand" "k")) (match_operand 1 "" "")) (use (reg:SI PR_MEDIA_REG)) (return)] "TARGET_SHMEDIA" "blink %0, r63" [(set_attr "type" "jump_media")]) (define_expand "sibcall" [(parallel [(call (mem:SI (match_operand 0 "arith_reg_operand" "")) (match_operand 1 "" "")) (match_operand 2 "" "") (use (reg:PSI FPSCR_REG)) (return)])] "" " { if (TARGET_SHMEDIA) { operands[0] = XEXP (operands[0], 0); if (flag_pic && GET_CODE (operands[0]) == SYMBOL_REF) { if (! SYMBOL_REF_LOCAL_P (operands[0])) { rtx reg = gen_reg_rtx (Pmode); /* We must not use GOTPLT for sibcalls, because PIC_REG must be restored before the PLT code gets to run. */ emit_insn (gen_symGOT2reg (reg, operands[0])); operands[0] = reg; } else { operands[0] = gen_sym2PIC (operands[0]); PUT_MODE (operands[0], Pmode); } } if (GET_MODE (operands[0]) == SImode) { if (GET_CODE (operands[0]) == REG) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); else if (GET_CODE (operands[0]) == SUBREG) { operands[0] = SUBREG_REG (operands[0]); if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); } else { operands[0] = shallow_copy_rtx (operands[0]); PUT_MODE (operands[0], DImode); } } if (! target_reg_operand (operands[0], DImode)) operands[0] = copy_to_mode_reg (DImode, operands[0]); emit_call_insn (gen_sibcall_media (operands[0], operands[1])); DONE; } else if (TARGET_SHCOMPACT && operands[2] && (INTVAL (operands[2]) & ~ CALL_COOKIE_RET_TRAMP (1))) { rtx cookie_rtx = operands[2]; long cookie = INTVAL (cookie_rtx); rtx func = XEXP (operands[0], 0); rtx mach, r1; if (flag_pic) { if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOT2reg (reg, func)); func = reg; } else func = legitimize_pic_address (func, Pmode, 0); } /* FIXME: if we could tell whether all argument registers are already taken, we could decide whether to force the use of MACH_REG or to stick to R0_REG. Unfortunately, there's no simple way to tell. We could use the CALL_COOKIE, but we can't currently tell a register used for regular argument passing from one that is unused. If we leave it up to reload to decide which register to use, it seems to always choose R0_REG, which leaves no available registers in SIBCALL_REGS to hold the address of the trampoline. */ mach = gen_rtx_REG (SImode, MACH_REG); r1 = gen_rtx_REG (SImode, R1_REG); /* Since such a call function may use all call-clobbered registers, we force a mode switch earlier, so that we don't run out of registers when adjusting fpscr for the call. */ emit_insn (gen_force_mode_for_call ()); operands[0] = function_symbol (\"__GCC_shcompact_call_trampoline\"); if (flag_pic) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOT2reg (reg, operands[0])); operands[0] = reg; } operands[0] = force_reg (SImode, operands[0]); /* We don't need a return trampoline, since the callee will return directly to the upper caller. */ if (cookie & CALL_COOKIE_RET_TRAMP (1)) { cookie &= ~ CALL_COOKIE_RET_TRAMP (1); cookie_rtx = GEN_INT (cookie); } emit_move_insn (mach, func); emit_move_insn (r1, cookie_rtx); emit_call_insn (gen_sibcall_compact (operands[0], operands[1], mach)); DONE; } else if (TARGET_SHCOMPACT && flag_pic && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOT2reg (reg, XEXP (operands[0], 0))); XEXP (operands[0], 0) = reg; } if (flag_pic && TARGET_SH2 && GET_CODE (operands[0]) == MEM && GET_CODE (XEXP (operands[0], 0)) == SYMBOL_REF /* The PLT needs the PIC register, but the epilogue would have to restore it, so we can only use PC-relative PIC calls for static functions. */ && SYMBOL_REF_LOCAL_P (XEXP (operands[0], 0))) { emit_call_insn (gen_sibcall_pcrel (XEXP (operands[0], 0), operands[1])); DONE; } else operands[0] = force_reg (SImode, XEXP (operands[0], 0)); emit_call_insn (gen_sibcalli (operands[0], operands[1])); DONE; }") (define_expand "sibcall_value" [(set (match_operand 0 "" "") (call (match_operand 1 "" "") (match_operand 2 "" ""))) (match_operand 3 "" "")] "" " { emit_call_insn (gen_sibcall (operands[1], operands[2], operands[3])); DONE; }") (define_insn "call_value_pop_compact" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 4 "immediate_operand" "n"))) (match_operand 3 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && ! (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%1%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_insn "call_value_pop_compact_rettramp" [(set (match_operand 0 "" "=rf") (call (mem:SI (match_operand:SI 1 "arith_reg_operand" "r")) (match_operand 2 "" ""))) (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 4 "immediate_operand" "n"))) (match_operand 3 "immediate_operand" "n") (use (reg:SI R0_REG)) (use (reg:SI R1_REG)) (use (reg:PSI FPSCR_REG)) (clobber (reg:SI R10_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && (INTVAL (operands[3]) & CALL_COOKIE_RET_TRAMP (1))" "jsr @%1%#" [(set_attr "type" "call") (set (attr "fp_mode") (if_then_else (eq_attr "fpu_single" "yes") (const_string "single") (const_string "double"))) (set_attr "needs_delay_slot" "yes")]) (define_expand "call_value_pop" [(parallel [(set (match_operand 0 "arith_reg_operand" "") (call (mem:SI (match_operand 1 "arith_reg_operand" "")) (match_operand 2 "" ""))) (match_operand 3 "" "") (set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand 4 "" "")))])] "TARGET_SHCOMPACT" " { if (TARGET_SHCOMPACT && operands[3] && INTVAL (operands[3])) { rtx cookie_rtx = operands[3]; long cookie = INTVAL (cookie_rtx); rtx func = XEXP (operands[1], 0); rtx r0, r1; if (flag_pic) { if (GET_CODE (func) == SYMBOL_REF && ! SYMBOL_REF_LOCAL_P (func)) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, func)); func = reg; } else func = legitimize_pic_address (func, Pmode, 0); } r0 = gen_rtx_REG (SImode, R0_REG); r1 = gen_rtx_REG (SImode, R1_REG); /* Since such a call function may use all call-clobbered registers, we force a mode switch earlier, so that we don't run out of registers when adjusting fpscr for the call. */ emit_insn (gen_force_mode_for_call ()); operands[1] = function_symbol (\"__GCC_shcompact_call_trampoline\"); if (flag_pic) { rtx reg = gen_reg_rtx (Pmode); emit_insn (gen_symGOTPLT2reg (reg, operands[1])); operands[1] = reg; } operands[1] = force_reg (SImode, operands[1]); emit_move_insn (r0, func); emit_move_insn (r1, cookie_rtx); if (cookie & CALL_COOKIE_RET_TRAMP (1)) emit_call_insn (gen_call_value_pop_compact_rettramp (operands[0], operands[1], operands[2], operands[3], operands[4])); else emit_call_insn (gen_call_value_pop_compact (operands[0], operands[1], operands[2], operands[3], operands[4])); DONE; } abort (); }") (define_expand "sibcall_epilogue" [(return)] "" " { sh_expand_epilogue (); if (TARGET_SHCOMPACT) { rtx insn, set; /* If epilogue clobbers r0, preserve it in macl. */ for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) if ((set = single_set (insn)) && GET_CODE (SET_DEST (set)) == REG && REGNO (SET_DEST (set)) == R0_REG) { rtx r0 = gen_rtx_REG (SImode, R0_REG); rtx tmp = gen_rtx_REG (SImode, MACL_REG); rtx i; /* We can't tell at this point whether the sibcall is a sibcall_compact and, if it is, whether it uses r0 or mach as operand 2, so let the instructions that preserve r0 be optimized away if r0 turns out to be dead. */ i = emit_insn_before (gen_rtx_SET (SImode, tmp, r0), insn); REG_NOTES (i) = gen_rtx_EXPR_LIST (REG_MAYBE_DEAD, const0_rtx, REG_NOTES (i)); i = emit_move_insn (r0, tmp); REG_NOTES (i) = gen_rtx_EXPR_LIST (REG_MAYBE_DEAD, const0_rtx, REG_NOTES (i)); break; } } DONE; }") (define_insn "indirect_jump_compact" [(set (pc) (match_operand:SI 0 "arith_reg_operand" "r"))] "TARGET_SH1" "jmp @%0%#" [(set_attr "needs_delay_slot" "yes") (set_attr "type" "jump_ind")]) (define_expand "indirect_jump" [(set (pc) (match_operand 0 "register_operand" ""))] "" " { if (TARGET_SHMEDIA && GET_MODE (operands[0]) == SImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); }") ;; The use of operand 1 / 2 helps us distinguish case table jumps ;; which can be present in structured code from indirect jumps which can not ;; be present in structured code. This allows -fprofile-arcs to work. ;; For SH1 processors. (define_insn "casesi_jump_1" [(set (pc) (match_operand:SI 0 "register_operand" "r")) (use (label_ref (match_operand 1 "" "")))] "TARGET_SH1" "jmp @%0%#" [(set_attr "needs_delay_slot" "yes") (set_attr "type" "jump_ind")]) ;; For all later processors. (define_insn "casesi_jump_2" [(set (pc) (plus:SI (match_operand:SI 0 "register_operand" "r") (label_ref (match_operand 1 "" "")))) (use (label_ref (match_operand 2 "" "")))] "TARGET_SH2 && (! INSN_UID (operands[1]) || prev_real_insn (operands[1]) == insn)" "braf %0%#" [(set_attr "needs_delay_slot" "yes") (set_attr "type" "jump_ind")]) (define_insn "casesi_jump_media" [(set (pc) (match_operand:DI 0 "target_reg_operand" "b")) (use (label_ref (match_operand 1 "" "")))] "TARGET_SHMEDIA" "blink %0, r63" [(set_attr "type" "jump_media")]) ;; Call subroutine returning any type. ;; ??? This probably doesn't work. (define_expand "untyped_call" [(parallel [(call (match_operand 0 "" "") (const_int 0)) (match_operand 1 "" "") (match_operand 2 "" "")])] "TARGET_SH2E || TARGET_SHMEDIA" " { int i; emit_call_insn (gen_call (operands[0], const0_rtx, const0_rtx)); for (i = 0; i < XVECLEN (operands[2], 0); i++) { rtx set = XVECEXP (operands[2], 0, i); emit_move_insn (SET_DEST (set), SET_SRC (set)); } /* The optimizer does not know that the call sets the function value registers we stored in the result block. We avoid problems by claiming that all hard registers are used and clobbered at this point. */ emit_insn (gen_blockage ()); DONE; }") ;; ------------------------------------------------------------------------ ;; Misc insns ;; ------------------------------------------------------------------------ (define_insn "dect" [(set (reg:SI T_REG) (eq:SI (match_operand:SI 0 "arith_reg_operand" "+r") (const_int 1))) (set (match_dup 0) (plus:SI (match_dup 0) (const_int -1)))] "TARGET_SH2" "dt %0" [(set_attr "type" "arith")]) (define_insn "nop" [(const_int 0)] "" "nop") ;; Load address of a label. This is only generated by the casesi expand, ;; and by machine_dependent_reorg (fixing up fp moves). ;; This must use unspec, because this only works for labels that are ;; within range, (define_insn "mova" [(set (reg:SI R0_REG) (unspec:SI [(label_ref (match_operand 0 "" ""))] UNSPEC_MOVA))] "TARGET_SH1" "mova %O0,r0" [(set_attr "in_delay_slot" "no") (set_attr "type" "arith")]) ;; machine_dependent_reorg will make this a `mova'. (define_insn "mova_const" [(set (reg:SI R0_REG) (unspec:SI [(match_operand 0 "immediate_operand" "i")] UNSPEC_MOVA))] "TARGET_SH1" "#" [(set_attr "in_delay_slot" "no") (set_attr "type" "arith")]) (define_expand "GOTaddr2picreg" [(set (reg:SI R0_REG) (unspec:SI [(const:SI (unspec:SI [(match_dup 1)] UNSPEC_PIC))] UNSPEC_MOVA)) (set (match_dup 0) (const:SI (unspec:SI [(match_dup 1)] UNSPEC_PIC))) (set (match_dup 0) (plus:SI (match_dup 0) (reg:SI R0_REG)))] "" " { operands[0] = gen_rtx_REG (Pmode, PIC_REG); operands[1] = gen_rtx_SYMBOL_REF (VOIDmode, GOT_SYMBOL_NAME); if (TARGET_SH5) operands[1] = gen_datalabel_ref (operands[1]); if (TARGET_SHMEDIA) { rtx tr = gen_rtx_REG (DImode, TR0_REG); rtx dipic = operands[0]; rtx lab = PATTERN (gen_call_site ()); rtx insn, equiv; equiv = operands[1]; operands[1] = gen_rtx_MINUS (DImode, operands[1], gen_rtx_CONST (DImode, gen_rtx_MINUS (DImode, gen_rtx_CONST (DImode, lab), pc_rtx))); operands[1] = gen_sym2PIC (operands[1]); PUT_MODE (operands[1], DImode); if (GET_MODE (dipic) != DImode) dipic = gen_rtx_SUBREG (DImode, dipic, 0); if (TARGET_SHMEDIA64) emit_insn (gen_movdi_const (dipic, operands[1])); else emit_insn (gen_movdi_const_32bit (dipic, operands[1])); emit_insn (gen_ptrel (tr, dipic, lab)); if (GET_MODE (operands[0]) != GET_MODE (tr)) tr = gen_lowpart (GET_MODE (operands[0]), tr); insn = emit_move_insn (operands[0], tr); REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, equiv, REG_NOTES (insn)); DONE; } } ") (define_insn "*ptb" [(set (match_operand:DI 0 "target_reg_operand" "=b") (const:DI (unspec:DI [(match_operand:DI 1 "" "Csy")] UNSPEC_DATALABEL)))] "TARGET_SHMEDIA && flag_pic && EXTRA_CONSTRAINT_Csy (operands[1])" "ptb/u datalabel %1, %0" [(set_attr "type" "pt_media") (set_attr "length" "*")]) (define_insn "ptrel" [(set (match_operand:DI 0 "target_reg_operand" "=b") (plus:DI (match_operand:DI 1 "register_operand" "r") (pc))) (match_operand:DI 2 "" "")] "TARGET_SHMEDIA" "%O2: ptrel/u %1, %0" [(set_attr "type" "ptabs_media")]) (define_expand "builtin_setjmp_receiver" [(match_operand 0 "" "")] "flag_pic" " { emit_insn (gen_GOTaddr2picreg ()); DONE; }") (define_expand "call_site" [(unspec [(match_dup 0)] UNSPEC_CALLER)] "TARGET_SH1" " { static HOST_WIDE_INT i = 0; operands[0] = GEN_INT (i); i++; }") (define_expand "sym_label2reg" [(set (match_operand:SI 0 "" "") (const:SI (minus:SI (const:SI (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_PIC)) (const:SI (plus:SI (match_operand:SI 2 "" "") (const_int 2))))))] "TARGET_SH1" "") (define_expand "symGOT_load" [(set (match_dup 2) (match_operand 1 "" "")) (set (match_dup 3) (plus (match_dup 2) (reg PIC_REG))) (set (match_operand 0 "" "") (mem (match_dup 3)))] "" " { rtx insn; operands[2] = no_new_pseudos ? operands[0] : gen_reg_rtx (Pmode); operands[3] = no_new_pseudos ? operands[0] : gen_reg_rtx (Pmode); if (TARGET_SHMEDIA) { rtx reg = operands[2]; if (GET_MODE (reg) != DImode) reg = gen_rtx_SUBREG (DImode, reg, 0); if (flag_pic > 1) emit_insn (gen_movdi_const_32bit (reg, operands[1])); else emit_insn (gen_movdi_const_16bit (reg, operands[1])); } else emit_move_insn (operands[2], operands[1]); emit_move_insn (operands[3], gen_rtx_PLUS (Pmode, operands[2], gen_rtx_REG (Pmode, PIC_REG))); insn = emit_move_insn (operands[0], gen_rtx_MEM (Pmode, operands[3])); REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, XVECEXP (XEXP (operands[1], 0), 0, 0), REG_NOTES (insn)); DONE; }") (define_expand "sym2GOT" [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOT))] "" "") (define_expand "symGOT2reg" [(match_operand 0 "" "") (match_operand 1 "" "")] "" " { rtx gotsym, insn; gotsym = gen_sym2GOT (operands[1]); PUT_MODE (gotsym, Pmode); insn = emit_insn (gen_symGOT_load (operands[0], gotsym)); RTX_UNCHANGING_P (SET_SRC (PATTERN (insn))) = 1; DONE; }") (define_expand "sym2GOTPLT" [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTPLT))] "" "") (define_expand "symGOTPLT2reg" [(match_operand 0 "" "") (match_operand 1 "" "")] "" " { emit_insn (gen_symGOT_load (operands[0], gen_sym2GOTPLT (operands[1]))); DONE; }") (define_expand "sym2GOTOFF" [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTOFF))] "" "") (define_expand "symGOTOFF2reg" [(match_operand 0 "" "") (match_operand 1 "" "")] "" " { rtx gotoffsym, insn; rtx t = no_new_pseudos ? operands[0] : gen_reg_rtx (GET_MODE (operands[0])); gotoffsym = gen_sym2GOTOFF (operands[1]); PUT_MODE (gotoffsym, Pmode); emit_move_insn (t, gotoffsym); insn = emit_move_insn (operands[0], gen_rtx_PLUS (Pmode, t, gen_rtx_REG (Pmode, PIC_REG))); REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_EQUAL, operands[1], REG_NOTES (insn)); DONE; }") (define_expand "symPLT_label2reg" [(set (match_operand:SI 0 "" "") (const:SI (minus:SI (const:SI (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_PLT)) (const:SI (minus:SI (const:SI (plus:SI (match_operand:SI 2 "" "") (const_int 2))) (const:SI (unspec:SI [(pc)] UNSPEC_PIC))))))) ;; Even though the PIC register is not really used by the call ;; sequence in which this is expanded, the PLT code assumes the PIC ;; register is set, so we must not skip its initialization. Since ;; we only use this expand as part of calling sequences, and never ;; to take the address of a function, this is the best point to ;; insert the (use). Using the PLT to take the address of a ;; function would be wrong, not only because the PLT entry could ;; then be called from a function that doesn't initialize the PIC ;; register to the proper GOT, but also because pointers to the ;; same function might not compare equal, should they be set by ;; different shared libraries. (use (reg:SI PIC_REG))] "TARGET_SH1" "") (define_expand "sym2PIC" [(const (unspec [(match_operand:SI 0 "" "")] UNSPEC_PIC))] "" "") ;; TLS code generation. ;; ??? this should be a define_insn_and_split ;; See the thread [PATCH/RFA] SH TLS support on gcc-patches ;; ;; for details. (define_insn "tls_global_dynamic" [(set (match_operand:SI 0 "register_operand" "=&z") (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_TLSGD)) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (clobber (reg:SI PR_REG)) (clobber (scratch:SI))] "TARGET_SH1" "* { return \"\\ mov.l\\t1f,r4\\n\\ \\tmova\\t2f,r0\\n\\ \\tmov.l\\t2f,r1\\n\\ \\tadd\\tr0,r1\\n\\ \\tjsr\\t@r1\\n\\ \\tadd\\tr12,r4\\n\\ \\tbra\\t3f\\n\\ \\tnop\\n\\ \\t.align\\t2\\n\\ 1:\\t.long\\t%a1@TLSGD\\n\\ 2:\\t.long\\t__tls_get_addr@PLT\\n\\ 3:\"; }" [(set_attr "type" "tls_load") (set_attr "length" "26")]) (define_insn "tls_local_dynamic" [(set (match_operand:SI 0 "register_operand" "=&z") (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_TLSLDM)) (use (reg:PSI FPSCR_REG)) (use (reg:SI PIC_REG)) (clobber (reg:SI PR_REG)) (clobber (scratch:SI))] "TARGET_SH1" "* { return \"\\ mov.l\\t1f,r4\\n\\ \\tmova\\t2f,r0\\n\\ \\tmov.l\\t2f,r1\\n\\ \\tadd\\tr0,r1\\n\\ \\tjsr\\t@r1\\n\\ \\tadd\\tr12,r4\\n\\ \\tbra\\t3f\\n\\ \\tnop\\n\\ \\t.align\\t2\\n\\ 1:\\t.long\\t%a1@TLSLDM\\n\\ 2:\\t.long\\t__tls_get_addr@PLT\\n\\ 3:\"; }" [(set_attr "type" "tls_load") (set_attr "length" "26")]) (define_expand "sym2DTPOFF" [(const (unspec [(match_operand 0 "" "")] UNSPEC_DTPOFF))] "" "") (define_expand "symDTPOFF2reg" [(match_operand 0 "" "") (match_operand 1 "" "") (match_operand 2 "" "")] "" " { rtx dtpoffsym, insn; rtx t = no_new_pseudos ? operands[0] : gen_reg_rtx (GET_MODE (operands[0])); dtpoffsym = gen_sym2DTPOFF (operands[1]); PUT_MODE (dtpoffsym, Pmode); emit_move_insn (t, dtpoffsym); insn = emit_move_insn (operands[0], gen_rtx_PLUS (Pmode, t, operands[2])); DONE; }") (define_expand "sym2GOTTPOFF" [(const (unspec [(match_operand 0 "" "")] UNSPEC_GOTTPOFF))] "" "") (define_insn "tls_initial_exec" [(set (match_operand:SI 0 "register_operand" "=&r") (unspec:SI [(match_operand:SI 1 "" "")] UNSPEC_TLSIE)) (use (reg:SI GBR_REG)) (use (reg:SI PIC_REG)) (clobber (reg:SI R0_REG))] "" "* { return \"\\ mov.l\\t1f,r0\\n\\ \\tstc\\tgbr,%0\\n\\ \\tmov.l\\t@(r0,r12),r0\\n\\ \\tbra\\t2f\\n\\ \\tadd\\tr0,%0\\n\\ \\t.align\\t2\\n\\ 1:\\t.long\\t%a1\\n\\ 2:\"; }" [(set_attr "type" "tls_load") (set_attr "length" "16")]) (define_expand "sym2TPOFF" [(const (unspec [(match_operand 0 "" "")] UNSPEC_TPOFF))] "" "") (define_expand "symTPOFF2reg" [(match_operand 0 "" "") (match_operand 1 "" "")] "" " { rtx tpoffsym, insn; tpoffsym = gen_sym2TPOFF (operands[1]); PUT_MODE (tpoffsym, Pmode); insn = emit_move_insn (operands[0], tpoffsym); DONE; }") (define_insn "load_gbr" [(set (match_operand:SI 0 "register_operand" "") (reg:SI GBR_REG)) (use (reg:SI GBR_REG))] "" "stc gbr,%0" [(set_attr "type" "tls_load")]) ;; case instruction for switch statements. ;; Operand 0 is index ;; operand 1 is the minimum bound ;; operand 2 is the maximum bound - minimum bound + 1 ;; operand 3 is CODE_LABEL for the table; ;; operand 4 is the CODE_LABEL to go to if index out of range. (define_expand "casesi" [(match_operand:SI 0 "arith_reg_operand" "") (match_operand:SI 1 "arith_reg_operand" "") (match_operand:SI 2 "arith_reg_operand" "") (match_operand 3 "" "") (match_operand 4 "" "")] "" " { rtx reg = gen_reg_rtx (SImode); rtx reg2 = gen_reg_rtx (SImode); if (TARGET_SHMEDIA) { rtx reg = gen_reg_rtx (DImode); rtx reg2 = gen_reg_rtx (DImode); rtx reg3 = gen_reg_rtx (DImode); rtx reg4 = gen_reg_rtx (DImode); rtx reg5 = gen_reg_rtx (DImode); operands[0] = convert_modes (DImode, SImode, operands[0], 0); operands[1] = convert_modes (DImode, SImode, operands[1], 0); operands[2] = convert_modes (DImode, SImode, operands[2], 1); emit_jump_insn (gen_bgt_media (operands[4], operands[1], operands[0])); emit_move_insn (reg, gen_rtx_MINUS (DImode, operands[0], operands[1])); emit_jump_insn (gen_bgtu_media (operands[4], reg, operands[2])); emit_insn (gen_casesi_shift_media (reg2, reg, operands[3])); emit_move_insn (reg3, gen_datalabel_ref (gen_rtx_LABEL_REF (DImode, operands[3]))); emit_insn (gen_casesi_load_media (reg4, reg3, reg2, operands[3])); emit_move_insn (reg5, gen_rtx_PLUS (DImode, reg3, reg4)); emit_jump_insn (gen_casesi_jump_media (reg5, operands[3])); emit_barrier (); DONE; } operands[1] = copy_to_mode_reg (SImode, operands[1]); operands[2] = copy_to_mode_reg (SImode, operands[2]); /* If optimizing, casesi_worker depends on the mode of the instruction before label it 'uses' - operands[3]. */ emit_insn (gen_casesi_0 (operands[0], operands[1], operands[2], operands[4], reg)); emit_insn (gen_casesi_worker_0 (reg2, reg, operands[3])); if (TARGET_SH2) emit_jump_insn (gen_casesi_jump_2 (reg2, gen_label_rtx (), operands[3])); else emit_jump_insn (gen_casesi_jump_1 (reg2, operands[3])); /* For SH2 and newer, the ADDR_DIFF_VEC is not actually relative to operands[3], but to lab. We will fix this up in machine_dependent_reorg. */ emit_barrier (); DONE; }") (define_expand "casesi_0" [(set (match_operand:SI 4 "" "") (match_operand:SI 0 "arith_reg_operand" "")) (set (match_dup 4) (minus:SI (match_dup 4) (match_operand:SI 1 "arith_operand" ""))) (set (reg:SI T_REG) (gtu:SI (match_dup 4) (match_operand:SI 2 "arith_reg_operand" ""))) (set (pc) (if_then_else (ne (reg:SI T_REG) (const_int 0)) (label_ref (match_operand 3 "" "")) (pc)))] "TARGET_SH1" "") ;; ??? reload might clobber r0 if we use it explicitly in the RTL before ;; reload; using a R0_REGS pseudo reg is likely to give poor code. ;; So we keep the use of r0 hidden in a R0_REGS clobber until after reload. (define_insn "casesi_worker_0" [(set (match_operand:SI 0 "register_operand" "=r,r") (unspec:SI [(match_operand:SI 1 "register_operand" "0,r") (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) (clobber (match_scratch:SI 3 "=X,1")) (clobber (match_scratch:SI 4 "=&z,z"))] "TARGET_SH1" "#") (define_split [(set (match_operand:SI 0 "register_operand" "") (unspec:SI [(match_operand:SI 1 "register_operand" "") (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) (clobber (match_scratch:SI 3 "")) (clobber (match_scratch:SI 4 ""))] "TARGET_SH1 && ! TARGET_SH2 && reload_completed" [(set (reg:SI R0_REG) (unspec:SI [(label_ref (match_dup 2))] UNSPEC_MOVA)) (parallel [(set (match_dup 0) (unspec:SI [(reg:SI R0_REG) (match_dup 1) (label_ref (match_dup 2))] UNSPEC_CASESI)) (clobber (match_dup 3))]) (set (match_dup 0) (plus:SI (match_dup 0) (reg:SI R0_REG)))] "if (GET_CODE (operands[2]) == CODE_LABEL) LABEL_NUSES (operands[2])++;") (define_split [(set (match_operand:SI 0 "register_operand" "") (unspec:SI [(match_operand:SI 1 "register_operand" "") (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) (clobber (match_scratch:SI 3 "")) (clobber (match_scratch:SI 4 ""))] "TARGET_SH2 && reload_completed" [(set (reg:SI R0_REG) (unspec:SI [(label_ref (match_dup 2))] UNSPEC_MOVA)) (parallel [(set (match_dup 0) (unspec:SI [(reg:SI R0_REG) (match_dup 1) (label_ref (match_dup 2))] UNSPEC_CASESI)) (clobber (match_dup 3))])] "if (GET_CODE (operands[2]) == CODE_LABEL) LABEL_NUSES (operands[2])++;") (define_insn "*casesi_worker" [(set (match_operand:SI 0 "register_operand" "=r,r") (unspec:SI [(reg:SI R0_REG) (match_operand:SI 1 "register_operand" "0,r") (label_ref (match_operand 2 "" ""))] UNSPEC_CASESI)) (clobber (match_scratch:SI 3 "=X,1"))] "TARGET_SH1" "* { rtx diff_vec = PATTERN (next_real_insn (operands[2])); if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) abort (); switch (GET_MODE (diff_vec)) { case SImode: return \"shll2 %1\;mov.l @(r0,%1),%0\"; case HImode: return \"add %1,%1\;mov.w @(r0,%1),%0\"; case QImode: if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) return \"mov.b @(r0,%1),%0\;extu.b %0,%0\"; return \"mov.b @(r0,%1),%0\"; default: abort (); } }" [(set_attr "length" "4")]) (define_insn "casesi_shift_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (ashift:DI (match_operand:DI 1 "arith_reg_operand" "r") (unspec:DI [(label_ref:DI (match_operand 2 "" ""))] UNSPEC_CASESI)))] "TARGET_SHMEDIA" "* { rtx diff_vec = PATTERN (next_real_insn (operands[2])); if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) abort (); switch (GET_MODE (diff_vec)) { case SImode: return \"shlli %1, 2, %0\"; case HImode: return \"shlli %1, 1, %0\"; case QImode: if (rtx_equal_p (operands[0], operands[1])) return \"\"; return \"add %1, r63, %0\"; default: abort (); } }" [(set_attr "type" "arith_media")]) (define_insn "casesi_load_media" [(set (match_operand:DI 0 "arith_reg_operand" "=r") (mem:DI (unspec [(match_operand 1 "arith_reg_operand" "r") (match_operand 2 "arith_reg_operand" "r") (label_ref:DI (match_operand 3 "" ""))] 2)))] "TARGET_SHMEDIA" "* { rtx diff_vec = PATTERN (next_real_insn (operands[3])); if (GET_CODE (diff_vec) != ADDR_DIFF_VEC) abort (); switch (GET_MODE (diff_vec)) { case SImode: return \"ldx.l %1, %2, %0\"; case HImode: #if 0 if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) return \"ldx.uw %1, %2, %0\"; #endif return \"ldx.w %1, %2, %0\"; case QImode: if (ADDR_DIFF_VEC_FLAGS (diff_vec).offset_unsigned) return \"ldx.ub %1, %2, %0\"; return \"ldx.b %1, %2, %0\"; default: abort (); } }" [(set_attr "type" "load_media")]) (define_expand "return" [(return)] "reload_completed && ! sh_need_epilogue ()" " { if (TARGET_SHMEDIA) { emit_jump_insn (gen_return_media ()); DONE; } if (TARGET_SHCOMPACT && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))) { emit_jump_insn (gen_shcompact_return_tramp ()); DONE; } }") (define_insn "*return_i" [(return)] "TARGET_SH1 && ! (TARGET_SHCOMPACT && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))) && reload_completed" "%@ %#" [(set_attr "type" "return") (set_attr "needs_delay_slot" "yes")]) (define_expand "shcompact_return_tramp" [(return)] "TARGET_SHCOMPACT && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))" " { rtx reg = gen_rtx_REG (Pmode, R0_REG); rtx sym = function_symbol (\"__GCC_shcompact_return_trampoline\"); if (flag_pic) emit_insn (gen_symGOTPLT2reg (reg, sym)); else emit_move_insn (reg, sym); emit_jump_insn (gen_shcompact_return_tramp_i ()); DONE; }") (define_insn "shcompact_return_tramp_i" [(parallel [(return) (use (reg:SI R0_REG))])] "TARGET_SHCOMPACT && (current_function_args_info.call_cookie & CALL_COOKIE_RET_TRAMP (1))" "jmp @r0%#" [(set_attr "type" "jump_ind") (set_attr "needs_delay_slot" "yes")]) (define_insn "return_media_i" [(parallel [(return) (use (match_operand:DI 0 "target_reg_operand" "k"))])] "TARGET_SHMEDIA && reload_completed" "blink %0, r63" [(set_attr "type" "jump_media")]) (define_insn "return_media_rte" [(return)] "TARGET_SHMEDIA && reload_completed && current_function_interrupt" "rte" [(set_attr "type" "jump_media")]) (define_expand "return_media" [(return)] "TARGET_SHMEDIA && reload_completed" " { int tr_regno = sh_media_register_for_return (); rtx tr; if (current_function_interrupt) { emit_jump_insn (gen_return_media_rte ()); DONE; } if (tr_regno < 0) { rtx r18 = gen_rtx_REG (DImode, PR_MEDIA_REG); if (! call_used_regs[TR0_REG] || fixed_regs[TR0_REG]) abort (); tr_regno = TR0_REG; tr = gen_rtx_REG (DImode, tr_regno); emit_move_insn (tr, r18); } else tr = gen_rtx_REG (DImode, tr_regno); emit_jump_insn (gen_return_media_i (tr)); DONE; }") (define_insn "shcompact_preserve_incoming_args" [(set (match_operand:SI 0 "register_operand" "+r") (unspec:SI [(match_dup 0)] UNSPEC_COMPACT_ARGS))] "TARGET_SHCOMPACT" "" [(set_attr "length" "0")]) (define_insn "shcompact_incoming_args" [(set (reg:SI R2_REG) (unspec:SI [(reg:SI R2_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R3_REG) (unspec:SI [(reg:SI R3_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R4_REG) (unspec:SI [(reg:SI R4_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R5_REG) (unspec:SI [(reg:SI R5_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R6_REG) (unspec:SI [(reg:SI R6_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R7_REG) (unspec:SI [(reg:SI R7_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R8_REG) (unspec:SI [(reg:SI R8_REG)] UNSPEC_COMPACT_ARGS)) (set (reg:SI R9_REG) (unspec:SI [(reg:SI R9_REG)] UNSPEC_COMPACT_ARGS)) (set (mem:BLK (reg:SI MACL_REG)) (unspec:BLK [(reg:SI MACH_REG)] UNSPEC_COMPACT_ARGS)) (use (reg:SI R0_REG)) (clobber (reg:SI R0_REG)) (clobber (reg:SI MACL_REG)) (clobber (reg:SI MACH_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT" "jsr @r0%#" [(set_attr "needs_delay_slot" "yes")]) (define_insn "shmedia_save_restore_regs_compact" [(set (reg:SI SP_REG) (plus:SI (reg:SI SP_REG) (match_operand:SI 0 "immediate_operand" "i"))) (use (reg:SI R0_REG)) (clobber (reg:SI PR_REG))] "TARGET_SHCOMPACT && (INTVAL (operands[0]) == SHMEDIA_REGS_STACK_ADJUST () || INTVAL (operands[0]) == - SHMEDIA_REGS_STACK_ADJUST ())" "jsr @r0%#" [(set_attr "needs_delay_slot" "yes")]) (define_expand "prologue" [(const_int 0)] "" "sh_expand_prologue (); DONE;") (define_expand "epilogue" [(return)] "" " { sh_expand_epilogue (); emit_jump_insn (gen_return ()); DONE; }") (define_expand "eh_return" [(use (match_operand 0 "register_operand" ""))] "" { rtx tmp, ra = operands[0]; if (TARGET_SHMEDIA64) emit_insn (gen_eh_set_ra_di (ra)); else emit_insn (gen_eh_set_ra_si (ra)); DONE; }) ;; Clobber the return address on the stack. We can't expand this ;; until we know where it will be put in the stack frame. (define_insn "eh_set_ra_si" [(unspec [(match_operand:SI 0 "register_operand" "r")] UNSPEC_EH_RETURN) (clobber (match_scratch:SI 1 "=&r"))] "! TARGET_SHMEDIA64" "#") (define_insn "eh_set_ra_di" [(unspec [(match_operand:DI 0 "register_operand" "r")] UNSPEC_EH_RETURN) (clobber (match_scratch:DI 1 "=&r"))] "TARGET_SHMEDIA64" "#") (define_split [(unspec [(match_operand 0 "register_operand" "")] UNSPEC_EH_RETURN) (clobber (match_scratch 1 ""))] "reload_completed" [(const_int 0)] " { sh_set_return_address (operands[0], operands[1]); DONE; }") (define_insn "blockage" [(unspec_volatile [(const_int 0)] UNSPECV_BLOCKAGE)] "" "" [(set_attr "length" "0")]) ;; ------------------------------------------------------------------------ ;; Scc instructions ;; ------------------------------------------------------------------------ (define_insn "movt" [(set (match_operand:SI 0 "arith_reg_operand" "=r") (eq:SI (reg:SI T_REG) (const_int 1)))] "TARGET_SH1" "movt %0" [(set_attr "type" "arith")]) (define_expand "seq" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); switch (GET_MODE (sh_compare_op0)) { case DImode: emit_insn (gen_cmpeqdi_media (operands[0], sh_compare_op0, sh_compare_op1)); break; case SFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpeqsf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; case DFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpeqdf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; default: FAIL; } DONE; } if (sh_expand_t_scc (EQ, operands[0])) DONE; if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (EQ); }") (define_expand "slt" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); switch (GET_MODE (sh_compare_op0)) { case DImode: emit_insn (gen_cmpgtdi_media (operands[0], sh_compare_op1, sh_compare_op0)); break; case SFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgtsf_media (operands[0], sh_compare_op1, sh_compare_op0)); break; case DFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgtdf_media (operands[0], sh_compare_op1, sh_compare_op0)); break; default: FAIL; } DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (LT); }") (define_expand "sle" [(match_operand:SI 0 "arith_reg_operand" "")] "" " { rtx tmp = sh_compare_op0; if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); switch (GET_MODE (sh_compare_op0)) { case DImode: { tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); emit_insn (gen_cmpgtdi_media (tmp, sh_compare_op0, sh_compare_op1)); emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); break; } case SFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgesf_media (operands[0], sh_compare_op1, sh_compare_op0)); break; case DFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgedf_media (operands[0], sh_compare_op1, sh_compare_op0)); break; default: FAIL; } DONE; } sh_compare_op0 = sh_compare_op1; sh_compare_op1 = tmp; emit_insn (gen_sge (operands[0])); DONE; }") (define_expand "sgt" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); switch (GET_MODE (sh_compare_op0)) { case DImode: emit_insn (gen_cmpgtdi_media (operands[0], sh_compare_op0, sh_compare_op1)); break; case SFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgtsf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; case DFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgtdf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; default: FAIL; } DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (GT); }") (define_expand "sge" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); switch (GET_MODE (sh_compare_op0)) { case DImode: { rtx tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); emit_insn (gen_cmpgtdi_media (tmp, sh_compare_op1, sh_compare_op0)); emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); break; } case SFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgesf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; case DFmode: if (! TARGET_SHMEDIA_FPU) FAIL; emit_insn (gen_cmpgedf_media (operands[0], sh_compare_op0, sh_compare_op1)); break; default: FAIL; } DONE; } if (! rtx_equal_function_value_matters) FAIL; if (GET_MODE_CLASS (GET_MODE (sh_compare_op0)) == MODE_FLOAT) { if (TARGET_IEEE) { rtx lab = gen_label_rtx (); prepare_scc_operands (EQ); emit_jump_insn (gen_branch_true (lab)); prepare_scc_operands (GT); emit_label (lab); emit_insn (gen_movt (operands[0])); } else emit_insn (gen_movnegt (operands[0], prepare_scc_operands (LT))); DONE; } operands[1] = prepare_scc_operands (GE); }") (define_expand "sgtu" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); emit_insn (gen_cmpgtudi_media (operands[0], sh_compare_op0, sh_compare_op1)); DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (GTU); }") (define_expand "sltu" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); emit_insn (gen_cmpgtudi_media (operands[0], sh_compare_op1, sh_compare_op0)); DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (LTU); }") (define_expand "sleu" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { rtx tmp; if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); emit_insn (gen_cmpgtudi_media (tmp, sh_compare_op0, sh_compare_op1)); emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (LEU); }") (define_expand "sgeu" [(set (match_operand:SI 0 "arith_reg_operand" "") (match_dup 1))] "" " { if (TARGET_SHMEDIA) { rtx tmp; if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); emit_insn (gen_cmpgtudi_media (tmp, sh_compare_op1, sh_compare_op0)); emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); DONE; } if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (GEU); }") ;; sne moves the complement of the T reg to DEST like this: ;; cmp/eq ... ;; mov #-1,temp ;; negc temp,dest ;; This is better than xoring compare result with 1 because it does ;; not require r0 and further, the -1 may be CSE-ed or lifted out of a ;; loop. (define_expand "sne" [(set (match_dup 2) (const_int -1)) (parallel [(set (match_operand:SI 0 "arith_reg_operand" "") (neg:SI (plus:SI (match_dup 1) (match_dup 2)))) (set (reg:SI T_REG) (ne:SI (ior:SI (match_dup 1) (match_dup 2)) (const_int 0)))])] "" " { if (TARGET_SHMEDIA) { rtx tmp; if (GET_MODE (operands[0]) != DImode) operands[0] = gen_rtx_SUBREG (DImode, operands[0], 0); if (! TARGET_SHMEDIA_FPU && GET_MODE (sh_compare_op0) != DImode) FAIL; sh_compare_op0 = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); if (sh_compare_op1 != const0_rtx) sh_compare_op1 = force_reg (GET_MODE (sh_compare_op1) == VOIDmode ? GET_MODE (sh_compare_op0) : GET_MODE (sh_compare_op1), sh_compare_op1); tmp = no_new_pseudos ? operands[0] : gen_reg_rtx (DImode); emit_insn (gen_seq (tmp)); emit_insn (gen_cmpeqdi_media (operands[0], tmp, const0_rtx)); DONE; } if (sh_expand_t_scc (NE, operands[0])) DONE; if (! rtx_equal_function_value_matters) FAIL; operands[1] = prepare_scc_operands (EQ); operands[2] = gen_reg_rtx (SImode); }") (define_expand "sunordered" [(set (match_operand:DI 0 "arith_reg_operand" "") (unordered:DI (match_dup 1) (match_dup 2)))] "TARGET_SHMEDIA_FPU" " { operands[1] = force_reg (GET_MODE (sh_compare_op0), sh_compare_op0); operands[2] = force_reg (GET_MODE (sh_compare_op1), sh_compare_op1); }") ;; Use the same trick for FP sle / sge (define_expand "movnegt" [(set (match_dup 2) (const_int -1)) (parallel [(set (match_operand 0 "" "") (neg:SI (plus:SI (match_dup 1) (match_dup 2)))) (set (reg:SI T_REG) (ne:SI (ior:SI (match_operand 1 "" "") (match_dup 2)) (const_int 0)))])] "TARGET_SH1" "operands[2] = gen_reg_rtx (SImode);") ;; Recognize mov #-1/negc/neg sequence, and change it to movt/add #-1. ;; This prevents a regression that occurred when we switched from xor to ;; mov/neg for sne. (define_split [(set (match_operand:SI 0 "arith_reg_operand" "") (plus:SI (reg:SI T_REG) (const_int -1)))] "TARGET_SH1" [(set (match_dup 0) (eq:SI (reg:SI T_REG) (const_int 1))) (set (match_dup 0) (plus:SI (match_dup 0) (const_int -1)))] "") ;; ------------------------------------------------------------------------- ;; Instructions to cope with inline literal tables ;; ------------------------------------------------------------------------- ; 2 byte integer in line (define_insn "consttable_2" [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") (match_operand 1 "" "")] UNSPECV_CONST2)] "" "* { if (operands[1] != const0_rtx) assemble_integer (operands[0], 2, BITS_PER_UNIT * 2, 1); return \"\"; }" [(set_attr "length" "2") (set_attr "in_delay_slot" "no")]) ; 4 byte integer in line (define_insn "consttable_4" [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") (match_operand 1 "" "")] UNSPECV_CONST4)] "" "* { if (operands[1] != const0_rtx) assemble_integer (operands[0], 4, BITS_PER_UNIT * 4, 1); return \"\"; }" [(set_attr "length" "4") (set_attr "in_delay_slot" "no")]) ; 8 byte integer in line (define_insn "consttable_8" [(unspec_volatile [(match_operand:SI 0 "general_operand" "=g") (match_operand 1 "" "")] UNSPECV_CONST8)] "" "* { if (operands[1] != const0_rtx) assemble_integer (operands[0], 8, BITS_PER_UNIT * 8, 1); return \"\"; }" [(set_attr "length" "8") (set_attr "in_delay_slot" "no")]) ; 4 byte floating point (define_insn "consttable_sf" [(unspec_volatile [(match_operand:SF 0 "general_operand" "=g") (match_operand 1 "" "")] UNSPECV_CONST4)] "" "* { if (operands[1] != const0_rtx) { REAL_VALUE_TYPE d; REAL_VALUE_FROM_CONST_DOUBLE (d, operands[0]); assemble_real (d, SFmode, GET_MODE_ALIGNMENT (SFmode)); } return \"\"; }" [(set_attr "length" "4") (set_attr "in_delay_slot" "no")]) ; 8 byte floating point (define_insn "consttable_df" [(unspec_volatile [(match_operand:DF 0 "general_operand" "=g") (match_operand 1 "" "")] UNSPECV_CONST8)] "" "* { if (operands[1] != const0_rtx) { REAL_VALUE_TYPE d; REAL_VALUE_FROM_CONST_DOUBLE (d, operands[0]); assemble_real (d, DFmode, GET_MODE_ALIGNMENT (DFmode)); } return \"\"; }" [(set_attr "length" "8") (set_attr "in_delay_slot" "no")]) ;; Alignment is needed for some constant tables; it may also be added for ;; Instructions at the start of loops, or after unconditional branches. ;; ??? We would get more accurate lengths if we did instruction ;; alignment based on the value of INSN_CURRENT_ADDRESS; the approach used ;; here is too conservative. ; align to a two byte boundary (define_expand "align_2" [(unspec_volatile [(const_int 1)] UNSPECV_ALIGN)] "" "") ; align to a four byte boundary ;; align_4 and align_log are instructions for the starts of loops, or ;; after unconditional branches, which may take up extra room. (define_expand "align_4" [(unspec_volatile [(const_int 2)] UNSPECV_ALIGN)] "" "") ; align to a cache line boundary (define_insn "align_log" [(unspec_volatile [(match_operand 0 "const_int_operand" "")] UNSPECV_ALIGN)] "" "" [(set_attr "length" "0") (set_attr "in_delay_slot" "no")]) ; emitted at the end of the literal table, used to emit the ; 32bit branch labels if needed. (define_insn "consttable_end" [(unspec_volatile [(const_int 0)] UNSPECV_CONST_END)] "" "* return output_jump_label_table ();" [(set_attr "in_delay_slot" "no")]) ; emitted at the end of the window in the literal table. (define_insn "consttable_window_end" [(unspec_volatile [(match_operand 0 "" "")] UNSPECV_WINDOW_END)] "" "" [(set_attr "length" "0") (set_attr "in_delay_slot" "no")]) ;; ------------------------------------------------------------------------- ;; Misc ;; ------------------------------------------------------------------------- ;; String/block move insn. (define_expand "movstrsi" [(parallel [(set (mem:BLK (match_operand:BLK 0 "" "")) (mem:BLK (match_operand:BLK 1 "" ""))) (use (match_operand:SI 2 "nonmemory_operand" "")) (use (match_operand:SI 3 "immediate_operand" "")) (clobber (reg:SI PR_REG)) (clobber (reg:SI R4_REG)) (clobber (reg:SI R5_REG)) (clobber (reg:SI R0_REG))])] "TARGET_SH1 && ! TARGET_SH5" " { if(expand_block_move (operands)) DONE; else FAIL; }") (define_insn "block_move_real" [(parallel [(set (mem:BLK (reg:SI R4_REG)) (mem:BLK (reg:SI R5_REG))) (use (match_operand:SI 0 "arith_reg_operand" "r")) (clobber (reg:SI PR_REG)) (clobber (reg:SI R0_REG))])] "TARGET_SH1 && ! TARGET_HARD_SH4" "jsr @%0%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_insn "block_lump_real" [(parallel [(set (mem:BLK (reg:SI R4_REG)) (mem:BLK (reg:SI R5_REG))) (use (match_operand:SI 0 "arith_reg_operand" "r")) (use (reg:SI R6_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI T_REG)) (clobber (reg:SI R4_REG)) (clobber (reg:SI R5_REG)) (clobber (reg:SI R6_REG)) (clobber (reg:SI R0_REG))])] "TARGET_SH1 && ! TARGET_HARD_SH4" "jsr @%0%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_insn "block_move_real_i4" [(parallel [(set (mem:BLK (reg:SI R4_REG)) (mem:BLK (reg:SI R5_REG))) (use (match_operand:SI 0 "arith_reg_operand" "r")) (clobber (reg:SI PR_REG)) (clobber (reg:SI R0_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R2_REG))])] "TARGET_HARD_SH4" "jsr @%0%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) (define_insn "block_lump_real_i4" [(parallel [(set (mem:BLK (reg:SI R4_REG)) (mem:BLK (reg:SI R5_REG))) (use (match_operand:SI 0 "arith_reg_operand" "r")) (use (reg:SI R6_REG)) (clobber (reg:SI PR_REG)) (clobber (reg:SI T_REG)) (clobber (reg:SI R4_REG)) (clobber (reg:SI R5_REG)) (clobber (reg:SI R6_REG)) (clobber (reg:SI R0_REG)) (clobber (reg:SI R1_REG)) (clobber (reg:SI R2_REG)) (clobber (reg:SI R3_REG))])] "TARGET_HARD_SH4" "jsr @%0%#" [(set_attr "type" "sfunc") (set_attr "needs_delay_slot" "yes")]) ;; ------------------------------------------------------------------------- ;; Floating point instructions. ;; ------------------------------------------------------------------------- ;; ??? All patterns should have a type attribute. (define_expand "fpu_switch0" [(set (match_operand:SI 0 "" "") (match_dup 2)) (set (match_dup 1) (mem:PSI (match_dup 0)))] "TARGET_SH4" " { operands[1] = get_fpscr_rtx (); operands[2] = gen_rtx_SYMBOL_REF (SImode, \"__fpscr_values\"); if (flag_pic) operands[2] = legitimize_pic_address (operands[2], SImode, no_new_pseudos ? operands[0] : 0); }") (define_expand "fpu_switch1" [(set (match_operand:SI 0 "" "") (match_dup 2)) (set (match_dup 3) (plus:SI (match_dup 0) (const_int 4))) (set (match_dup 1) (mem:PSI (match_dup 3)))] "TARGET_SH4" " { operands[1] = get_fpscr_rtx (); operands[2] = gen_rtx_SYMBOL_REF (SImode, \"__fpscr_values\"); if (flag_pic) operands[2] = legitimize_pic_address (operands[2], SImode, no_new_pseudos ? operands[0] : 0); operands[3] = no_new_pseudos ? operands[0] : gen_reg_rtx (SImode); }") (define_expand "movpsi" [(set (match_operand:PSI 0 "register_operand" "") (match_operand:PSI 1 "general_movsrc_operand" ""))] "TARGET_SH4" "") ;; The c / m alternative is a fake to guide reload to load directly into ;; fpscr, since reload doesn't know how to use post-increment. ;; GO_IF_LEGITIMATE_ADDRESS guards about bogus addresses before reload, ;; SECONDARY_INPUT_RELOAD_CLASS does this during reload, and the insn's ;; predicate after reload. ;; The mac_gp type for r/!c might look a bit odd, but it actually schedules ;; like a mac -> gpr move. (define_insn "fpu_switch" [(set (match_operand:PSI 0 "general_movdst_operand" "=c,c,r,c,c,r,m,r,<") (match_operand:PSI 1 "general_movsrc_operand" "c,>,m,m,r,r,r,!c,c"))] "TARGET_SH2E && (! reload_completed || true_regnum (operands[0]) != FPSCR_REG || GET_CODE (operands[1]) != MEM || GET_CODE (XEXP (operands[1], 0)) != PLUS)" "@ ! precision stays the same lds.l %1,fpscr mov.l %1,%0 # lds %1,fpscr mov %1,%0 mov.l %1,%0 sts fpscr,%0 sts.l fpscr,%0" [(set_attr "length" "0,2,2,4,2,2,2,2,2") (set_attr "type" "nil,mem_fpscr,load,mem_fpscr,gp_fpscr,move,store,mac_gp,store")]) (define_split [(set (reg:PSI FPSCR_REG) (mem:PSI (match_operand:SI 0 "register_operand" "")))] "TARGET_SH4 && find_regno_note (insn, REG_DEAD, true_regnum (operands[0]))" [(set (match_dup 0) (match_dup 0))] " { rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), gen_rtx (MEM, PSImode, gen_rtx (POST_INC, Pmode, operands[0])))); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[0], NULL_RTX); }") (define_split [(set (reg:PSI FPSCR_REG) (mem:PSI (match_operand:SI 0 "register_operand" "")))] "TARGET_SH4" [(set (match_dup 0) (plus:SI (match_dup 0) (const_int -4)))] " { rtx insn = emit_insn (gen_fpu_switch (get_fpscr_rtx (), gen_rtx (MEM, PSImode, gen_rtx (POST_INC, Pmode, operands[0])))); REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_INC, operands[0], NULL_RTX); }") ;; ??? This uses the fp unit, but has no type indicating that. ;; If we did that, this would either give a bogus latency or introduce ;; a bogus FIFO constraint. ;; Since this insn is currently only used for prologues/epilogues, ;; it is probably best to claim no function unit, which matches the ;; current setting. (define_insn "toggle_sz" [(set (reg:PSI FPSCR_REG) (xor:PSI (reg:PSI FPSCR_REG) (const_int 1048576)))] "TARGET_SH4" "fschg" [(set_attr "fp_set" "unknown")]) (define_expand "addsf3" [(set (match_operand:SF 0 "arith_reg_operand" "") (plus:SF (match_operand:SF 1 "arith_reg_operand" "") (match_operand:SF 2 "arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH2E) { expand_sf_binop (&gen_addsf3_i, operands); DONE; } }") (define_insn "*addsf3_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (plus:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fadd.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn_and_split "unary_sf_op" [(set (match_operand:V2SF 0 "fp_arith_reg_operand" "=f") (vec_select:V2SF (vec_concat:V2SF (vec_select:SF (match_dup 0) (parallel [(not:BI (match_operand 3 "const_int_operand" "n"))])) (match_operator:SF 2 "unary_float_operator" [(vec_select:SF (match_operand:V2SF 1 "fp_arith_reg_operand" "f") (parallel [(match_operand 4 "const_int_operand" "n")]))])) (parallel [(not:BI (match_dup 3)) (match_dup 3)])))] "TARGET_SHMEDIA_FPU" "#" "TARGET_SHMEDIA_FPU && reload_completed" [(set (match_dup 5) (match_dup 6))] " { int endian = TARGET_LITTLE_ENDIAN ? 0 : 1; rtx op1 = gen_rtx_REG (SFmode, (true_regnum (operands[1]) + (INTVAL (operands[4]) ^ endian))); operands[7] = gen_rtx_REG (SFmode, (true_regnum (operands[0]) + (INTVAL (operands[3]) ^ endian))); operands[6] = gen_rtx (GET_CODE (operands[2]), SFmode, op1); }" [(set_attr "type" "fparith_media")]) (define_insn_and_split "binary_sf_op" [(set (match_operand:V2SF 0 "fp_arith_reg_operand" "=f") (vec_select:V2SF (vec_concat:V2SF (vec_select:SF (match_dup 0) (parallel [(match_operand 7 "const_int_operand" "n")])) (match_operator:SF 3 "binary_float_operator" [(vec_select:SF (match_operand:V2SF 1 "fp_arith_reg_operand" "f") (parallel [(match_operand 5 "const_int_operand" "n")])) (vec_select:SF (match_operand:V2SF 2 "fp_arith_reg_operand" "f") (parallel [(match_operand 6 "const_int_operand" "n")]))])) (parallel [(match_dup 7) (match_operand 4 "const_int_operand" "n")])))] "TARGET_SHMEDIA_FPU && INTVAL (operands[4]) != INTVAL (operands[7])" "#" "&& reload_completed" [(set (match_dup 8) (match_dup 9))] " { int endian = TARGET_LITTLE_ENDIAN ? 0 : 1; rtx op1 = gen_rtx_REG (SFmode, (true_regnum (operands[1]) + (INTVAL (operands[5]) ^ endian))); rtx op2 = gen_rtx_REG (SFmode, (true_regnum (operands[2]) + (INTVAL (operands[6]) ^ endian))); operands[8] = gen_rtx_REG (SFmode, (true_regnum (operands[0]) + (INTVAL (operands[4]) ^ endian))); operands[9] = gen_rtx (GET_CODE (operands[3]), SFmode, op1, op2); }" [(set_attr "type" "fparith_media")]) (define_insn "addsf3_i" [(set (match_operand:SF 0 "arith_reg_operand" "=f") (plus:SF (match_operand:SF 1 "arith_reg_operand" "%0") (match_operand:SF 2 "arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH2E" "fadd %2,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_expand "subsf3" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "") (match_operand:SF 2 "fp_arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH2E) { expand_sf_binop (&gen_subsf3_i, operands); DONE; } }") (define_insn "*subsf3_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fsub.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn "subsf3_i" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (minus:SF (match_operand:SF 1 "fp_arith_reg_operand" "0") (match_operand:SF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH2E" "fsub %2,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) ;; Unfortunately, the combiner is unable to cope with the USE of the FPSCR ;; register in feeding fp instructions. Thus, we cannot generate fmac for ;; mixed-precision SH4 targets. To allow it to be still generated for the ;; SH3E, we use a separate insn for SH3E mulsf3. (define_expand "mulsf3" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "") (match_operand:SF 2 "fp_arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) expand_sf_binop (&gen_mulsf3_i4, operands); else if (TARGET_SH2E) emit_insn (gen_mulsf3_ie (operands[0], operands[1], operands[2])); if (! TARGET_SHMEDIA) DONE; }") (define_insn "*mulsf3_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fmul.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn "mulsf3_i4" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%0") (match_operand:SF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH2E" "fmul %2,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "mulsf3_ie" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%0") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SH2E && ! TARGET_SH4" "fmul %2,%0" [(set_attr "type" "fp")]) (define_insn "*mac_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (plus:SF (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%f") (match_operand:SF 2 "fp_arith_reg_operand" "f")) (match_operand:SF 3 "fp_arith_reg_operand" "0")))] "TARGET_SHMEDIA_FPU" "fmac.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn "*macsf3" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (plus:SF (mult:SF (match_operand:SF 1 "fp_arith_reg_operand" "%w") (match_operand:SF 2 "fp_arith_reg_operand" "f")) (match_operand:SF 3 "arith_reg_operand" "0"))) (use (match_operand:PSI 4 "fpscr_operand" "c"))] "TARGET_SH2E && ! TARGET_SH4" "fmac fr0,%2,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_expand "divsf3" [(set (match_operand:SF 0 "arith_reg_operand" "") (div:SF (match_operand:SF 1 "arith_reg_operand" "") (match_operand:SF 2 "arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH2E) { expand_sf_binop (&gen_divsf3_i, operands); DONE; } }") (define_insn "*divsf3_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (div:SF (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fdiv.s %1, %2, %0" [(set_attr "type" "fdiv_media")]) (define_insn "divsf3_i" [(set (match_operand:SF 0 "arith_reg_operand" "=f") (div:SF (match_operand:SF 1 "arith_reg_operand" "0") (match_operand:SF 2 "arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH2E" "fdiv %2,%0" [(set_attr "type" "fdiv") (set_attr "fp_mode" "single")]) (define_insn "floatdisf2" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (float:SF (match_operand:DI 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "float.qs %1, %0" [(set_attr "type" "fpconv_media")]) (define_expand "floatsisf2" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (float:SF (match_operand:SI 1 "fpul_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_sf_insn (gen_floatsisf2_i4 (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*floatsisf2_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (float:SF (match_operand:SI 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "float.ls %1, %0" [(set_attr "type" "fpconv_media")]) (define_insn "floatsisf2_i4" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (float:SF (match_operand:SI 1 "fpul_operand" "y"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "float %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "*floatsisf2_ie" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (float:SF (match_operand:SI 1 "fpul_operand" "y")))] "TARGET_SH2E && ! TARGET_SH4" "float %1,%0" [(set_attr "type" "fp")]) (define_insn "fix_truncsfdi2" [(set (match_operand:DI 0 "fp_arith_reg_operand" "=f") (fix:DI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "ftrc.sq %1, %0" [(set_attr "type" "fpconv_media")]) (define_expand "fix_truncsfsi2" [(set (match_operand:SI 0 "fpul_operand" "=y") (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_sf_insn (gen_fix_truncsfsi2_i4 (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*fix_truncsfsi2_media" [(set (match_operand:SI 0 "fp_arith_reg_operand" "=f") (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "ftrc.sl %1, %0" [(set_attr "type" "fpconv_media")]) (define_insn "fix_truncsfsi2_i4" [(set (match_operand:SI 0 "fpul_operand" "=y") (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "ftrc %1,%0" [(set_attr "type" "ftrc_s") (set_attr "fp_mode" "single")]) ;; ??? This pattern is used nowhere. fix_truncsfsi2 always expands to ;; fix_truncsfsi2_i4. ;; (define_insn "fix_truncsfsi2_i4_2" ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") ;; (fix:SI (match_operand:SF 1 "arith_reg_operand" "f"))) ;; (use (reg:PSI FPSCR_REG)) ;; (clobber (reg:SI FPUL_REG))] ;; "TARGET_SH4" ;; "#" ;; [(set_attr "length" "4") ;; (set_attr "fp_mode" "single")]) ;;(define_split ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") ;; (fix:SI (match_operand:SF 1 "arith_reg_operand" "f"))) ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) ;; (clobber (reg:SI FPUL_REG))] ;; "TARGET_SH4" ;; [(parallel [(set (reg:SI FPUL_REG) (fix:SI (match_dup 1))) ;; (use (match_dup 2))]) ;; (set (match_dup 0) (reg:SI FPUL_REG))]) (define_insn "*fixsfsi" [(set (match_operand:SI 0 "fpul_operand" "=y") (fix:SI (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SH2E && ! TARGET_SH4" "ftrc %1,%0" [(set_attr "type" "fp")]) (define_insn "cmpgtsf_t" [(set (reg:SI T_REG) (gt:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SH2E && ! TARGET_SH4" "fcmp/gt %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "cmpeqsf_t" [(set (reg:SI T_REG) (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SH2E && ! TARGET_SH4" "fcmp/eq %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "ieee_ccmpeqsf_t" [(set (reg:SI T_REG) (ior:SI (reg:SI T_REG) (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f"))))] "TARGET_SH2E && TARGET_IEEE && ! TARGET_SH4" "* return output_ieee_ccmpeq (insn, operands);" [(set_attr "length" "4")]) (define_insn "cmpgtsf_t_i4" [(set (reg:SI T_REG) (gt:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcmp/gt %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "cmpeqsf_t_i4" [(set (reg:SI T_REG) (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcmp/eq %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "single")]) (define_insn "*ieee_ccmpeqsf_t_4" [(set (reg:SI T_REG) (ior:SI (reg:SI T_REG) (eq:SI (match_operand:SF 0 "fp_arith_reg_operand" "f") (match_operand:SF 1 "fp_arith_reg_operand" "f")))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_IEEE && TARGET_SH4" "* return output_ieee_ccmpeq (insn, operands);" [(set_attr "length" "4") (set_attr "fp_mode" "single")]) (define_insn "cmpeqsf_media" [(set (match_operand:DI 0 "register_operand" "=r") (eq:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpeq.s %1, %2, %0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpgtsf_media" [(set (match_operand:DI 0 "register_operand" "=r") (gt:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpgt.s %1, %2, %0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpgesf_media" [(set (match_operand:DI 0 "register_operand" "=r") (ge:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpge.s %1, %2, %0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpunsf_media" [(set (match_operand:DI 0 "register_operand" "=r") (unordered:DI (match_operand:SF 1 "fp_arith_reg_operand" "f") (match_operand:SF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpun.s %1, %2, %0" [(set_attr "type" "fcmp_media")]) (define_expand "cmpsf" [(set (reg:SI T_REG) (compare (match_operand:SF 0 "arith_operand" "") (match_operand:SF 1 "arith_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { sh_compare_op0 = operands[0]; sh_compare_op1 = operands[1]; DONE; }") (define_expand "negsf2" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH2E) { expand_sf_unop (&gen_negsf2_i, operands); DONE; } }") (define_insn "*negsf2_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fneg.s %1, %0" [(set_attr "type" "fmove_media")]) (define_insn "negsf2_i" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (neg:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH2E" "fneg %0" [(set_attr "type" "fmove") (set_attr "fp_mode" "single")]) (define_expand "sqrtsf2" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] "TARGET_SH3E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH3E) { expand_sf_unop (&gen_sqrtsf2_i, operands); DONE; } }") (define_insn "*sqrtsf2_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fsqrt.s %1, %0" [(set_attr "type" "fdiv_media")]) (define_insn "sqrtsf2_i" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (sqrt:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH3E" "fsqrt %0" [(set_attr "type" "fdiv") (set_attr "fp_mode" "single")]) (define_expand "abssf2" [(set (match_operand:SF 0 "fp_arith_reg_operand" "") (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "")))] "TARGET_SH2E || TARGET_SHMEDIA_FPU" " { if (TARGET_SH2E) { expand_sf_unop (&gen_abssf2_i, operands); DONE; } }") (define_insn "*abssf2_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fabs.s %1, %0" [(set_attr "type" "fmove_media")]) (define_insn "abssf2_i" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (abs:SF (match_operand:SF 1 "fp_arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH2E" "fabs %0" [(set_attr "type" "fmove") (set_attr "fp_mode" "single")]) (define_expand "adddf3" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "") (match_operand:DF 2 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_binop (&gen_adddf3_i, operands); DONE; } }") (define_insn "*adddf3_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "%f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fadd.d %1, %2, %0" [(set_attr "type" "dfparith_media")]) (define_insn "adddf3_i" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (plus:DF (match_operand:DF 1 "fp_arith_reg_operand" "%0") (match_operand:DF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH4" "fadd %2,%0" [(set_attr "type" "dfp_arith") (set_attr "fp_mode" "double")]) (define_expand "subdf3" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "") (match_operand:DF 2 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_binop (&gen_subdf3_i, operands); DONE; } }") (define_insn "*subdf3_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fsub.d %1, %2, %0" [(set_attr "type" "dfparith_media")]) (define_insn "subdf3_i" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (minus:DF (match_operand:DF 1 "fp_arith_reg_operand" "0") (match_operand:DF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH4" "fsub %2,%0" [(set_attr "type" "dfp_arith") (set_attr "fp_mode" "double")]) (define_expand "muldf3" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "") (match_operand:DF 2 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_binop (&gen_muldf3_i, operands); DONE; } }") (define_insn "*muldf3_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "%f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fmul.d %1, %2, %0" [(set_attr "type" "dfmul_media")]) (define_insn "muldf3_i" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (mult:DF (match_operand:DF 1 "fp_arith_reg_operand" "%0") (match_operand:DF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH4" "fmul %2,%0" [(set_attr "type" "dfp_arith") (set_attr "fp_mode" "double")]) (define_expand "divdf3" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "") (match_operand:DF 2 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_binop (&gen_divdf3_i, operands); DONE; } }") (define_insn "*divdf3_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fdiv.d %1, %2, %0" [(set_attr "type" "dfdiv_media")]) (define_insn "divdf3_i" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (div:DF (match_operand:DF 1 "fp_arith_reg_operand" "0") (match_operand:DF 2 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 3 "fpscr_operand" "c"))] "TARGET_SH4" "fdiv %2,%0" [(set_attr "type" "dfdiv") (set_attr "fp_mode" "double")]) (define_insn "floatdidf2" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (float:DF (match_operand:DI 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "float.qd %1, %0" [(set_attr "type" "dfpconv_media")]) (define_expand "floatsidf2" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (float:DF (match_operand:SI 1 "fpul_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_df_insn (gen_floatsidf2_i (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*floatsidf2_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (float:DF (match_operand:SI 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "float.ld %1, %0" [(set_attr "type" "dfpconv_media")]) (define_insn "floatsidf2_i" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (float:DF (match_operand:SI 1 "fpul_operand" "y"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "float %1,%0" [(set_attr "type" "dfp_conv") (set_attr "fp_mode" "double")]) (define_insn "fix_truncdfdi2" [(set (match_operand:DI 0 "fp_arith_reg_operand" "=f") (fix:DI (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "ftrc.dq %1, %0" [(set_attr "type" "dfpconv_media")]) (define_expand "fix_truncdfsi2" [(set (match_operand:SI 0 "fpul_operand" "") (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_df_insn (gen_fix_truncdfsi2_i (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*fix_truncdfsi2_media" [(set (match_operand:SI 0 "fp_arith_reg_operand" "=f") (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "ftrc.dl %1, %0" [(set_attr "type" "dfpconv_media")]) (define_insn "fix_truncdfsi2_i" [(set (match_operand:SI 0 "fpul_operand" "=y") (fix:SI (match_operand:DF 1 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "ftrc %1,%0" [(set_attr "type" "dfp_conv") (set_attr "dfp_comp" "no") (set_attr "fp_mode" "double")]) ;; ??? This pattern is used nowhere. fix_truncdfsi2 always expands to ;; fix_truncdfsi2_i. ;; (define_insn "fix_truncdfsi2_i4" ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") ;; (fix:SI (match_operand:DF 1 "arith_reg_operand" "f"))) ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) ;; (clobber (reg:SI FPUL_REG))] ;; "TARGET_SH4" ;; "#" ;; [(set_attr "length" "4") ;; (set_attr "fp_mode" "double")]) ;; ;; (define_split ;; [(set (match_operand:SI 0 "arith_reg_operand" "=r") ;; (fix:SI (match_operand:DF 1 "arith_reg_operand" "f"))) ;; (use (match_operand:PSI 2 "fpscr_operand" "c")) ;; (clobber (reg:SI FPUL_REG))] ;; "TARGET_SH4" ;; [(parallel [(set (reg:SI FPUL_REG) (fix:SI (match_dup 1))) ;; (use (match_dup 2))]) ;; (set (match_dup 0) (reg:SI FPUL_REG))]) (define_insn "cmpgtdf_t" [(set (reg:SI T_REG) (gt:SI (match_operand:DF 0 "arith_reg_operand" "f") (match_operand:DF 1 "arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcmp/gt %1,%0" [(set_attr "type" "dfp_cmp") (set_attr "fp_mode" "double")]) (define_insn "cmpeqdf_t" [(set (reg:SI T_REG) (eq:SI (match_operand:DF 0 "arith_reg_operand" "f") (match_operand:DF 1 "arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcmp/eq %1,%0" [(set_attr "type" "dfp_cmp") (set_attr "fp_mode" "double")]) (define_insn "*ieee_ccmpeqdf_t" [(set (reg:SI T_REG) (ior:SI (reg:SI T_REG) (eq:SI (match_operand:DF 0 "arith_reg_operand" "f") (match_operand:DF 1 "arith_reg_operand" "f")))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_IEEE && TARGET_SH4" "* return output_ieee_ccmpeq (insn, operands);" [(set_attr "length" "4") (set_attr "fp_mode" "double")]) (define_insn "cmpeqdf_media" [(set (match_operand:DI 0 "register_operand" "=r") (eq:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpeq.d %1,%2,%0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpgtdf_media" [(set (match_operand:DI 0 "register_operand" "=r") (gt:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpgt.d %1,%2,%0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpgedf_media" [(set (match_operand:DI 0 "register_operand" "=r") (ge:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpge.d %1,%2,%0" [(set_attr "type" "fcmp_media")]) (define_insn "cmpundf_media" [(set (match_operand:DI 0 "register_operand" "=r") (unordered:DI (match_operand:DF 1 "fp_arith_reg_operand" "f") (match_operand:DF 2 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcmpun.d %1,%2,%0" [(set_attr "type" "fcmp_media")]) (define_expand "cmpdf" [(set (reg:SI T_REG) (compare (match_operand:DF 0 "arith_operand" "") (match_operand:DF 1 "arith_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { sh_compare_op0 = operands[0]; sh_compare_op1 = operands[1]; DONE; }") (define_expand "negdf2" [(set (match_operand:DF 0 "arith_reg_operand" "") (neg:DF (match_operand:DF 1 "arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_unop (&gen_negdf2_i, operands); DONE; } }") (define_insn "*negdf2_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (neg:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fneg.d %1, %0" [(set_attr "type" "fmove_media")]) (define_insn "negdf2_i" [(set (match_operand:DF 0 "arith_reg_operand" "=f") (neg:DF (match_operand:DF 1 "arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fneg %0" [(set_attr "type" "fmove") (set_attr "fp_mode" "double")]) (define_expand "sqrtdf2" [(set (match_operand:DF 0 "arith_reg_operand" "") (sqrt:DF (match_operand:DF 1 "arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_unop (&gen_sqrtdf2_i, operands); DONE; } }") (define_insn "*sqrtdf2_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (sqrt:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fsqrt.d %1, %0" [(set_attr "type" "dfdiv_media")]) (define_insn "sqrtdf2_i" [(set (match_operand:DF 0 "arith_reg_operand" "=f") (sqrt:DF (match_operand:DF 1 "arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fsqrt %0" [(set_attr "type" "dfdiv") (set_attr "fp_mode" "double")]) (define_expand "absdf2" [(set (match_operand:DF 0 "arith_reg_operand" "") (abs:DF (match_operand:DF 1 "arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { expand_df_unop (&gen_absdf2_i, operands); DONE; } }") (define_insn "*absdf2_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (abs:DF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fabs.d %1, %0" [(set_attr "type" "fmove_media")]) (define_insn "absdf2_i" [(set (match_operand:DF 0 "arith_reg_operand" "=f") (abs:DF (match_operand:DF 1 "arith_reg_operand" "0"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fabs %0" [(set_attr "type" "fmove") (set_attr "fp_mode" "double")]) (define_expand "extendsfdf2" [(set (match_operand:DF 0 "fp_arith_reg_operand" "") (float_extend:DF (match_operand:SF 1 "fpul_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_df_insn (gen_extendsfdf2_i4 (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*extendsfdf2_media" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (float_extend:DF (match_operand:SF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcnv.sd %1, %0" [(set_attr "type" "dfpconv_media")]) (define_insn "extendsfdf2_i4" [(set (match_operand:DF 0 "fp_arith_reg_operand" "=f") (float_extend:DF (match_operand:SF 1 "fpul_operand" "y"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcnvsd %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "double")]) (define_expand "truncdfsf2" [(set (match_operand:SF 0 "fpul_operand" "") (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "")))] "TARGET_SH4 || TARGET_SHMEDIA_FPU" " { if (TARGET_SH4) { emit_df_insn (gen_truncdfsf2_i4 (operands[0], operands[1], get_fpscr_rtx ())); DONE; } }") (define_insn "*truncdfsf2_media" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "f")))] "TARGET_SHMEDIA_FPU" "fcnv.ds %1, %0" [(set_attr "type" "dfpconv_media")]) (define_insn "truncdfsf2_i4" [(set (match_operand:SF 0 "fpul_operand" "=y") (float_truncate:SF (match_operand:DF 1 "fp_arith_reg_operand" "f"))) (use (match_operand:PSI 2 "fpscr_operand" "c"))] "TARGET_SH4" "fcnvds %1,%0" [(set_attr "type" "fp") (set_attr "fp_mode" "double")]) ;; Bit field extract patterns. These give better code for packed bitfields, ;; because they allow auto-increment addresses to be generated. (define_expand "insv" [(set (zero_extract:SI (match_operand:QI 0 "memory_operand" "") (match_operand:SI 1 "immediate_operand" "") (match_operand:SI 2 "immediate_operand" "")) (match_operand:SI 3 "general_operand" ""))] "TARGET_SH1 && ! TARGET_LITTLE_ENDIAN" " { rtx addr_target, orig_address, shift_reg, qi_val; HOST_WIDE_INT bitsize, size, v; rtx x = operands[3]; /* ??? expmed doesn't care for non-register predicates. */ if (! memory_operand (operands[0], VOIDmode) || ! immediate_operand (operands[1], VOIDmode) || ! immediate_operand (operands[2], VOIDmode) || ! general_operand (x, VOIDmode)) FAIL; /* If this isn't a 16 / 24 / 32 bit field, or if it doesn't start on a byte boundary, then fail. */ bitsize = INTVAL (operands[1]); if (bitsize < 16 || bitsize > 32 || bitsize % 8 != 0 || (INTVAL (operands[2]) % 8) != 0) FAIL; size = bitsize / 8; orig_address = XEXP (operands[0], 0); shift_reg = gen_reg_rtx (SImode); if (GET_CODE (x) == CONST_INT) { v = INTVAL (x); qi_val = force_reg (QImode, GEN_INT (trunc_int_for_mode (v, QImode))); } else { emit_insn (gen_movsi (shift_reg, operands[3])); qi_val = gen_rtx_SUBREG (QImode, shift_reg, 3); } addr_target = copy_addr_to_reg (plus_constant (orig_address, size - 1)); operands[0] = replace_equiv_address (operands[0], addr_target); emit_insn (gen_movqi (operands[0], qi_val)); while (size -= 1) { if (GET_CODE (x) == CONST_INT) qi_val = force_reg (QImode, GEN_INT (trunc_int_for_mode (v >>= 8, QImode))); else { emit_insn (gen_lshrsi3_k (shift_reg, shift_reg, GEN_INT (8))); qi_val = gen_rtx_SUBREG (QImode, shift_reg, 3); } emit_insn (gen_addsi3 (addr_target, addr_target, GEN_INT (-1))); emit_insn (gen_movqi (operands[0], qi_val)); } DONE; }") ;; ------------------------------------------------------------------------- ;; Peepholes ;; ------------------------------------------------------------------------- ;; This matches cases where a stack pointer increment at the start of the ;; epilogue combines with a stack slot read loading the return value. (define_peephole [(set (match_operand:SI 0 "arith_reg_operand" "") (mem:SI (match_operand:SI 1 "arith_reg_operand" ""))) (set (match_dup 1) (plus:SI (match_dup 1) (const_int 4)))] "TARGET_SH1 && REGNO (operands[1]) != REGNO (operands[0])" "mov.l @%1+,%0") ;; See the comment on the dt combiner pattern above. (define_peephole [(set (match_operand:SI 0 "arith_reg_operand" "=r") (plus:SI (match_dup 0) (const_int -1))) (set (reg:SI T_REG) (eq:SI (match_dup 0) (const_int 0)))] "TARGET_SH2" "dt %0") ;; These convert sequences such as `mov #k,r0; add r15,r0; mov.l @r0,rn' ;; to `mov #k,r0; mov.l @(r0,r15),rn'. These sequences are generated by ;; reload when the constant is too large for a reg+offset address. ;; ??? We would get much better code if this was done in reload. This would ;; require modifying find_reloads_address to recognize that if the constant ;; is out-of-range for an immediate add, then we get better code by reloading ;; the constant into a register than by reloading the sum into a register, ;; since the former is one instruction shorter if the address does not need ;; to be offsettable. Unfortunately this does not work, because there is ;; only one register, r0, that can be used as an index register. This register ;; is also the function return value register. So, if we try to force reload ;; to use double-reg addresses, then we end up with some instructions that ;; need to use r0 twice. The only way to fix this is to change the calling ;; convention so that r0 is not used to return values. (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (mem:SI (match_dup 0)) (match_operand:SI 2 "general_movsrc_operand" ""))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.l %2,@(%0,%1)") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (match_operand:SI 2 "general_movdst_operand" "") (mem:SI (match_dup 0)))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.l @(%0,%1),%2") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (mem:HI (match_dup 0)) (match_operand:HI 2 "general_movsrc_operand" ""))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.w %2,@(%0,%1)") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (match_operand:HI 2 "general_movdst_operand" "") (mem:HI (match_dup 0)))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.w @(%0,%1),%2") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (mem:QI (match_dup 0)) (match_operand:QI 2 "general_movsrc_operand" ""))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.b %2,@(%0,%1)") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (match_operand:QI 2 "general_movdst_operand" "") (mem:QI (match_dup 0)))] "TARGET_SH1 && REGNO (operands[0]) == 0 && reg_unused_after (operands[0], insn)" "mov.b @(%0,%1),%2") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (mem:SF (match_dup 0)) (match_operand:SF 2 "general_movsrc_operand" ""))] "TARGET_SH1 && REGNO (operands[0]) == 0 && ((GET_CODE (operands[2]) == REG && REGNO (operands[2]) < 16) || (GET_CODE (operands[2]) == SUBREG && REGNO (SUBREG_REG (operands[2])) < 16)) && reg_unused_after (operands[0], insn)" "mov.l %2,@(%0,%1)") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (match_operand:SF 2 "general_movdst_operand" "") (mem:SF (match_dup 0)))] "TARGET_SH1 && REGNO (operands[0]) == 0 && ((GET_CODE (operands[2]) == REG && REGNO (operands[2]) < 16) || (GET_CODE (operands[2]) == SUBREG && REGNO (SUBREG_REG (operands[2])) < 16)) && reg_unused_after (operands[0], insn)" "mov.l @(%0,%1),%2") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (mem:SF (match_dup 0)) (match_operand:SF 2 "general_movsrc_operand" ""))] "TARGET_SH2E && REGNO (operands[0]) == 0 && ((GET_CODE (operands[2]) == REG && FP_OR_XD_REGISTER_P (REGNO (operands[2]))) || (GET_CODE (operands[2]) == SUBREG && FP_OR_XD_REGISTER_P (REGNO (SUBREG_REG (operands[2]))))) && reg_unused_after (operands[0], insn)" "fmov{.s|} %2,@(%0,%1)") (define_peephole [(set (match_operand:SI 0 "register_operand" "=r") (plus:SI (match_dup 0) (match_operand:SI 1 "register_operand" "r"))) (set (match_operand:SF 2 "general_movdst_operand" "") (mem:SF (match_dup 0)))] "TARGET_SH2E && REGNO (operands[0]) == 0 && ((GET_CODE (operands[2]) == REG && FP_OR_XD_REGISTER_P (REGNO (operands[2]))) || (GET_CODE (operands[2]) == SUBREG && FP_OR_XD_REGISTER_P (REGNO (SUBREG_REG (operands[2]))))) && reg_unused_after (operands[0], insn)" "fmov{.s|} @(%0,%1),%2") ;; Switch to a new stack with its address in sp_switch (a SYMBOL_REF). */ (define_insn "sp_switch_1" [(const_int 1)] "TARGET_SH1" "* { rtx xoperands[1]; xoperands[0] = sp_switch; output_asm_insn (\"mov.l r0,@-r15\;mov.l %0,r0\", xoperands); output_asm_insn (\"mov.l @r0,r0\;mov.l r15,@-r0\", xoperands); return \"mov r0,r15\"; }" [(set_attr "length" "10")]) ;; Switch back to the original stack for interrupt functions with the ;; sp_switch attribute. */ (define_insn "sp_switch_2" [(const_int 2)] "TARGET_SH1" "mov.l @r15+,r15\;mov.l @r15+,r0" [(set_attr "length" "4")]) ;; Integer vector moves (define_expand "movv8qi" [(set (match_operand:V8QI 0 "general_movdst_operand" "") (match_operand:V8QI 1 "general_movsrc_operand" ""))] "TARGET_SHMEDIA" "{ if (prepare_move_operands (operands, V8QImode)) DONE; }") (define_insn "movv8qi_i" [(set (match_operand:V8QI 0 "general_movdst_operand" "=r,r,r,rl,m") (match_operand:V8QI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], V8QImode) || sh_register_operand (operands[1], V8QImode))" "@ add %1, r63, %0 movi %1, %0 # ld%M1.q %m1, %0 st%M0.q %m0, %N1" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") (set_attr "length" "4,4,16,4,4")]) (define_split [(set (match_operand:V8QI 0 "arith_reg_dest" "") (subreg:V8QI (const_int 0) 0))] "TARGET_SHMEDIA" [(set (match_dup 0) (const_vector:V8QI [(const_int 0) (const_int 0) (const_int 0) (const_int 0) (const_int 0) (const_int 0) (const_int 0) (const_int 0)]))]) (define_split [(set (match_operand 0 "arith_reg_dest" "") (match_operand 1 "sh_rep_vec" ""))] "TARGET_SHMEDIA && reload_completed && GET_MODE (operands[0]) == GET_MODE (operands[1]) && VECTOR_MODE_SUPPORTED_P (GET_MODE (operands[0])) && GET_MODE_SIZE (GET_MODE (operands[0])) == 8 && (XVECEXP (operands[1], 0, 0) != const0_rtx || XVECEXP (operands[1], 0, 1) != const0_rtx) && (XVECEXP (operands[1], 0, 0) != constm1_rtx || XVECEXP (operands[1], 0, 1) != constm1_rtx)" [(set (match_dup 0) (match_dup 1)) (match_dup 2)] " { int unit_size = GET_MODE_UNIT_SIZE (GET_MODE (operands[1])); rtx elt1 = XVECEXP (operands[1], 0, 1); if (unit_size > 2) operands[2] = gen_mshflo_l (operands[0], operands[0], operands[0]); else { if (unit_size < 2) operands[0] = gen_rtx_REG (V4HImode, true_regnum (operands[0])); operands[2] = gen_mperm_w0 (operands[0], operands[0]); } operands[0] = gen_rtx_REG (DImode, true_regnum (operands[0])); operands[1] = XVECEXP (operands[1], 0, 0); if (unit_size < 2) { if (GET_CODE (operands[1]) == CONST_INT && GET_CODE (elt1) == CONST_INT) operands[1] = GEN_INT (TARGET_LITTLE_ENDIAN ? (INTVAL (operands[1]) & 0xff) + (INTVAL (elt1) << 8) : (INTVAL (operands[1]) << 8) + (INTVAL (elt1) & 0xff)); else { operands[0] = gen_rtx_REG (V2QImode, true_regnum (operands[0])); operands[1] = gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, operands[1], elt1)); } } }") (define_split [(set (match_operand 0 "arith_reg_dest" "") (match_operand 1 "sh_const_vec" ""))] "TARGET_SHMEDIA && reload_completed && GET_MODE (operands[0]) == GET_MODE (operands[1]) && VECTOR_MODE_SUPPORTED_P (GET_MODE (operands[0])) && operands[1] != CONST0_RTX (GET_MODE (operands[1]))" [(set (match_dup 0) (match_dup 1))] " { rtx v = operands[1]; enum machine_mode new_mode = mode_for_size (GET_MODE_BITSIZE (GET_MODE (v)), MODE_INT, 0); operands[0] = gen_rtx_REG (new_mode, true_regnum (operands[0])); operands[1] = simplify_subreg (new_mode, operands[1], GET_MODE (operands[1]), 0); }") (define_expand "movv2hi" [(set (match_operand:V2HI 0 "general_movdst_operand" "") (match_operand:V2HI 1 "general_movsrc_operand" ""))] "TARGET_SHMEDIA" "{ if (prepare_move_operands (operands, V2HImode)) DONE; }") (define_insn "movv2hi_i" [(set (match_operand:V2HI 0 "general_movdst_operand" "=r,r,r,rl,m") (match_operand:V2HI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], V2HImode) || sh_register_operand (operands[1], V2HImode))" "@ addz.l %1, r63, %0 movi %1, %0 # ld%M1.l %m1, %0 st%M0.l %m0, %N1" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") (set_attr "length" "4,4,16,4,4")]) (define_expand "movv4hi" [(set (match_operand:V4HI 0 "general_movdst_operand" "") (match_operand:V4HI 1 "general_movsrc_operand" ""))] "TARGET_SHMEDIA" "{ if (prepare_move_operands (operands, V4HImode)) DONE; }") (define_insn "movv4hi_i" [(set (match_operand:V4HI 0 "general_movdst_operand" "=r,r,r,rl,m") (match_operand:V4HI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], V4HImode) || sh_register_operand (operands[1], V4HImode))" "@ add %1, r63, %0 movi %1, %0 # ld%M1.q %m1, %0 st%M0.q %m0, %N1" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") (set_attr "length" "4,4,16,4,4")]) (define_expand "movv2si" [(set (match_operand:V2SI 0 "general_movdst_operand" "") (match_operand:V2SI 1 "general_movsrc_operand" ""))] "TARGET_SHMEDIA" "{ if (prepare_move_operands (operands, V2SImode)) DONE; }") (define_insn "movv2si_i" [(set (match_operand:V2SI 0 "general_movdst_operand" "=r,r,r,rl,m") (match_operand:V2SI 1 "general_movsrc_operand" "r,I16C16Z,nW,m,rlZ"))] "TARGET_SHMEDIA && (register_operand (operands[0], V2SImode) || sh_register_operand (operands[1], V2SImode))" "@ add %1, r63, %0 # # ld%M1.q %m1, %0 st%M0.q %m0, %N1" [(set_attr "type" "arith_media,arith_media,*,load_media,store_media") (set_attr "length" "4,4,16,4,4")]) ;; Multimedia Intrinsics (define_insn "absv2si2" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (abs:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mabs.l %1, %0" [(set_attr "type" "mcmp_media")]) (define_insn "absv4hi2" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (abs:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mabs.w %1, %0" [(set_attr "type" "mcmp_media")]) (define_insn "addv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (plus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "%r") (match_operand:V2SI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "madd.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "addv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (plus:V4HI (match_operand:V4HI 1 "arith_reg_operand" "%r") (match_operand:V4HI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "madd.w %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "ssaddv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_plus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "%r") (match_operand:V2SI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "madds.l %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "usaddv8qi3" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (us_plus:V8QI (match_operand:V8QI 1 "arith_reg_operand" "%r") (match_operand:V8QI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "madds.ub %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "ssaddv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ss_plus:V4HI (match_operand:V4HI 1 "arith_reg_operand" "%r") (match_operand:V4HI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "madds.w %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpeqv8qi" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (neg:V8QI (eq:V8QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpeq.b %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpeqv2si" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (neg:V2SI (eq:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpeq.l %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpeqv4hi" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (neg:V4HI (eq:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpeq.w %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpgtuv8qi" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (neg:V8QI (gtu:V8QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpgt.ub %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpgtv2si" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (neg:V2SI (gt:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpgt.l %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "negcmpgtv4hi" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (neg:V4HI (gt:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "%rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcmpgt.w %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "mcmv" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_operand" "r")) (and:DI (match_operand:DI 3 "arith_reg_operand" "0") (not:DI (match_dup 2)))))] "TARGET_SHMEDIA" "mcmv %N1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "mcnvs_lw" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_concat:V4HI (ss_truncate:V2HI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ")) (ss_truncate:V2HI (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcnvs.lw %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "mcnvs_wb" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (vec_concat:V8QI (ss_truncate:V4QI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ")) (ss_truncate:V4QI (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcnvs.wb %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "mcnvs_wub" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (vec_concat:V8QI (us_truncate:V4QI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ")) (us_truncate:V4QI (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mcnvs.wub %N1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "mextr_rl" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (lshiftrt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:HI 3 "mextr_bit_offset" "i")) (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (match_operand:HI 4 "mextr_bit_offset" "i"))))] "TARGET_SHMEDIA && INTVAL (operands[3]) + INTVAL (operands[4]) == 64" "* { static char templ[16]; sprintf (templ, \"mextr%d\\t%%N1, %%N2, %%0\", (int) INTVAL (operands[3]) >> 3); return templ; }" [(set_attr "type" "arith_media")]) (define_insn "*mextr_lr" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:HI 3 "mextr_bit_offset" "i")) (lshiftrt:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (match_operand:HI 4 "mextr_bit_offset" "i"))))] "TARGET_SHMEDIA && INTVAL (operands[3]) + INTVAL (operands[4]) == 64" "* { static char templ[16]; sprintf (templ, \"mextr%d\\t%%N2, %%N1, %%0\", (int) INTVAL (operands[4]) >> 3); return templ; }" [(set_attr "type" "arith_media")]) ; mextrN can be modelled with vec_select / vec_concat, but the selection ; vector then varies depending on endianness. (define_expand "mextr1" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (1 * 8), GEN_INT (7 * 8))); DONE; }") (define_expand "mextr2" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (2 * 8), GEN_INT (6 * 8))); DONE; }") (define_expand "mextr3" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (3 * 8), GEN_INT (5 * 8))); DONE; }") (define_expand "mextr4" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (4 * 8), GEN_INT (4 * 8))); DONE; }") (define_expand "mextr5" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (5 * 8), GEN_INT (3 * 8))); DONE; }") (define_expand "mextr6" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (6 * 8), GEN_INT (2 * 8))); DONE; }") (define_expand "mextr7" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn (gen_mextr_rl (operands[0], operands[1], operands[2], GEN_INT (7 * 8), GEN_INT (1 * 8))); DONE; }") (define_expand "mmacfx_wl" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V2HI 1 "extend_reg_operand" "") (match_operand:V2HI 2 "extend_reg_operand" "") (match_operand:V2SI 3 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn (gen_mmacfx_wl_i (operands[0], operands[3], operands[1], operands[2])); DONE; }") (define_insn "mmacfx_wl_i" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_plus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "0") (ss_truncate:V2SI (ashift:V2DI (sign_extend:V2DI (mult:V2SI (sign_extend:V2SI (match_operand:V2HI 2 "extend_reg_operand" "r")) (sign_extend:V2SI (match_operand:V2HI 3 "extend_reg_operand" "r")))) (const_int 1)))))] "TARGET_SHMEDIA" "mmacfx.wl %2, %3, %0" [(set_attr "type" "mac_media")]) (define_expand "mmacnfx_wl" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V2HI 1 "extend_reg_operand" "") (match_operand:V2HI 2 "extend_reg_operand" "") (match_operand:V2SI 3 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn (gen_mmacnfx_wl_i (operands[0], operands[3], operands[1], operands[2])); DONE; }") (define_insn "mmacnfx_wl_i" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_minus:V2SI (match_operand:V2SI 1 "arith_reg_operand" "0") (ss_truncate:V2SI (ashift:V2DI (sign_extend:V2DI (mult:V2SI (sign_extend:V2SI (match_operand:V2HI 2 "extend_reg_operand" "r")) (sign_extend:V2SI (match_operand:V2HI 3 "extend_reg_operand" "r")))) (const_int 1)))))] "TARGET_SHMEDIA" "mmacnfx.wl %2, %3, %0" [(set_attr "type" "mac_media")]) (define_insn "mulv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (mult:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") (match_operand:V2SI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mmul.l %1, %2, %0" [(set_attr "type" "d2mpy_media")]) (define_insn "mulv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (mult:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (match_operand:V4HI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mmul.w %1, %2, %0" [(set_attr "type" "dmpy_media")]) (define_insn "mmulfx_l" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_truncate:V2SI (ashiftrt:V2DI (mult:V2DI (sign_extend:V2DI (match_operand:V2SI 1 "arith_reg_operand" "r")) (sign_extend:V2DI (match_operand:V2SI 2 "arith_reg_operand" "r"))) (const_int 31))))] "TARGET_SHMEDIA" "mmulfx.l %1, %2, %0" [(set_attr "type" "d2mpy_media")]) (define_insn "mmulfx_w" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ss_truncate:V4HI (ashiftrt:V4SI (mult:V4SI (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) (const_int 15))))] "TARGET_SHMEDIA" "mmulfx.w %1, %2, %0" [(set_attr "type" "dmpy_media")]) (define_insn "mmulfxrp_w" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ss_truncate:V4HI (ashiftrt:V4SI (plus:V4SI (mult:V4SI (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) (const_int 16384)) (const_int 15))))] "TARGET_SHMEDIA" "mmulfxrp.w %1, %2, %0" [(set_attr "type" "dmpy_media")]) (define_expand "mmulhi_wl" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V4HI 1 "arith_reg_operand" "") (match_operand:V4HI 2 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mmul23_wl : gen_mmul01_wl) (operands[0], operands[1], operands[2])); DONE; }") (define_expand "mmullo_wl" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V4HI 1 "arith_reg_operand" "") (match_operand:V4HI 2 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mmul01_wl : gen_mmul23_wl) (operands[0], operands[1], operands[2])); DONE; }") (define_insn "mmul23_wl" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (vec_select:V2SI (mult:V4SI (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) (parallel [(const_int 2) (const_int 3)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mmulhi.wl %1, %2, %0\" : \"mmullo.wl %1, %2, %0\");" [(set_attr "type" "dmpy_media")]) (define_insn "mmul01_wl" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (vec_select:V2SI (mult:V4SI (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) (sign_extend:V4SI (match_operand:V4HI 2 "arith_reg_operand" "r"))) (parallel [(const_int 0) (const_int 1)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mmullo.wl %1, %2, %0\" : \"mmulhi.wl %1, %2, %0\");" [(set_attr "type" "dmpy_media")]) (define_expand "mmulsum_wq" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:V4HI 1 "arith_reg_operand" "") (match_operand:V4HI 2 "arith_reg_operand" "") (match_operand:DI 3 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn (gen_mmulsum_wq_i (operands[0], operands[3], operands[1], operands[2])); DONE; }") (define_insn "mmulsum_wq_i" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (plus:DI (match_operand:DI 1 "arith_reg_operand" "0") (plus:DI (plus:DI (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_operand:V4HI 2 "arith_reg_operand" "r")) (sign_extend:V4DI (match_operand:V4HI 3 "arith_reg_operand" "r"))) (parallel [(const_int 0)])) (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) (sign_extend:V4DI (match_dup 3))) (parallel [(const_int 1)]))) (plus:DI (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) (sign_extend:V4DI (match_dup 3))) (parallel [(const_int 2)])) (vec_select:DI (mult:V4DI (sign_extend:V4DI (match_dup 2)) (sign_extend:V4DI (match_dup 3))) (parallel [(const_int 3)]))))))] "TARGET_SHMEDIA" "mmulsum.wq %2, %3, %0" [(set_attr "type" "mac_media")]) (define_expand "mperm_w" [(match_operand:V4HI 0 "arith_reg_dest" "=r") (match_operand:V4HI 1 "arith_reg_operand" "r") (match_operand:QI 2 "extend_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mperm_w_little : gen_mperm_w_big) (operands[0], operands[1], operands[2])); DONE; }") ; This use of vec_select isn't exactly correct according to rtl.texi ; (because not constant), but it seems a straightforward extension. (define_insn "mperm_w_little" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_select:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (parallel [(zero_extract:QI (match_operand:QI 2 "extend_reg_or_0_operand" "rZ") (const_int 2) (const_int 0)) (zero_extract:QI (match_dup 2) (const_int 2) (const_int 2)) (zero_extract:QI (match_dup 2) (const_int 2) (const_int 4)) (zero_extract:QI (match_dup 2) (const_int 2) (const_int 6))])))] "TARGET_SHMEDIA && TARGET_LITTLE_ENDIAN" "mperm.w %1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn "mperm_w_big" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_select:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (parallel [(zero_extract:QI (not:QI (match_operand:QI 2 "extend_reg_or_0_operand" "rZ")) (const_int 2) (const_int 0)) (zero_extract:QI (not:QI (match_dup 2)) (const_int 2) (const_int 2)) (zero_extract:QI (not:QI (match_dup 2)) (const_int 2) (const_int 4)) (zero_extract:QI (not:QI (match_dup 2)) (const_int 2) (const_int 6))])))] "TARGET_SHMEDIA && ! TARGET_LITTLE_ENDIAN" "mperm.w %1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn "mperm_w0" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_duplicate:V4HI (truncate:HI (match_operand 1 "trunc_hi_operand" "r"))))] "TARGET_SHMEDIA" "mperm.w %1, r63, %0" [(set_attr "type" "arith_media")]) (define_expand "msad_ubq" [(match_operand:DI 0 "arith_reg_dest" "") (match_operand:V8QI 1 "arith_reg_or_0_operand" "") (match_operand:V8QI 2 "arith_reg_or_0_operand" "") (match_operand:DI 3 "arith_reg_operand" "")] "TARGET_SHMEDIA" " { emit_insn (gen_msad_ubq_i (operands[0], operands[3], operands[1], operands[2])); DONE; }") (define_insn "msad_ubq_i" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (plus:DI (plus:DI (plus:DI (plus:DI (match_operand:DI 1 "arith_reg_operand" "0") (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) (zero_extend:V8DI (match_operand:V8QI 3 "arith_reg_or_0_operand" "rZ"))) (parallel [(const_int 0)])))) (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 1)])))) (plus:DI (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 2)]))) (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 3)]))))) (plus:DI (plus:DI (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 4)]))) (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 5)])))) (plus:DI (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 6)]))) (abs:DI (vec_select:DI (minus:V8DI (zero_extend:V8DI (match_dup 2)) (zero_extend:V8DI (match_dup 3))) (parallel [(const_int 7)])))))))] "TARGET_SHMEDIA" "msad.ubq %N2, %N3, %0" [(set_attr "type" "mac_media")]) (define_insn "mshalds_l" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_truncate:V2SI (ashift:V2DI (sign_extend:V2DI (match_operand:V2SI 1 "arith_reg_operand" "r")) (and:DI (match_operand:DI 2 "arith_reg_operand" "r") (const_int 31)))))] "TARGET_SHMEDIA" "mshalds.l %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "mshalds_w" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ss_truncate:V4HI (ashift:V4SI (sign_extend:V4SI (match_operand:V4HI 1 "arith_reg_operand" "r")) (and:DI (match_operand:DI 2 "arith_reg_operand" "r") (const_int 15)))))] "TARGET_SHMEDIA" "mshalds.w %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "ashrv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ashiftrt:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshard.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "ashrv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ashiftrt:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshard.w %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "mshards_q" [(set (match_operand:HI 0 "arith_reg_dest" "=r") (ss_truncate:HI (ashiftrt:DI (match_operand:DI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mshards.q %1, %N2, %0" [(set_attr "type" "mcmp_media")]) (define_expand "mshfhi_b" [(match_operand:V8QI 0 "arith_reg_dest" "") (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_b : gen_mshf0_b) (operands[0], operands[1], operands[2])); DONE; }") (define_expand "mshflo_b" [(match_operand:V8QI 0 "arith_reg_dest" "") (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_b : gen_mshf4_b) (operands[0], operands[1], operands[2])); DONE; }") (define_insn "mshf4_b" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (vec_select:V8QI (vec_concat:V16QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 4) (const_int 12) (const_int 5) (const_int 13) (const_int 6) (const_int 14) (const_int 7) (const_int 15)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshfhi.b %N1, %N2, %0\" : \"mshflo.b %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_insn "mshf0_b" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (vec_select:V8QI (vec_concat:V16QI (match_operand:V8QI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V8QI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 0) (const_int 8) (const_int 1) (const_int 9) (const_int 2) (const_int 10) (const_int 3) (const_int 11)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshflo.b %N1, %N2, %0\" : \"mshfhi.b %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_expand "mshfhi_l" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_l : gen_mshf0_l) (operands[0], operands[1], operands[2])); DONE; }") (define_expand "mshflo_l" [(match_operand:V2SI 0 "arith_reg_dest" "") (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_l : gen_mshf4_l) (operands[0], operands[1], operands[2])); DONE; }") (define_insn "mshf4_l" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (vec_select:V2SI (vec_concat:V4SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 1) (const_int 3)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshfhi.l %N1, %N2, %0\" : \"mshflo.l %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_insn "mshf0_l" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (vec_select:V2SI (vec_concat:V4SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 0) (const_int 2)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshflo.l %N1, %N2, %0\" : \"mshfhi.l %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_expand "mshfhi_w" [(match_operand:V4HI 0 "arith_reg_dest" "") (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf4_w : gen_mshf0_w) (operands[0], operands[1], operands[2])); DONE; }") (define_expand "mshflo_w" [(match_operand:V4HI 0 "arith_reg_dest" "") (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")] "TARGET_SHMEDIA" " { emit_insn ((TARGET_LITTLE_ENDIAN ? gen_mshf0_w : gen_mshf4_w) (operands[0], operands[1], operands[2])); DONE; }") (define_insn "mshf4_w" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_select:V4HI (vec_concat:V8HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 2) (const_int 6) (const_int 3) (const_int 7)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshfhi.w %N1, %N2, %0\" : \"mshflo.w %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_insn "mshf0_w" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_select:V4HI (vec_concat:V8HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_or_0_operand" "rZ")) (parallel [(const_int 0) (const_int 4) (const_int 1) (const_int 5)])))] "TARGET_SHMEDIA" "* return (TARGET_LITTLE_ENDIAN ? \"mshflo.w %N1, %N2, %0\" : \"mshfhi.w %N1, %N2, %0\");" [(set_attr "type" "arith_media")]) (define_insn "mshflo_w_x" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (vec_select:V4HI (vec_concat:V4HI (match_operand:V2HI 1 "extend_reg_or_0_operand" "rZ") (match_operand:V2HI 2 "extend_reg_or_0_operand" "rZ")) (parallel [(const_int 2) (const_int 0) (const_int 3) (const_int 1)])))] "TARGET_SHMEDIA" "mshflo.w %N1, %N2, %0" [(set_attr "type" "arith_media")]) /* These are useful to expand ANDs and as combiner patterns. */ (define_insn_and_split "mshfhi_l_di" [(set (match_operand:DI 0 "arith_reg_dest" "=r,f") (ior:DI (lshiftrt:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ,f") (const_int 32)) (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ,?f") (const_int -4294967296))))] "TARGET_SHMEDIA" "@ mshfhi.l %N1, %N2, %0 #" "TARGET_SHMEDIA && reload_completed && ! GENERAL_REGISTER_P (true_regnum (operands[0]))" [(set (match_dup 3) (match_dup 4)) (set (match_dup 5) (match_dup 6))] " { operands[3] = gen_lowpart (SImode, operands[0]); operands[4] = gen_highpart (SImode, operands[1]); operands[5] = gen_highpart (SImode, operands[0]); operands[6] = gen_highpart (SImode, operands[2]); }" [(set_attr "type" "arith_media")]) (define_insn "*mshfhi_l_di_rev" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (const_int -4294967296)) (lshiftrt:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (const_int 32))))] "TARGET_SHMEDIA" "mshfhi.l %N2, %N1, %0" [(set_attr "type" "arith_media")]) (define_split [(set (match_operand:DI 0 "arith_reg_dest" "") (ior:DI (zero_extend:DI (match_operand:SI 1 "extend_reg_or_0_operand" "")) (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "") (const_int -4294967296)))) (clobber (match_operand:DI 3 "arith_reg_dest" ""))] "TARGET_SHMEDIA" [(const_int 0)] " { emit_insn (gen_ashldi3_media (operands[3], simplify_gen_subreg (DImode, operands[1], SImode, 0), GEN_INT (32))); emit_insn (gen_mshfhi_l_di (operands[0], operands[3], operands[2])); DONE; }") (define_insn "mshflo_l_di" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (and:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (const_int 4294967295)) (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (const_int 32))))] "TARGET_SHMEDIA" "mshflo.l %N1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn "*mshflo_l_di_rev" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (const_int 32)) (and:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (const_int 4294967295))))] "TARGET_SHMEDIA" "mshflo.l %N2, %N1, %0" [(set_attr "type" "arith_media")]) ;; Combiner pattern for trampoline initialization. (define_insn_and_split "*double_shori" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_operand" "0") (const_int 32)) (match_operand:DI 2 "const_int_operand" "n")))] "TARGET_SHMEDIA && INTVAL (operands[2]) == trunc_int_for_mode (INTVAL (operands[2]), SImode)" "#" "rtx_equal_p (operands[0], operands[1])" [(const_int 0)] " { HOST_WIDE_INT v = INTVAL (operands[2]); emit_insn (gen_shori_media (operands[0], operands[0], gen_int_mode (INTVAL (operands[2]) >> 16, HImode))); emit_insn (gen_shori_media (operands[0], operands[0], gen_int_mode (v, HImode))); DONE; }") (define_insn "*mshflo_l_di_x" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (zero_extend:DI (match_operand:SI 1 "extend_reg_or_0_operand" "rZ")) (ashift:DI (match_operand:DI 2 "arith_reg_or_0_operand" "rZ") (const_int 32))))] "TARGET_SHMEDIA" "mshflo.l %N1, %N2, %0" [(set_attr "type" "arith_media")]) (define_insn_and_split "concat_v2sf" [(set (match_operand:V2SF 0 "register_operand" "=r,f,f?") ;; (vec_concat:V2SF (match_operand:SF 1 "register_operand" "rZ,0,f") (vec_concat:V2SF (match_operand:SF 1 "register_operand" "rZ,f,f") (match_operand:SF 2 "register_operand" "rZ,f,f")))] "TARGET_SHMEDIA" "@ mshflo.l %N1, %N2, %0 # #" "TARGET_SHMEDIA && reload_completed && ! GENERAL_REGISTER_P (true_regnum (operands[0]))" [(set (match_dup 3) (match_dup 1)) (set (match_dup 4) (match_dup 2))] " { operands[3] = simplify_gen_subreg (SFmode, operands[0], V2SFmode, 0); operands[4] = simplify_gen_subreg (SFmode, operands[0], V2SFmode, 4); }" [(set_attr "type" "arith_media")]) (define_insn "*mshflo_l_di_x_rev" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (ior:DI (ashift:DI (match_operand:DI 1 "arith_reg_or_0_operand" "rZ") (const_int 32)) (zero_extend:DI (match_operand:SI 2 "extend_reg_or_0_operand" "rZ"))))] "TARGET_SHMEDIA" "mshflo.l %N2, %N1, %0" [(set_attr "type" "arith_media")]) (define_insn "ashlv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ashift:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshlld.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "ashlv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ashift:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshlld.w %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "lshrv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (lshiftrt:V2SI (match_operand:V2SI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshlrd.l %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "lshrv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (lshiftrt:V4HI (match_operand:V4HI 1 "arith_reg_operand" "r") (match_operand:DI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "mshlrd.w %1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "subv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (minus:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "msub.l %N1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "subv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (minus:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "msub.w %N1, %2, %0" [(set_attr "type" "arith_media")]) (define_insn "sssubv2si3" [(set (match_operand:V2SI 0 "arith_reg_dest" "=r") (ss_minus:V2SI (match_operand:V2SI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V2SI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "msubs.l %N1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "ussubv8qi3" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (us_minus:V8QI (match_operand:V8QI 1 "arith_reg_operand" "r") (match_operand:V8QI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "msubs.ub %1, %2, %0" [(set_attr "type" "mcmp_media")]) (define_insn "sssubv4hi3" [(set (match_operand:V4HI 0 "arith_reg_dest" "=r") (ss_minus:V4HI (match_operand:V4HI 1 "arith_reg_or_0_operand" "rZ") (match_operand:V4HI 2 "arith_reg_operand" "r")))] "TARGET_SHMEDIA" "msubs.w %N1, %2, %0" [(set_attr "type" "mcmp_media")]) ;; Floating Point Intrinsics (define_insn "fcosa_s" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (unspec:SF [(match_operand:SI 1 "fp_arith_reg_operand" "f")] UNSPEC_FCOSA))] "TARGET_SHMEDIA" "fcosa.s %1, %0" [(set_attr "type" "atrans_media")]) (define_insn "fsina_s" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (unspec:SF [(match_operand:SI 1 "fp_arith_reg_operand" "f")] UNSPEC_FSINA))] "TARGET_SHMEDIA" "fsina.s %1, %0" [(set_attr "type" "atrans_media")]) (define_insn "fipr" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (plus:SF (plus:SF (vec_select:SF (mult:V4SF (match_operand:V4SF 1 "fp_arith_reg_operand" "f") (match_operand:V4SF 2 "fp_arith_reg_operand" "f")) (parallel [(const_int 0)])) (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) (parallel [(const_int 1)]))) (plus:SF (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) (parallel [(const_int 2)])) (vec_select:SF (mult:V4SF (match_dup 1) (match_dup 2)) (parallel [(const_int 3)])))))] "TARGET_SHMEDIA" "fipr.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn "fsrra_s" [(set (match_operand:SF 0 "fp_arith_reg_operand" "=f") (unspec:SF [(match_operand:SF 1 "fp_arith_reg_operand" "f")] UNSPEC_FSRRA))] "TARGET_SHMEDIA" "fsrra.s %1, %0" [(set_attr "type" "atrans_media")]) (define_insn "ftrv" [(set (match_operand:V4SF 0 "fp_arith_reg_operand" "=f") (plus:V4SF (plus:V4SF (mult:V4SF (vec_select:V4SF (match_operand:V16SF 1 "fp_arith_reg_operand" "f") (parallel [(const_int 0) (const_int 5) (const_int 10) (const_int 15)])) (match_operand:V4SF 2 "fp_arith_reg_operand" "f")) (mult:V4SF (vec_select:V4SF (match_dup 1) (parallel [(const_int 4) (const_int 9) (const_int 14) (const_int 3)])) (vec_select:V4SF (match_dup 2) (parallel [(const_int 1) (const_int 2) (const_int 3) (const_int 0)])))) (plus:V4SF (mult:V4SF (vec_select:V4SF (match_dup 1) (parallel [(const_int 8) (const_int 13) (const_int 2) (const_int 7)])) (vec_select:V4SF (match_dup 2) (parallel [(const_int 2) (const_int 3) (const_int 0) (const_int 1)]))) (mult:V4SF (vec_select:V4SF (match_dup 1) (parallel [(const_int 12) (const_int 1) (const_int 6) (const_int 11)])) (vec_select:V4SF (match_dup 2) (parallel [(const_int 3) (const_int 0) (const_int 1) (const_int 2)]))))))] "TARGET_SHMEDIA" "ftrv.s %1, %2, %0" [(set_attr "type" "fparith_media")]) (define_insn "nsb" [(set (match_operand:QI 0 "arith_reg_dest" "=r") (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] UNSPEC_NSB))] "TARGET_SHMEDIA" "nsb %1, %0" [(set_attr "type" "arith_media")]) (define_insn "nsbsi" [(set (match_operand:SI 0 "arith_reg_dest" "=r") (zero_extend:SI (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] UNSPEC_NSB)))] "TARGET_SHMEDIA" "nsb %1, %0" [(set_attr "type" "arith_media")]) (define_insn "nsbdi" [(set (match_operand:DI 0 "arith_reg_dest" "=r") (zero_extend:DI (unspec:QI [(match_operand:DI 1 "arith_reg_operand" "r")] UNSPEC_NSB)))] "TARGET_SHMEDIA" "nsb %1, %0" [(set_attr "type" "arith_media")]) (define_expand "ffsdi2" [(set (match_operand:DI 0 "arith_reg_dest" "") (ffs:DI (match_operand:DI 1 "arith_reg_operand" "")))] "TARGET_SHMEDIA" " { rtx scratch = gen_reg_rtx (DImode); rtx last; emit_insn (gen_adddi3 (scratch, operands[1], GEN_INT (-1))); emit_insn (gen_xordi3 (scratch, operands[1], scratch)); emit_insn (gen_lshrdi3_media (scratch, scratch, const1_rtx)); emit_insn (gen_nsbdi (scratch, scratch)); emit_insn (gen_adddi3 (scratch, scratch, GEN_INT (-64))); emit_insn (gen_movdicc_false (scratch, operands[1], const0_rtx, scratch)); last = emit_insn (gen_subdi3 (operands[0], const0_rtx, scratch)); REG_NOTES (last) = gen_rtx_EXPR_LIST (REG_EQUAL, gen_rtx_FFS (DImode, operands[0]), REG_NOTES (last)); DONE; }") (define_expand "ffssi2" [(set (match_operand:SI 0 "arith_reg_dest" "") (ffs:SI (match_operand:SI 1 "arith_reg_operand" "")))] "TARGET_SHMEDIA" " { rtx scratch = gen_reg_rtx (SImode); rtx discratch = gen_reg_rtx (DImode); rtx last; emit_insn (gen_adddi3 (discratch, simplify_gen_subreg (DImode, operands[1], SImode, 0), GEN_INT (-1))); emit_insn (gen_andcdi3 (discratch, simplify_gen_subreg (DImode, operands[1], SImode, 0), discratch)); emit_insn (gen_nsbsi (scratch, discratch)); last = emit_insn (gen_subsi3 (operands[0], force_reg (SImode, GEN_INT (63)), scratch)); REG_NOTES (last) = gen_rtx_EXPR_LIST (REG_EQUAL, gen_rtx_FFS (SImode, operands[0]), REG_NOTES (last)); DONE; }") (define_insn "byterev" [(set (match_operand:V8QI 0 "arith_reg_dest" "=r") (vec_select:V8QI (match_operand:V8QI 1 "arith_reg_operand" "r") (parallel [(const_int 7) (const_int 6) (const_int 5) (const_int 4) (const_int 3) (const_int 2) (const_int 1) (const_int 0)])))] "TARGET_SHMEDIA" "byterev %1, %0" [(set_attr "type" "arith_media")]) (define_insn "prefetch" [(prefetch (match_operand:QI 0 "address_operand" "p") (match_operand:SI 1 "const_int_operand" "n") (match_operand:SI 2 "const_int_operand" "n"))] "TARGET_SHMEDIA" "* { operands[0] = gen_rtx_MEM (QImode, operands[0]); output_asm_insn (\"ld%M0.b %m0,r63\", operands); return \"\"; }" [(set_attr "type" "other")]) ;; The following description models the ;; SH4 pipeline using the DFA based scheduler. ;; The DFA based description is better way to model ;; a superscalar pipeline as compared to function unit ;; reservation model. ;; 1. The function unit based model is oriented to describe at most one ;; unit reservation by each insn. It is difficult to model unit reservations in multiple ;; pipeline units by same insn. This can be done using DFA based description. ;; 2. The execution performance of DFA based scheduler does not depend on processor complexity. ;; 3. Writing all unit reservations for an instruction class is more natural description ;; of the pipeline and makes interface of the hazard recognizer simpler than the ;; old function unit based model. ;; 4. The DFA model is richer and is a part of greater overall framework of RCSP. ;; Two automata are defined to reduce number of states ;; which a single large automaton will have.(Factoring) (define_automaton "inst_pipeline,fpu_pipe") ;; This unit is basically the decode unit of the processor. ;; Since SH4 is a dual issue machine,it is as if there are two ;; units so that any insn can be processed by either one ;; of the decoding unit. (define_cpu_unit "pipe_01,pipe_02" "inst_pipeline") ;; The fixed point arithmetic calculator(?? EX Unit). (define_cpu_unit "int" "inst_pipeline") ;; f1_1 and f1_2 are floating point units.Actually there is ;; a f1 unit which can overlap with other f1 unit but ;; not another F1 unit.It is as though there were two ;; f1 units. (define_cpu_unit "f1_1,f1_2" "fpu_pipe") ;; The floating point units (except FS - F2 always precedes it.) (define_cpu_unit "F0,F1,F2,F3" "fpu_pipe") ;; This is basically the MA unit of SH4 ;; used in LOAD/STORE pipeline. (define_cpu_unit "memory" "inst_pipeline") ;; However, there are LS group insns that don't use it, even ones that ;; complete in 0 cycles. So we use an extra unit for the issue of LS insns. (define_cpu_unit "load_store" "inst_pipeline") ;; The address calculator used for branch instructions. ;; This will be reserved after "issue" of branch instructions ;; and this is to make sure that no two branch instructions ;; can be issued in parallel. (define_cpu_unit "pcr_addrcalc" "inst_pipeline") ;; ---------------------------------------------------- ;; This reservation is to simplify the dual issue description. (define_reservation "issue" "pipe_01|pipe_02") ;; This is to express the locking of D stage. ;; Note that the issue of a CO group insn also effectively locks the D stage. (define_reservation "d_lock" "pipe_01+pipe_02") ;; Every FE instruction but fipr / ftrv starts with issue and this. (define_reservation "F01" "F0+F1") ;; This is to simplify description where F1,F2,FS ;; are used simultaneously. (define_reservation "fpu" "F1+F2") ;; This is to highlight the fact that f1 ;; cannot overlap with F1. (exclusion_set "f1_1,f1_2" "F1") (define_insn_reservation "nil" 0 (eq_attr "type" "nil") "nothing") ;; Although reg moves have a latency of zero ;; we need to highlight that they use D stage ;; for one cycle. ;; Group: MT (define_insn_reservation "reg_mov" 0 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "move")) "issue") ;; Group: LS (define_insn_reservation "freg_mov" 0 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "fmove")) "issue+load_store") ;; We don't model all pipeline stages; we model the issue ('D') stage ;; inasmuch as we allow only two instructions to issue simultaneously, ;; and CO instructions prevent any simultaneous issue of another instruction. ;; (This uses pipe_01 and pipe_02). ;; Double issue of EX insns is prevented by using the int unit in the EX stage. ;; Double issue of EX / BR insns is prevented by using the int unit / ;; pcr_addrcalc unit in the EX stage. ;; Double issue of BR / LS instructions is prevented by using the ;; pcr_addrcalc / load_store unit in the issue cycle. ;; Double issue of FE instructions is prevented by using F0 in the first ;; pipeline stage after the first D stage. ;; There is no need to describe the [ES]X / [MN]A / S stages after a D stage ;; (except in the cases outlined above), nor to describe the FS stage after ;; the F2 stage. ;; Other MT group instructions(1 step operations) ;; Group: MT ;; Latency: 1 ;; Issue Rate: 1 (define_insn_reservation "mt" 1 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "mt_group")) "issue") ;; Fixed Point Arithmetic Instructions(1 step operations) ;; Group: EX ;; Latency: 1 ;; Issue Rate: 1 (define_insn_reservation "sh4_simple_arith" 1 (and (eq_attr "pipe_model" "sh4") (eq_attr "insn_class" "ex_group")) "issue,int") ;; Load and store instructions have no alignment peculiarities for the SH4, ;; but they use the load-store unit, which they share with the fmove type ;; insns (fldi[01]; fmov frn,frm; flds; fsts; fabs; fneg) . ;; Loads have a latency of two. ;; However, call insns can only paired with a preceding insn, and have ;; a delay slot, so that we want two more insns to be scheduled between the ;; load of the function address and the call. This is equivalent to a ;; latency of three. ;; ADJUST_COST can only properly handle reductions of the cost, so we ;; use a latency of three here, which gets multiplied by 10 to yield 30. ;; We only do this for SImode loads of general registers, to make the work ;; for ADJUST_COST easier. ;; Load Store instructions. (MOV.[BWL]@(d,GBR) ;; Group: LS ;; Latency: 2 ;; Issue Rate: 1 (define_insn_reservation "sh4_load" 2 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "load,pcload")) "issue+load_store,nothing,memory") ;; calls / sfuncs need an extra instruction for their delay slot. ;; Moreover, estimating the latency for SImode loads as 3 will also allow ;; adjust_cost to meaningfully bump it back up to 3 if they load the shift ;; count of a dynamic shift. (define_insn_reservation "sh4_load_si" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "load_si,pcload_si")) "issue+load_store,nothing,memory") ;; (define_bypass 2 "sh4_load_si" "!sh4_call") ;; The load latency is upped to three higher if the dependent insn does ;; double precision computation. We want the 'default' latency to reflect ;; that increased latency because otherwise the insn priorities won't ;; allow proper scheduling. (define_insn_reservation "sh4_fload" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "fload,pcfload")) "issue+load_store,nothing,memory") ;; (define_bypass 2 "sh4_fload" "!") (define_insn_reservation "sh4_store" 1 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "store")) "issue+load_store,nothing,memory") ;; Load Store instructions. ;; Group: LS ;; Latency: 1 ;; Issue Rate: 1 (define_insn_reservation "sh4_gp_fpul" 1 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "gp_fpul")) "issue+load_store") ;; Load Store instructions. ;; Group: LS ;; Latency: 3 ;; Issue Rate: 1 (define_insn_reservation "sh4_fpul_gp" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "fpul_gp")) "issue+load_store") ;; Branch (BF,BF/S,BT,BT/S,BRA) ;; Group: BR ;; Latency when taken: 2 (or 1) ;; Issue Rate: 1 ;; The latency is 1 when displacement is 0. ;; We can't really do much with the latency, even if we could express it, ;; but the pairing restrictions are useful to take into account. ;; ??? If the branch is likely, we might want to fill the delay slot; ;; if the branch is likely, but not very likely, should we pretend to use ;; a resource that CO instructions use, to get a pairable delay slot insn? (define_insn_reservation "sh4_branch" 1 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "cbranch,jump")) "issue+pcr_addrcalc") ;; Branch Far (JMP,RTS,BRAF) ;; Group: CO ;; Latency: 3 ;; Issue Rate: 2 ;; ??? Scheduling happens before branch shortening, and hence jmp and braf ;; can't be distinguished from bra for the "jump" pattern. (define_insn_reservation "sh4_return" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "return,jump_ind")) "d_lock*2") ;; RTE ;; Group: CO ;; Latency: 5 ;; Issue Rate: 5 ;; this instruction can be executed in any of the pipelines ;; and blocks the pipeline for next 4 stages. (define_insn_reservation "sh4_return_from_exp" 5 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "rte")) "d_lock*5") ;; OCBP, OCBWB ;; Group: CO ;; Latency: 1-5 ;; Issue Rate: 1 ;; cwb is used for the sequence ocbwb @%0; extu.w %0,%2; or %1,%2; mov.l %0,@%2 ;; ocbwb on its own would be "d_lock,nothing,memory*5" (define_insn_reservation "ocbwb" 6 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "cwb")) "d_lock*2,(d_lock+memory)*3,issue+load_store+memory,memory*2") ;; LDS to PR,JSR ;; Group: CO ;; Latency: 3 ;; Issue Rate: 2 ;; The SX stage is blocked for last 2 cycles. ;; OTOH, the only time that has an effect for insns generated by the compiler ;; is when lds to PR is followed by sts from PR - and that is highly unlikely - ;; or when we are doing a function call - and we don't do inter-function ;; scheduling. For the function call case, it's really best that we end with ;; something that models an rts. (define_insn_reservation "sh4_lds_to_pr" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "prset") ) "d_lock*2") ;; calls introduce a longisch delay that is likely to flush the pipelines ;; of the caller's instructions. Ordinary functions tend to end with a ;; load to restore a register (in the delay slot of rts), while sfuncs ;; tend to end with an EX or MT insn. But that is not actually relevant, ;; since there are no instructions that contend for memory access early. ;; We could, of course, provide exact scheduling information for specific ;; sfuncs, if that should prove useful. (define_insn_reservation "sh4_call" 16 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "call,sfunc")) "d_lock*16") ;; LDS.L to PR ;; Group: CO ;; Latency: 3 ;; Issue Rate: 2 ;; The SX unit is blocked for last 2 cycles. (define_insn_reservation "ldsmem_to_pr" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "pload")) "d_lock*2") ;; STS from PR ;; Group: CO ;; Latency: 2 ;; Issue Rate: 2 ;; The SX unit in second and third cycles. (define_insn_reservation "sts_from_pr" 2 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "prget")) "d_lock*2") ;; STS.L from PR ;; Group: CO ;; Latency: 2 ;; Issue Rate: 2 (define_insn_reservation "sh4_prstore_mem" 2 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "pstore")) "d_lock*2,nothing,memory") ;; LDS to FPSCR ;; Group: CO ;; Latency: 4 ;; Issue Rate: 1 ;; F1 is blocked for last three cycles. (define_insn_reservation "fpscr_load" 4 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "gp_fpscr")) "d_lock,nothing,F1*3") ;; LDS.L to FPSCR ;; Group: CO ;; Latency: 1 / 4 ;; Latency to update Rn is 1 and latency to update FPSCR is 4 ;; Issue Rate: 1 ;; F1 is blocked for last three cycles. (define_insn_reservation "fpscr_load_mem" 4 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "mem_fpscr")) "d_lock,nothing,(F1+memory),F1*2") ;; Fixed point multiplication (DMULS.L DMULU.L MUL.L MULS.W,MULU.W) ;; Group: CO ;; Latency: 4 / 4 ;; Issue Rate: 1 (define_insn_reservation "multi" 4 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "smpy,dmpy")) "d_lock,(d_lock+f1_1),(f1_1|f1_2)*3,F2") ;; Fixed STS from MACL / MACH ;; Group: CO ;; Latency: 3 ;; Issue Rate: 1 (define_insn_reservation "sh4_mac_gp" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "mac_gp")) "d_lock") ;; Single precision floating point computation FCMP/EQ, ;; FCMP/GT, FADD, FLOAT, FMAC, FMUL, FSUB, FTRC, FRVHG, FSCHG ;; Group: FE ;; Latency: 3/4 ;; Issue Rate: 1 (define_insn_reservation "fp_arith" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "fp")) "issue,F01,F2") (define_insn_reservation "fp_arith_ftrc" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "ftrc_s")) "issue,F01,F2") (define_bypass 1 "fp_arith_ftrc" "sh4_fpul_gp") ;; Single Precision FDIV/SQRT ;; Group: FE ;; Latency: 12/13 (FDIV); 11/12 (FSQRT) ;; Issue Rate: 1 ;; We describe fdiv here; fsqrt is actually one cycle faster. (define_insn_reservation "fp_div" 12 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "fdiv")) "issue,F01+F3,F2+F3,F3*7,F1+F3,F2") ;; Double Precision floating point computation ;; (FCNVDS, FCNVSD, FLOAT, FTRC) ;; Group: FE ;; Latency: (3,4)/5 ;; Issue Rate: 1 (define_insn_reservation "dp_float" 4 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "dfp_conv")) "issue,F01,F1+F2,F2") ;; Double-precision floating-point (FADD,FMUL,FSUB) ;; Group: FE ;; Latency: (7,8)/9 ;; Issue Rate: 1 (define_insn_reservation "fp_double_arith" 8 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "dfp_arith")) "issue,F01,F1+F2,fpu*4,F2") ;; Double-precision FCMP (FCMP/EQ,FCMP/GT) ;; Group: CO ;; Latency: 3/5 ;; Issue Rate: 2 (define_insn_reservation "fp_double_cmp" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "dfp_cmp")) "d_lock,(d_lock+F01),F1+F2,F2") ;; Double precision FDIV/SQRT ;; Group: FE ;; Latency: (24,25)/26 ;; Issue Rate: 1 (define_insn_reservation "dp_div" 25 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "dfdiv")) "issue,F01+F3,F1+F2+F3,F2+F3,F3*16,F1+F3,(fpu+F3)*2,F2") ;; Use the branch-not-taken case to model arith3 insns. For the branch taken ;; case, we'd get a d_lock instead of issue at the end. (define_insn_reservation "arith3" 3 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "arith3")) "issue,d_lock+pcr_addrcalc,issue") ;; arith3b insns schedule the same no matter if the branch is taken or not. (define_insn_reservation "arith3b" 2 (and (eq_attr "pipe_model" "sh4") (eq_attr "type" "arith3")) "issue,d_lock+pcr_addrcalc")