/* Analyze RTL for GNU compiler. Copyright (C) 1987, 1988, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006 Free Software Foundation, Inc. This file is part of GCC. GCC is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2, or (at your option) any later version. GCC is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with GCC; see the file COPYING. If not, write to the Free Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */ #include "config.h" #include "system.h" #include "coretypes.h" #include "tm.h" #include "toplev.h" #include "rtl.h" #include "hard-reg-set.h" #include "insn-config.h" #include "recog.h" #include "target.h" #include "output.h" #include "tm_p.h" #include "flags.h" #include "real.h" #include "regs.h" #include "function.h" /* Forward declarations */ static void set_of_1 (rtx, rtx, void *); static bool covers_regno_p (rtx, unsigned int); static bool covers_regno_no_parallel_p (rtx, unsigned int); static int rtx_referenced_p_1 (rtx *, void *); static int computed_jump_p_1 (rtx); static void parms_set (rtx, rtx, void *); static unsigned HOST_WIDE_INT cached_nonzero_bits (rtx, enum machine_mode, rtx, enum machine_mode, unsigned HOST_WIDE_INT); static unsigned HOST_WIDE_INT nonzero_bits1 (rtx, enum machine_mode, rtx, enum machine_mode, unsigned HOST_WIDE_INT); static unsigned int cached_num_sign_bit_copies (rtx, enum machine_mode, rtx, enum machine_mode, unsigned int); static unsigned int num_sign_bit_copies1 (rtx, enum machine_mode, rtx, enum machine_mode, unsigned int); /* Offset of the first 'e', 'E' or 'V' operand for each rtx code, or -1 if a code has no such operand. */ static int non_rtx_starting_operands[NUM_RTX_CODE]; /* Bit flags that specify the machine subtype we are compiling for. Bits are tested using macros TARGET_... defined in the tm.h file and set by `-m...' switches. Must be defined in rtlanal.c. */ int target_flags; /* Truncation narrows the mode from SOURCE mode to DESTINATION mode. If TARGET_MODE_REP_EXTENDED (DESTINATION, DESTINATION_REP) is SIGN_EXTEND then while narrowing we also have to enforce the representation and sign-extend the value to mode DESTINATION_REP. If the value is already sign-extended to DESTINATION_REP mode we can just switch to DESTINATION mode on it. For each pair of integral modes SOURCE and DESTINATION, when truncating from SOURCE to DESTINATION, NUM_SIGN_BIT_COPIES_IN_REP[SOURCE][DESTINATION] contains the number of high-order bits in SOURCE that have to be copies of the sign-bit so that we can do this mode-switch to DESTINATION. */ static unsigned int num_sign_bit_copies_in_rep[MAX_MODE_INT + 1][MAX_MODE_INT + 1]; /* Return 1 if the value of X is unstable (would be different at a different point in the program). The frame pointer, arg pointer, etc. are considered stable (within one function) and so is anything marked `unchanging'. */ int rtx_unstable_p (rtx x) { RTX_CODE code = GET_CODE (x); int i; const char *fmt; switch (code) { case MEM: return !MEM_READONLY_P (x) || rtx_unstable_p (XEXP (x, 0)); case CONST: case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case SYMBOL_REF: case LABEL_REF: return 0; case REG: /* As in rtx_varies_p, we have to use the actual rtx, not reg number. */ if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx /* The arg pointer varies if it is not a fixed register. */ || (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])) return 0; #ifndef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED /* ??? When call-clobbered, the value is stable modulo the restore that must happen after a call. This currently screws up local-alloc into believing that the restore is not needed. */ if (x == pic_offset_table_rtx) return 0; #endif return 1; case ASM_OPERANDS: if (MEM_VOLATILE_P (x)) return 1; /* Fall through. */ default: break; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) if (fmt[i] == 'e') { if (rtx_unstable_p (XEXP (x, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (rtx_unstable_p (XVECEXP (x, i, j))) return 1; } return 0; } /* Return 1 if X has a value that can vary even between two executions of the program. 0 means X can be compared reliably against certain constants or near-constants. FOR_ALIAS is nonzero if we are called from alias analysis; if it is zero, we are slightly more conservative. The frame pointer and the arg pointer are considered constant. */ int rtx_varies_p (rtx x, int for_alias) { RTX_CODE code; int i; const char *fmt; if (!x) return 0; code = GET_CODE (x); switch (code) { case MEM: return !MEM_READONLY_P (x) || rtx_varies_p (XEXP (x, 0), for_alias); case CONST: case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case SYMBOL_REF: case LABEL_REF: return 0; case REG: /* Note that we have to test for the actual rtx used for the frame and arg pointers and not just the register number in case we have eliminated the frame and/or arg pointer and are using it for pseudos. */ if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx /* The arg pointer varies if it is not a fixed register. */ || (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])) return 0; if (x == pic_offset_table_rtx #ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED /* ??? When call-clobbered, the value is stable modulo the restore that must happen after a call. This currently screws up local-alloc into believing that the restore is not needed, so we must return 0 only if we are called from alias analysis. */ && for_alias #endif ) return 0; return 1; case LO_SUM: /* The operand 0 of a LO_SUM is considered constant (in fact it is related specifically to operand 1) during alias analysis. */ return (! for_alias && rtx_varies_p (XEXP (x, 0), for_alias)) || rtx_varies_p (XEXP (x, 1), for_alias); case ASM_OPERANDS: if (MEM_VOLATILE_P (x)) return 1; /* Fall through. */ default: break; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) if (fmt[i] == 'e') { if (rtx_varies_p (XEXP (x, i), for_alias)) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (rtx_varies_p (XVECEXP (x, i, j), for_alias)) return 1; } return 0; } /* Return nonzero if the use of X as an address in a MEM can cause a trap. MODE is the mode of the MEM (not that of X) and UNALIGNED_MEMS controls whether nonzero is returned for unaligned memory accesses on strict alignment machines. */ static int rtx_addr_can_trap_p_1 (rtx x, enum machine_mode mode, bool unaligned_mems) { enum rtx_code code = GET_CODE (x); switch (code) { case SYMBOL_REF: return SYMBOL_REF_WEAK (x); case LABEL_REF: return 0; case REG: /* As in rtx_varies_p, we have to use the actual rtx, not reg number. */ if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx || x == stack_pointer_rtx /* The arg pointer varies if it is not a fixed register. */ || (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])) return 0; /* All of the virtual frame registers are stack references. */ if (REGNO (x) >= FIRST_VIRTUAL_REGISTER && REGNO (x) <= LAST_VIRTUAL_REGISTER) return 0; return 1; case CONST: return rtx_addr_can_trap_p_1 (XEXP (x, 0), mode, unaligned_mems); case PLUS: /* An address is assumed not to trap if: - it is an address that can't trap plus a constant integer, with the proper remainder modulo the mode size if we are considering unaligned memory references. */ if (!rtx_addr_can_trap_p_1 (XEXP (x, 0), mode, unaligned_mems) && GET_CODE (XEXP (x, 1)) == CONST_INT) { HOST_WIDE_INT offset; if (!STRICT_ALIGNMENT || !unaligned_mems || GET_MODE_SIZE (mode) == 0) return 0; offset = INTVAL (XEXP (x, 1)); #ifdef SPARC_STACK_BOUNDARY_HACK /* ??? The SPARC port may claim a STACK_BOUNDARY higher than the real alignment of %sp. However, when it does this, the alignment of %sp+STACK_POINTER_OFFSET is STACK_BOUNDARY. */ if (SPARC_STACK_BOUNDARY_HACK && (XEXP (x, 0) == stack_pointer_rtx || XEXP (x, 0) == hard_frame_pointer_rtx)) offset -= STACK_POINTER_OFFSET; #endif return offset % GET_MODE_SIZE (mode) != 0; } /* - or it is the pic register plus a constant. */ if (XEXP (x, 0) == pic_offset_table_rtx && CONSTANT_P (XEXP (x, 1))) return 0; return 1; case LO_SUM: case PRE_MODIFY: return rtx_addr_can_trap_p_1 (XEXP (x, 1), mode, unaligned_mems); case PRE_DEC: case PRE_INC: case POST_DEC: case POST_INC: case POST_MODIFY: return rtx_addr_can_trap_p_1 (XEXP (x, 0), mode, unaligned_mems); default: break; } /* If it isn't one of the case above, it can cause a trap. */ return 1; } /* Return nonzero if the use of X as an address in a MEM can cause a trap. */ int rtx_addr_can_trap_p (rtx x) { return rtx_addr_can_trap_p_1 (x, VOIDmode, false); } /* Return true if X is an address that is known to not be zero. */ bool nonzero_address_p (rtx x) { enum rtx_code code = GET_CODE (x); switch (code) { case SYMBOL_REF: return !SYMBOL_REF_WEAK (x); case LABEL_REF: return true; case REG: /* As in rtx_varies_p, we have to use the actual rtx, not reg number. */ if (x == frame_pointer_rtx || x == hard_frame_pointer_rtx || x == stack_pointer_rtx || (x == arg_pointer_rtx && fixed_regs[ARG_POINTER_REGNUM])) return true; /* All of the virtual frame registers are stack references. */ if (REGNO (x) >= FIRST_VIRTUAL_REGISTER && REGNO (x) <= LAST_VIRTUAL_REGISTER) return true; return false; case CONST: return nonzero_address_p (XEXP (x, 0)); case PLUS: if (GET_CODE (XEXP (x, 1)) == CONST_INT) return nonzero_address_p (XEXP (x, 0)); /* Handle PIC references. */ else if (XEXP (x, 0) == pic_offset_table_rtx && CONSTANT_P (XEXP (x, 1))) return true; return false; case PRE_MODIFY: /* Similar to the above; allow positive offsets. Further, since auto-inc is only allowed in memories, the register must be a pointer. */ if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) > 0) return true; return nonzero_address_p (XEXP (x, 0)); case PRE_INC: /* Similarly. Further, the offset is always positive. */ return true; case PRE_DEC: case POST_DEC: case POST_INC: case POST_MODIFY: return nonzero_address_p (XEXP (x, 0)); case LO_SUM: return nonzero_address_p (XEXP (x, 1)); default: break; } /* If it isn't one of the case above, might be zero. */ return false; } /* Return 1 if X refers to a memory location whose address cannot be compared reliably with constant addresses, or if X refers to a BLKmode memory object. FOR_ALIAS is nonzero if we are called from alias analysis; if it is zero, we are slightly more conservative. */ int rtx_addr_varies_p (rtx x, int for_alias) { enum rtx_code code; int i; const char *fmt; if (x == 0) return 0; code = GET_CODE (x); if (code == MEM) return GET_MODE (x) == BLKmode || rtx_varies_p (XEXP (x, 0), for_alias); fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) if (fmt[i] == 'e') { if (rtx_addr_varies_p (XEXP (x, i), for_alias)) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (rtx_addr_varies_p (XVECEXP (x, i, j), for_alias)) return 1; } return 0; } /* Return the value of the integer term in X, if one is apparent; otherwise return 0. Only obvious integer terms are detected. This is used in cse.c with the `related_value' field. */ HOST_WIDE_INT get_integer_term (rtx x) { if (GET_CODE (x) == CONST) x = XEXP (x, 0); if (GET_CODE (x) == MINUS && GET_CODE (XEXP (x, 1)) == CONST_INT) return - INTVAL (XEXP (x, 1)); if (GET_CODE (x) == PLUS && GET_CODE (XEXP (x, 1)) == CONST_INT) return INTVAL (XEXP (x, 1)); return 0; } /* If X is a constant, return the value sans apparent integer term; otherwise return 0. Only obvious integer terms are detected. */ rtx get_related_value (rtx x) { if (GET_CODE (x) != CONST) return 0; x = XEXP (x, 0); if (GET_CODE (x) == PLUS && GET_CODE (XEXP (x, 1)) == CONST_INT) return XEXP (x, 0); else if (GET_CODE (x) == MINUS && GET_CODE (XEXP (x, 1)) == CONST_INT) return XEXP (x, 0); return 0; } /* Return the number of places FIND appears within X. If COUNT_DEST is zero, we do not count occurrences inside the destination of a SET. */ int count_occurrences (rtx x, rtx find, int count_dest) { int i, j; enum rtx_code code; const char *format_ptr; int count; if (x == find) return 1; code = GET_CODE (x); switch (code) { case REG: case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case SYMBOL_REF: case CODE_LABEL: case PC: case CC0: return 0; case MEM: if (MEM_P (find) && rtx_equal_p (x, find)) return 1; break; case SET: if (SET_DEST (x) == find && ! count_dest) return count_occurrences (SET_SRC (x), find, count_dest); break; default: break; } format_ptr = GET_RTX_FORMAT (code); count = 0; for (i = 0; i < GET_RTX_LENGTH (code); i++) { switch (*format_ptr++) { case 'e': count += count_occurrences (XEXP (x, i), find, count_dest); break; case 'E': for (j = 0; j < XVECLEN (x, i); j++) count += count_occurrences (XVECEXP (x, i, j), find, count_dest); break; } } return count; } /* Nonzero if register REG appears somewhere within IN. Also works if REG is not a register; in this case it checks for a subexpression of IN that is Lisp "equal" to REG. */ int reg_mentioned_p (rtx reg, rtx in) { const char *fmt; int i; enum rtx_code code; if (in == 0) return 0; if (reg == in) return 1; if (GET_CODE (in) == LABEL_REF) return reg == XEXP (in, 0); code = GET_CODE (in); switch (code) { /* Compare registers by number. */ case REG: return REG_P (reg) && REGNO (in) == REGNO (reg); /* These codes have no constituent expressions and are unique. */ case SCRATCH: case CC0: case PC: return 0; case CONST_INT: case CONST_VECTOR: case CONST_DOUBLE: /* These are kept unique for a given value. */ return 0; default: break; } if (GET_CODE (reg) == code && rtx_equal_p (reg, in)) return 1; fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'E') { int j; for (j = XVECLEN (in, i) - 1; j >= 0; j--) if (reg_mentioned_p (reg, XVECEXP (in, i, j))) return 1; } else if (fmt[i] == 'e' && reg_mentioned_p (reg, XEXP (in, i))) return 1; } return 0; } /* Return 1 if in between BEG and END, exclusive of BEG and END, there is no CODE_LABEL insn. */ int no_labels_between_p (rtx beg, rtx end) { rtx p; if (beg == end) return 0; for (p = NEXT_INSN (beg); p != end; p = NEXT_INSN (p)) if (LABEL_P (p)) return 0; return 1; } /* Nonzero if register REG is used in an insn between FROM_INSN and TO_INSN (exclusive of those two). */ int reg_used_between_p (rtx reg, rtx from_insn, rtx to_insn) { rtx insn; if (from_insn == to_insn) return 0; for (insn = NEXT_INSN (from_insn); insn != to_insn; insn = NEXT_INSN (insn)) if (INSN_P (insn) && (reg_overlap_mentioned_p (reg, PATTERN (insn)) || (CALL_P (insn) && find_reg_fusage (insn, USE, reg)))) return 1; return 0; } /* Nonzero if the old value of X, a register, is referenced in BODY. If X is entirely replaced by a new value and the only use is as a SET_DEST, we do not consider it a reference. */ int reg_referenced_p (rtx x, rtx body) { int i; switch (GET_CODE (body)) { case SET: if (reg_overlap_mentioned_p (x, SET_SRC (body))) return 1; /* If the destination is anything other than CC0, PC, a REG or a SUBREG of a REG that occupies all of the REG, the insn references X if it is mentioned in the destination. */ if (GET_CODE (SET_DEST (body)) != CC0 && GET_CODE (SET_DEST (body)) != PC && !REG_P (SET_DEST (body)) && ! (GET_CODE (SET_DEST (body)) == SUBREG && REG_P (SUBREG_REG (SET_DEST (body))) && (((GET_MODE_SIZE (GET_MODE (SUBREG_REG (SET_DEST (body)))) + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD) == ((GET_MODE_SIZE (GET_MODE (SET_DEST (body))) + (UNITS_PER_WORD - 1)) / UNITS_PER_WORD))) && reg_overlap_mentioned_p (x, SET_DEST (body))) return 1; return 0; case ASM_OPERANDS: for (i = ASM_OPERANDS_INPUT_LENGTH (body) - 1; i >= 0; i--) if (reg_overlap_mentioned_p (x, ASM_OPERANDS_INPUT (body, i))) return 1; return 0; case CALL: case USE: case IF_THEN_ELSE: return reg_overlap_mentioned_p (x, body); case TRAP_IF: return reg_overlap_mentioned_p (x, TRAP_CONDITION (body)); case PREFETCH: return reg_overlap_mentioned_p (x, XEXP (body, 0)); case UNSPEC: case UNSPEC_VOLATILE: for (i = XVECLEN (body, 0) - 1; i >= 0; i--) if (reg_overlap_mentioned_p (x, XVECEXP (body, 0, i))) return 1; return 0; case PARALLEL: for (i = XVECLEN (body, 0) - 1; i >= 0; i--) if (reg_referenced_p (x, XVECEXP (body, 0, i))) return 1; return 0; case CLOBBER: if (MEM_P (XEXP (body, 0))) if (reg_overlap_mentioned_p (x, XEXP (XEXP (body, 0), 0))) return 1; return 0; case COND_EXEC: if (reg_overlap_mentioned_p (x, COND_EXEC_TEST (body))) return 1; return reg_referenced_p (x, COND_EXEC_CODE (body)); default: return 0; } } /* Nonzero if register REG is set or clobbered in an insn between FROM_INSN and TO_INSN (exclusive of those two). */ int reg_set_between_p (rtx reg, rtx from_insn, rtx to_insn) { rtx insn; if (from_insn == to_insn) return 0; for (insn = NEXT_INSN (from_insn); insn != to_insn; insn = NEXT_INSN (insn)) if (INSN_P (insn) && reg_set_p (reg, insn)) return 1; return 0; } /* Internals of reg_set_between_p. */ int reg_set_p (rtx reg, rtx insn) { /* We can be passed an insn or part of one. If we are passed an insn, check if a side-effect of the insn clobbers REG. */ if (INSN_P (insn) && (FIND_REG_INC_NOTE (insn, reg) || (CALL_P (insn) && ((REG_P (reg) && REGNO (reg) < FIRST_PSEUDO_REGISTER && overlaps_hard_reg_set_p (regs_invalidated_by_call, GET_MODE (reg), REGNO (reg))) || MEM_P (reg) || find_reg_fusage (insn, CLOBBER, reg))))) return 1; return set_of (reg, insn) != NULL_RTX; } /* Similar to reg_set_between_p, but check all registers in X. Return 0 only if none of them are modified between START and END. Return 1 if X contains a MEM; this routine does usememory aliasing. */ int modified_between_p (rtx x, rtx start, rtx end) { enum rtx_code code = GET_CODE (x); const char *fmt; int i, j; rtx insn; if (start == end) return 0; switch (code) { case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case CONST: case SYMBOL_REF: case LABEL_REF: return 0; case PC: case CC0: return 1; case MEM: if (modified_between_p (XEXP (x, 0), start, end)) return 1; if (MEM_READONLY_P (x)) return 0; for (insn = NEXT_INSN (start); insn != end; insn = NEXT_INSN (insn)) if (memory_modified_in_insn_p (x, insn)) return 1; return 0; break; case REG: return reg_set_between_p (x, start, end); default: break; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e' && modified_between_p (XEXP (x, i), start, end)) return 1; else if (fmt[i] == 'E') for (j = XVECLEN (x, i) - 1; j >= 0; j--) if (modified_between_p (XVECEXP (x, i, j), start, end)) return 1; } return 0; } /* Similar to reg_set_p, but check all registers in X. Return 0 only if none of them are modified in INSN. Return 1 if X contains a MEM; this routine does use memory aliasing. */ int modified_in_p (rtx x, rtx insn) { enum rtx_code code = GET_CODE (x); const char *fmt; int i, j; switch (code) { case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case CONST: case SYMBOL_REF: case LABEL_REF: return 0; case PC: case CC0: return 1; case MEM: if (modified_in_p (XEXP (x, 0), insn)) return 1; if (MEM_READONLY_P (x)) return 0; if (memory_modified_in_insn_p (x, insn)) return 1; return 0; break; case REG: return reg_set_p (x, insn); default: break; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e' && modified_in_p (XEXP (x, i), insn)) return 1; else if (fmt[i] == 'E') for (j = XVECLEN (x, i) - 1; j >= 0; j--) if (modified_in_p (XVECEXP (x, i, j), insn)) return 1; } return 0; } /* Helper function for set_of. */ struct set_of_data { rtx found; rtx pat; }; static void set_of_1 (rtx x, rtx pat, void *data1) { struct set_of_data *data = (struct set_of_data *) (data1); if (rtx_equal_p (x, data->pat) || (!MEM_P (x) && reg_overlap_mentioned_p (data->pat, x))) data->found = pat; } /* Give an INSN, return a SET or CLOBBER expression that does modify PAT (either directly or via STRICT_LOW_PART and similar modifiers). */ rtx set_of (rtx pat, rtx insn) { struct set_of_data data; data.found = NULL_RTX; data.pat = pat; note_stores (INSN_P (insn) ? PATTERN (insn) : insn, set_of_1, &data); return data.found; } /* Given an INSN, return a SET expression if this insn has only a single SET. It may also have CLOBBERs, USEs, or SET whose output will not be used, which we ignore. */ rtx single_set_2 (rtx insn, rtx pat) { rtx set = NULL; int set_verified = 1; int i; if (GET_CODE (pat) == PARALLEL) { for (i = 0; i < XVECLEN (pat, 0); i++) { rtx sub = XVECEXP (pat, 0, i); switch (GET_CODE (sub)) { case USE: case CLOBBER: break; case SET: /* We can consider insns having multiple sets, where all but one are dead as single set insns. In common case only single set is present in the pattern so we want to avoid checking for REG_UNUSED notes unless necessary. When we reach set first time, we just expect this is the single set we are looking for and only when more sets are found in the insn, we check them. */ if (!set_verified) { if (find_reg_note (insn, REG_UNUSED, SET_DEST (set)) && !side_effects_p (set)) set = NULL; else set_verified = 1; } if (!set) set = sub, set_verified = 0; else if (!find_reg_note (insn, REG_UNUSED, SET_DEST (sub)) || side_effects_p (sub)) return NULL_RTX; break; default: return NULL_RTX; } } } return set; } /* Given an INSN, return nonzero if it has more than one SET, else return zero. */ int multiple_sets (rtx insn) { int found; int i; /* INSN must be an insn. */ if (! INSN_P (insn)) return 0; /* Only a PARALLEL can have multiple SETs. */ if (GET_CODE (PATTERN (insn)) == PARALLEL) { for (i = 0, found = 0; i < XVECLEN (PATTERN (insn), 0); i++) if (GET_CODE (XVECEXP (PATTERN (insn), 0, i)) == SET) { /* If we have already found a SET, then return now. */ if (found) return 1; else found = 1; } } /* Either zero or one SET. */ return 0; } /* Return nonzero if the destination of SET equals the source and there are no side effects. */ int set_noop_p (rtx set) { rtx src = SET_SRC (set); rtx dst = SET_DEST (set); if (dst == pc_rtx && src == pc_rtx) return 1; if (MEM_P (dst) && MEM_P (src)) return rtx_equal_p (dst, src) && !side_effects_p (dst); if (GET_CODE (dst) == ZERO_EXTRACT) return rtx_equal_p (XEXP (dst, 0), src) && ! BYTES_BIG_ENDIAN && XEXP (dst, 2) == const0_rtx && !side_effects_p (src); if (GET_CODE (dst) == STRICT_LOW_PART) dst = XEXP (dst, 0); if (GET_CODE (src) == SUBREG && GET_CODE (dst) == SUBREG) { if (SUBREG_BYTE (src) != SUBREG_BYTE (dst)) return 0; src = SUBREG_REG (src); dst = SUBREG_REG (dst); } return (REG_P (src) && REG_P (dst) && REGNO (src) == REGNO (dst)); } /* Return nonzero if an insn consists only of SETs, each of which only sets a value to itself. */ int noop_move_p (rtx insn) { rtx pat = PATTERN (insn); if (INSN_CODE (insn) == NOOP_MOVE_INSN_CODE) return 1; /* Insns carrying these notes are useful later on. */ if (find_reg_note (insn, REG_EQUAL, NULL_RTX)) return 0; /* For now treat an insn with a REG_RETVAL note as a a special insn which should not be considered a no-op. */ if (find_reg_note (insn, REG_RETVAL, NULL_RTX)) return 0; if (GET_CODE (pat) == SET && set_noop_p (pat)) return 1; if (GET_CODE (pat) == PARALLEL) { int i; /* If nothing but SETs of registers to themselves, this insn can also be deleted. */ for (i = 0; i < XVECLEN (pat, 0); i++) { rtx tem = XVECEXP (pat, 0, i); if (GET_CODE (tem) == USE || GET_CODE (tem) == CLOBBER) continue; if (GET_CODE (tem) != SET || ! set_noop_p (tem)) return 0; } return 1; } return 0; } /* Return the last thing that X was assigned from before *PINSN. If VALID_TO is not NULL_RTX then verify that the object is not modified up to VALID_TO. If the object was modified, if we hit a partial assignment to X, or hit a CODE_LABEL first, return X. If we found an assignment, update *PINSN to point to it. ALLOW_HWREG is set to 1 if hardware registers are allowed to be the src. */ rtx find_last_value (rtx x, rtx *pinsn, rtx valid_to, int allow_hwreg) { rtx p; for (p = PREV_INSN (*pinsn); p && !LABEL_P (p); p = PREV_INSN (p)) if (INSN_P (p)) { rtx set = single_set (p); rtx note = find_reg_note (p, REG_EQUAL, NULL_RTX); if (set && rtx_equal_p (x, SET_DEST (set))) { rtx src = SET_SRC (set); if (note && GET_CODE (XEXP (note, 0)) != EXPR_LIST) src = XEXP (note, 0); if ((valid_to == NULL_RTX || ! modified_between_p (src, PREV_INSN (p), valid_to)) /* Reject hard registers because we don't usually want to use them; we'd rather use a pseudo. */ && (! (REG_P (src) && REGNO (src) < FIRST_PSEUDO_REGISTER) || allow_hwreg)) { *pinsn = p; return src; } } /* If set in non-simple way, we don't have a value. */ if (reg_set_p (x, p)) break; } return x; } /* Return nonzero if register in range [REGNO, ENDREGNO) appears either explicitly or implicitly in X other than being stored into. References contained within the substructure at LOC do not count. LOC may be zero, meaning don't ignore anything. */ int refers_to_regno_p (unsigned int regno, unsigned int endregno, rtx x, rtx *loc) { int i; unsigned int x_regno; RTX_CODE code; const char *fmt; repeat: /* The contents of a REG_NONNEG note is always zero, so we must come here upon repeat in case the last REG_NOTE is a REG_NONNEG note. */ if (x == 0) return 0; code = GET_CODE (x); switch (code) { case REG: x_regno = REGNO (x); /* If we modifying the stack, frame, or argument pointer, it will clobber a virtual register. In fact, we could be more precise, but it isn't worth it. */ if ((x_regno == STACK_POINTER_REGNUM #if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM || x_regno == ARG_POINTER_REGNUM #endif || x_regno == FRAME_POINTER_REGNUM) && regno >= FIRST_VIRTUAL_REGISTER && regno <= LAST_VIRTUAL_REGISTER) return 1; return (endregno > x_regno && regno < x_regno + (x_regno < FIRST_PSEUDO_REGISTER ? hard_regno_nregs[x_regno][GET_MODE (x)] : 1)); case SUBREG: /* If this is a SUBREG of a hard reg, we can see exactly which registers are being modified. Otherwise, handle normally. */ if (REG_P (SUBREG_REG (x)) && REGNO (SUBREG_REG (x)) < FIRST_PSEUDO_REGISTER) { unsigned int inner_regno = subreg_regno (x); unsigned int inner_endregno = inner_regno + (inner_regno < FIRST_PSEUDO_REGISTER ? hard_regno_nregs[inner_regno][GET_MODE (x)] : 1); return endregno > inner_regno && regno < inner_endregno; } break; case CLOBBER: case SET: if (&SET_DEST (x) != loc /* Note setting a SUBREG counts as referring to the REG it is in for a pseudo but not for hard registers since we can treat each word individually. */ && ((GET_CODE (SET_DEST (x)) == SUBREG && loc != &SUBREG_REG (SET_DEST (x)) && REG_P (SUBREG_REG (SET_DEST (x))) && REGNO (SUBREG_REG (SET_DEST (x))) >= FIRST_PSEUDO_REGISTER && refers_to_regno_p (regno, endregno, SUBREG_REG (SET_DEST (x)), loc)) || (!REG_P (SET_DEST (x)) && refers_to_regno_p (regno, endregno, SET_DEST (x), loc)))) return 1; if (code == CLOBBER || loc == &SET_SRC (x)) return 0; x = SET_SRC (x); goto repeat; default: break; } /* X does not match, so try its subexpressions. */ fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e' && loc != &XEXP (x, i)) { if (i == 0) { x = XEXP (x, 0); goto repeat; } else if (refers_to_regno_p (regno, endregno, XEXP (x, i), loc)) return 1; } else if (fmt[i] == 'E') { int j; for (j = XVECLEN (x, i) - 1; j >= 0; j--) if (loc != &XVECEXP (x, i, j) && refers_to_regno_p (regno, endregno, XVECEXP (x, i, j), loc)) return 1; } } return 0; } /* Nonzero if modifying X will affect IN. If X is a register or a SUBREG, we check if any register number in X conflicts with the relevant register numbers. If X is a constant, return 0. If X is a MEM, return 1 iff IN contains a MEM (we don't bother checking for memory addresses that can't conflict because we expect this to be a rare case. */ int reg_overlap_mentioned_p (rtx x, rtx in) { unsigned int regno, endregno; /* If either argument is a constant, then modifying X can not affect IN. Here we look at IN, we can profitably combine CONSTANT_P (x) with the switch statement below. */ if (CONSTANT_P (in)) return 0; recurse: switch (GET_CODE (x)) { case STRICT_LOW_PART: case ZERO_EXTRACT: case SIGN_EXTRACT: /* Overly conservative. */ x = XEXP (x, 0); goto recurse; case SUBREG: regno = REGNO (SUBREG_REG (x)); if (regno < FIRST_PSEUDO_REGISTER) regno = subreg_regno (x); goto do_reg; case REG: regno = REGNO (x); do_reg: endregno = regno + (regno < FIRST_PSEUDO_REGISTER ? hard_regno_nregs[regno][GET_MODE (x)] : 1); return refers_to_regno_p (regno, endregno, in, (rtx*) 0); case MEM: { const char *fmt; int i; if (MEM_P (in)) return 1; fmt = GET_RTX_FORMAT (GET_CODE (in)); for (i = GET_RTX_LENGTH (GET_CODE (in)) - 1; i >= 0; i--) if (fmt[i] == 'e') { if (reg_overlap_mentioned_p (x, XEXP (in, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = XVECLEN (in, i) - 1; j >= 0; --j) if (reg_overlap_mentioned_p (x, XVECEXP (in, i, j))) return 1; } return 0; } case SCRATCH: case PC: case CC0: return reg_mentioned_p (x, in); case PARALLEL: { int i; /* If any register in here refers to it we return true. */ for (i = XVECLEN (x, 0) - 1; i >= 0; i--) if (XEXP (XVECEXP (x, 0, i), 0) != 0 && reg_overlap_mentioned_p (XEXP (XVECEXP (x, 0, i), 0), in)) return 1; return 0; } default: gcc_assert (CONSTANT_P (x)); return 0; } } /* Call FUN on each register or MEM that is stored into or clobbered by X. (X would be the pattern of an insn). FUN receives two arguments: the REG, MEM, CC0 or PC being stored in or clobbered, the SET or CLOBBER rtx that does the store. If the item being stored in or clobbered is a SUBREG of a hard register, the SUBREG will be passed. */ void note_stores (rtx x, void (*fun) (rtx, rtx, void *), void *data) { int i; if (GET_CODE (x) == COND_EXEC) x = COND_EXEC_CODE (x); if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER) { rtx dest = SET_DEST (x); while ((GET_CODE (dest) == SUBREG && (!REG_P (SUBREG_REG (dest)) || REGNO (SUBREG_REG (dest)) >= FIRST_PSEUDO_REGISTER)) || GET_CODE (dest) == ZERO_EXTRACT || GET_CODE (dest) == STRICT_LOW_PART) dest = XEXP (dest, 0); /* If we have a PARALLEL, SET_DEST is a list of EXPR_LIST expressions, each of whose first operand is a register. */ if (GET_CODE (dest) == PARALLEL) { for (i = XVECLEN (dest, 0) - 1; i >= 0; i--) if (XEXP (XVECEXP (dest, 0, i), 0) != 0) (*fun) (XEXP (XVECEXP (dest, 0, i), 0), x, data); } else (*fun) (dest, x, data); } else if (GET_CODE (x) == PARALLEL) for (i = XVECLEN (x, 0) - 1; i >= 0; i--) note_stores (XVECEXP (x, 0, i), fun, data); } /* Like notes_stores, but call FUN for each expression that is being referenced in PBODY, a pointer to the PATTERN of an insn. We only call FUN for each expression, not any interior subexpressions. FUN receives a pointer to the expression and the DATA passed to this function. Note that this is not quite the same test as that done in reg_referenced_p since that considers something as being referenced if it is being partially set, while we do not. */ void note_uses (rtx *pbody, void (*fun) (rtx *, void *), void *data) { rtx body = *pbody; int i; switch (GET_CODE (body)) { case COND_EXEC: (*fun) (&COND_EXEC_TEST (body), data); note_uses (&COND_EXEC_CODE (body), fun, data); return; case PARALLEL: for (i = XVECLEN (body, 0) - 1; i >= 0; i--) note_uses (&XVECEXP (body, 0, i), fun, data); return; case USE: (*fun) (&XEXP (body, 0), data); return; case ASM_OPERANDS: for (i = ASM_OPERANDS_INPUT_LENGTH (body) - 1; i >= 0; i--) (*fun) (&ASM_OPERANDS_INPUT (body, i), data); return; case TRAP_IF: (*fun) (&TRAP_CONDITION (body), data); return; case PREFETCH: (*fun) (&XEXP (body, 0), data); return; case UNSPEC: case UNSPEC_VOLATILE: for (i = XVECLEN (body, 0) - 1; i >= 0; i--) (*fun) (&XVECEXP (body, 0, i), data); return; case CLOBBER: if (MEM_P (XEXP (body, 0))) (*fun) (&XEXP (XEXP (body, 0), 0), data); return; case SET: { rtx dest = SET_DEST (body); /* For sets we replace everything in source plus registers in memory expression in store and operands of a ZERO_EXTRACT. */ (*fun) (&SET_SRC (body), data); if (GET_CODE (dest) == ZERO_EXTRACT) { (*fun) (&XEXP (dest, 1), data); (*fun) (&XEXP (dest, 2), data); } while (GET_CODE (dest) == SUBREG || GET_CODE (dest) == STRICT_LOW_PART) dest = XEXP (dest, 0); if (MEM_P (dest)) (*fun) (&XEXP (dest, 0), data); } return; default: /* All the other possibilities never store. */ (*fun) (pbody, data); return; } } /* Return nonzero if X's old contents don't survive after INSN. This will be true if X is (cc0) or if X is a register and X dies in INSN or because INSN entirely sets X. "Entirely set" means set directly and not through a SUBREG, or ZERO_EXTRACT, so no trace of the old contents remains. Likewise, REG_INC does not count. REG may be a hard or pseudo reg. Renumbering is not taken into account, but for this use that makes no difference, since regs don't overlap during their lifetimes. Therefore, this function may be used at any time after deaths have been computed (in flow.c). If REG is a hard reg that occupies multiple machine registers, this function will only return 1 if each of those registers will be replaced by INSN. */ int dead_or_set_p (rtx insn, rtx x) { unsigned int regno, last_regno; unsigned int i; /* Can't use cc0_rtx below since this file is used by genattrtab.c. */ if (GET_CODE (x) == CC0) return 1; gcc_assert (REG_P (x)); regno = REGNO (x); last_regno = (regno >= FIRST_PSEUDO_REGISTER ? regno : regno + hard_regno_nregs[regno][GET_MODE (x)] - 1); for (i = regno; i <= last_regno; i++) if (! dead_or_set_regno_p (insn, i)) return 0; return 1; } /* Return TRUE iff DEST is a register or subreg of a register and doesn't change the number of words of the inner register, and any part of the register is TEST_REGNO. */ static bool covers_regno_no_parallel_p (rtx dest, unsigned int test_regno) { unsigned int regno, endregno; if (GET_CODE (dest) == SUBREG && (((GET_MODE_SIZE (GET_MODE (dest)) + UNITS_PER_WORD - 1) / UNITS_PER_WORD) == ((GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))) + UNITS_PER_WORD - 1) / UNITS_PER_WORD))) dest = SUBREG_REG (dest); if (!REG_P (dest)) return false; regno = REGNO (dest); endregno = (regno >= FIRST_PSEUDO_REGISTER ? regno + 1 : regno + hard_regno_nregs[regno][GET_MODE (dest)]); return (test_regno >= regno && test_regno < endregno); } /* Like covers_regno_no_parallel_p, but also handles PARALLELs where any member matches the covers_regno_no_parallel_p criteria. */ static bool covers_regno_p (rtx dest, unsigned int test_regno) { if (GET_CODE (dest) == PARALLEL) { /* Some targets place small structures in registers for return values of functions, and those registers are wrapped in PARALLELs that we may see as the destination of a SET. */ int i; for (i = XVECLEN (dest, 0) - 1; i >= 0; i--) { rtx inner = XEXP (XVECEXP (dest, 0, i), 0); if (inner != NULL_RTX && covers_regno_no_parallel_p (inner, test_regno)) return true; } return false; } else return covers_regno_no_parallel_p (dest, test_regno); } /* Utility function for dead_or_set_p to check an individual register. Also called from flow.c. */ int dead_or_set_regno_p (rtx insn, unsigned int test_regno) { rtx pattern; /* See if there is a death note for something that includes TEST_REGNO. */ if (find_regno_note (insn, REG_DEAD, test_regno)) return 1; if (CALL_P (insn) && find_regno_fusage (insn, CLOBBER, test_regno)) return 1; pattern = PATTERN (insn); if (GET_CODE (pattern) == COND_EXEC) pattern = COND_EXEC_CODE (pattern); if (GET_CODE (pattern) == SET) return covers_regno_p (SET_DEST (pattern), test_regno); else if (GET_CODE (pattern) == PARALLEL) { int i; for (i = XVECLEN (pattern, 0) - 1; i >= 0; i--) { rtx body = XVECEXP (pattern, 0, i); if (GET_CODE (body) == COND_EXEC) body = COND_EXEC_CODE (body); if ((GET_CODE (body) == SET || GET_CODE (body) == CLOBBER) && covers_regno_p (SET_DEST (body), test_regno)) return 1; } } return 0; } /* Return the reg-note of kind KIND in insn INSN, if there is one. If DATUM is nonzero, look for one whose datum is DATUM. */ rtx find_reg_note (rtx insn, enum reg_note kind, rtx datum) { rtx link; gcc_assert (insn); /* Ignore anything that is not an INSN, JUMP_INSN or CALL_INSN. */ if (! INSN_P (insn)) return 0; if (datum == 0) { for (link = REG_NOTES (insn); link; link = XEXP (link, 1)) if (REG_NOTE_KIND (link) == kind) return link; return 0; } for (link = REG_NOTES (insn); link; link = XEXP (link, 1)) if (REG_NOTE_KIND (link) == kind && datum == XEXP (link, 0)) return link; return 0; } /* Return the reg-note of kind KIND in insn INSN which applies to register number REGNO, if any. Return 0 if there is no such reg-note. Note that the REGNO of this NOTE need not be REGNO if REGNO is a hard register; it might be the case that the note overlaps REGNO. */ rtx find_regno_note (rtx insn, enum reg_note kind, unsigned int regno) { rtx link; /* Ignore anything that is not an INSN, JUMP_INSN or CALL_INSN. */ if (! INSN_P (insn)) return 0; for (link = REG_NOTES (insn); link; link = XEXP (link, 1)) if (REG_NOTE_KIND (link) == kind /* Verify that it is a register, so that scratch and MEM won't cause a problem here. */ && REG_P (XEXP (link, 0)) && REGNO (XEXP (link, 0)) <= regno && ((REGNO (XEXP (link, 0)) + (REGNO (XEXP (link, 0)) >= FIRST_PSEUDO_REGISTER ? 1 : hard_regno_nregs[REGNO (XEXP (link, 0))] [GET_MODE (XEXP (link, 0))])) > regno)) return link; return 0; } /* Return a REG_EQUIV or REG_EQUAL note if insn has only a single set and has such a note. */ rtx find_reg_equal_equiv_note (rtx insn) { rtx link; if (!INSN_P (insn)) return 0; for (link = REG_NOTES (insn); link; link = XEXP (link, 1)) if (REG_NOTE_KIND (link) == REG_EQUAL || REG_NOTE_KIND (link) == REG_EQUIV) { if (single_set (insn) == 0) return 0; return link; } return NULL; } /* Return true if DATUM, or any overlap of DATUM, of kind CODE is found in the CALL_INSN_FUNCTION_USAGE information of INSN. */ int find_reg_fusage (rtx insn, enum rtx_code code, rtx datum) { /* If it's not a CALL_INSN, it can't possibly have a CALL_INSN_FUNCTION_USAGE field, so don't bother checking. */ if (!CALL_P (insn)) return 0; gcc_assert (datum); if (!REG_P (datum)) { rtx link; for (link = CALL_INSN_FUNCTION_USAGE (insn); link; link = XEXP (link, 1)) if (GET_CODE (XEXP (link, 0)) == code && rtx_equal_p (datum, XEXP (XEXP (link, 0), 0))) return 1; } else { unsigned int regno = REGNO (datum); /* CALL_INSN_FUNCTION_USAGE information cannot contain references to pseudo registers, so don't bother checking. */ if (regno < FIRST_PSEUDO_REGISTER) { unsigned int end_regno = regno + hard_regno_nregs[regno][GET_MODE (datum)]; unsigned int i; for (i = regno; i < end_regno; i++) if (find_regno_fusage (insn, code, i)) return 1; } } return 0; } /* Return true if REGNO, or any overlap of REGNO, of kind CODE is found in the CALL_INSN_FUNCTION_USAGE information of INSN. */ int find_regno_fusage (rtx insn, enum rtx_code code, unsigned int regno) { rtx link; /* CALL_INSN_FUNCTION_USAGE information cannot contain references to pseudo registers, so don't bother checking. */ if (regno >= FIRST_PSEUDO_REGISTER || !CALL_P (insn) ) return 0; for (link = CALL_INSN_FUNCTION_USAGE (insn); link; link = XEXP (link, 1)) { unsigned int regnote; rtx op, reg; if (GET_CODE (op = XEXP (link, 0)) == code && REG_P (reg = XEXP (op, 0)) && (regnote = REGNO (reg)) <= regno && regnote + hard_regno_nregs[regnote][GET_MODE (reg)] > regno) return 1; } return 0; } /* Return true if INSN is a call to a pure function. */ int pure_call_p (rtx insn) { rtx link; if (!CALL_P (insn) || ! CONST_OR_PURE_CALL_P (insn)) return 0; /* Look for the note that differentiates const and pure functions. */ for (link = CALL_INSN_FUNCTION_USAGE (insn); link; link = XEXP (link, 1)) { rtx u, m; if (GET_CODE (u = XEXP (link, 0)) == USE && MEM_P (m = XEXP (u, 0)) && GET_MODE (m) == BLKmode && GET_CODE (XEXP (m, 0)) == SCRATCH) return 1; } return 0; } /* Remove register note NOTE from the REG_NOTES of INSN. */ void remove_note (rtx insn, rtx note) { rtx link; if (note == NULL_RTX) return; if (REG_NOTES (insn) == note) { REG_NOTES (insn) = XEXP (note, 1); return; } for (link = REG_NOTES (insn); link; link = XEXP (link, 1)) if (XEXP (link, 1) == note) { XEXP (link, 1) = XEXP (note, 1); return; } gcc_unreachable (); } /* Search LISTP (an EXPR_LIST) for an entry whose first operand is NODE and return 1 if it is found. A simple equality test is used to determine if NODE matches. */ int in_expr_list_p (rtx listp, rtx node) { rtx x; for (x = listp; x; x = XEXP (x, 1)) if (node == XEXP (x, 0)) return 1; return 0; } /* Search LISTP (an EXPR_LIST) for an entry whose first operand is NODE and remove that entry from the list if it is found. A simple equality test is used to determine if NODE matches. */ void remove_node_from_expr_list (rtx node, rtx *listp) { rtx temp = *listp; rtx prev = NULL_RTX; while (temp) { if (node == XEXP (temp, 0)) { /* Splice the node out of the list. */ if (prev) XEXP (prev, 1) = XEXP (temp, 1); else *listp = XEXP (temp, 1); return; } prev = temp; temp = XEXP (temp, 1); } } /* Nonzero if X contains any volatile instructions. These are instructions which may cause unpredictable machine state instructions, and thus no instructions should be moved or combined across them. This includes only volatile asms and UNSPEC_VOLATILE instructions. */ int volatile_insn_p (rtx x) { RTX_CODE code; code = GET_CODE (x); switch (code) { case LABEL_REF: case SYMBOL_REF: case CONST_INT: case CONST: case CONST_DOUBLE: case CONST_VECTOR: case CC0: case PC: case REG: case SCRATCH: case CLOBBER: case ADDR_VEC: case ADDR_DIFF_VEC: case CALL: case MEM: return 0; case UNSPEC_VOLATILE: /* case TRAP_IF: This isn't clear yet. */ return 1; case ASM_INPUT: case ASM_OPERANDS: if (MEM_VOLATILE_P (x)) return 1; default: break; } /* Recursively scan the operands of this expression. */ { const char *fmt = GET_RTX_FORMAT (code); int i; for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e') { if (volatile_insn_p (XEXP (x, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (volatile_insn_p (XVECEXP (x, i, j))) return 1; } } } return 0; } /* Nonzero if X contains any volatile memory references UNSPEC_VOLATILE operations or volatile ASM_OPERANDS expressions. */ int volatile_refs_p (rtx x) { RTX_CODE code; code = GET_CODE (x); switch (code) { case LABEL_REF: case SYMBOL_REF: case CONST_INT: case CONST: case CONST_DOUBLE: case CONST_VECTOR: case CC0: case PC: case REG: case SCRATCH: case CLOBBER: case ADDR_VEC: case ADDR_DIFF_VEC: return 0; case UNSPEC_VOLATILE: return 1; case MEM: case ASM_INPUT: case ASM_OPERANDS: if (MEM_VOLATILE_P (x)) return 1; default: break; } /* Recursively scan the operands of this expression. */ { const char *fmt = GET_RTX_FORMAT (code); int i; for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e') { if (volatile_refs_p (XEXP (x, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (volatile_refs_p (XVECEXP (x, i, j))) return 1; } } } return 0; } /* Similar to above, except that it also rejects register pre- and post- incrementing. */ int side_effects_p (rtx x) { RTX_CODE code; code = GET_CODE (x); switch (code) { case LABEL_REF: case SYMBOL_REF: case CONST_INT: case CONST: case CONST_DOUBLE: case CONST_VECTOR: case CC0: case PC: case REG: case SCRATCH: case ADDR_VEC: case ADDR_DIFF_VEC: return 0; case CLOBBER: /* Reject CLOBBER with a non-VOID mode. These are made by combine.c when some combination can't be done. If we see one, don't think that we can simplify the expression. */ return (GET_MODE (x) != VOIDmode); case PRE_INC: case PRE_DEC: case POST_INC: case POST_DEC: case PRE_MODIFY: case POST_MODIFY: case CALL: case UNSPEC_VOLATILE: /* case TRAP_IF: This isn't clear yet. */ return 1; case MEM: case ASM_INPUT: case ASM_OPERANDS: if (MEM_VOLATILE_P (x)) return 1; default: break; } /* Recursively scan the operands of this expression. */ { const char *fmt = GET_RTX_FORMAT (code); int i; for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e') { if (side_effects_p (XEXP (x, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (side_effects_p (XVECEXP (x, i, j))) return 1; } } } return 0; } enum may_trap_p_flags { MTP_UNALIGNED_MEMS = 1, MTP_AFTER_MOVE = 2 }; /* Return nonzero if evaluating rtx X might cause a trap. (FLAGS & MTP_UNALIGNED_MEMS) controls whether nonzero is returned for unaligned memory accesses on strict alignment machines. If (FLAGS & AFTER_MOVE) is true, returns nonzero even in case the expression cannot trap at its current location, but it might become trapping if moved elsewhere. */ static int may_trap_p_1 (rtx x, unsigned flags) { int i; enum rtx_code code; const char *fmt; bool unaligned_mems = (flags & MTP_UNALIGNED_MEMS) != 0; if (x == 0) return 0; code = GET_CODE (x); switch (code) { /* Handle these cases quickly. */ case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case SYMBOL_REF: case LABEL_REF: case CONST: case PC: case CC0: case REG: case SCRATCH: return 0; case ASM_INPUT: case UNSPEC_VOLATILE: case TRAP_IF: return 1; case ASM_OPERANDS: return MEM_VOLATILE_P (x); /* Memory ref can trap unless it's a static var or a stack slot. */ case MEM: if (/* MEM_NOTRAP_P only relates to the actual position of the memory reference; moving it out of condition might cause its address become invalid. */ !(flags & MTP_AFTER_MOVE) && MEM_NOTRAP_P (x) && (!STRICT_ALIGNMENT || !unaligned_mems)) return 0; return rtx_addr_can_trap_p_1 (XEXP (x, 0), GET_MODE (x), unaligned_mems); /* Division by a non-constant might trap. */ case DIV: case MOD: case UDIV: case UMOD: if (HONOR_SNANS (GET_MODE (x))) return 1; if (SCALAR_FLOAT_MODE_P (GET_MODE (x))) return flag_trapping_math; if (!CONSTANT_P (XEXP (x, 1)) || (XEXP (x, 1) == const0_rtx)) return 1; break; case EXPR_LIST: /* An EXPR_LIST is used to represent a function call. This certainly may trap. */ return 1; case GE: case GT: case LE: case LT: case LTGT: case COMPARE: /* Some floating point comparisons may trap. */ if (!flag_trapping_math) break; /* ??? There is no machine independent way to check for tests that trap when COMPARE is used, though many targets do make this distinction. For instance, sparc uses CCFPE for compares which generate exceptions and CCFP for compares which do not generate exceptions. */ if (HONOR_NANS (GET_MODE (x))) return 1; /* But often the compare has some CC mode, so check operand modes as well. */ if (HONOR_NANS (GET_MODE (XEXP (x, 0))) || HONOR_NANS (GET_MODE (XEXP (x, 1)))) return 1; break; case EQ: case NE: if (HONOR_SNANS (GET_MODE (x))) return 1; /* Often comparison is CC mode, so check operand modes. */ if (HONOR_SNANS (GET_MODE (XEXP (x, 0))) || HONOR_SNANS (GET_MODE (XEXP (x, 1)))) return 1; break; case FIX: /* Conversion of floating point might trap. */ if (flag_trapping_math && HONOR_NANS (GET_MODE (XEXP (x, 0)))) return 1; break; case NEG: case ABS: case SUBREG: /* These operations don't trap even with floating point. */ break; default: /* Any floating arithmetic may trap. */ if (SCALAR_FLOAT_MODE_P (GET_MODE (x)) && flag_trapping_math) return 1; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e') { if (may_trap_p_1 (XEXP (x, i), flags)) return 1; } else if (fmt[i] == 'E') { int j; for (j = 0; j < XVECLEN (x, i); j++) if (may_trap_p_1 (XVECEXP (x, i, j), flags)) return 1; } } return 0; } /* Return nonzero if evaluating rtx X might cause a trap. */ int may_trap_p (rtx x) { return may_trap_p_1 (x, 0); } /* Return nonzero if evaluating rtx X might cause a trap, when the expression is moved from its current location by some optimization. */ int may_trap_after_code_motion_p (rtx x) { return may_trap_p_1 (x, MTP_AFTER_MOVE); } /* Same as above, but additionally return nonzero if evaluating rtx X might cause a fault. We define a fault for the purpose of this function as a erroneous execution condition that cannot be encountered during the normal execution of a valid program; the typical example is an unaligned memory access on a strict alignment machine. The compiler guarantees that it doesn't generate code that will fault from a valid program, but this guarantee doesn't mean anything for individual instructions. Consider the following example: struct S { int d; union { char *cp; int *ip; }; }; int foo(struct S *s) { if (s->d == 1) return *s->ip; else return *s->cp; } on a strict alignment machine. In a valid program, foo will never be invoked on a structure for which d is equal to 1 and the underlying unique field of the union not aligned on a 4-byte boundary, but the expression *s->ip might cause a fault if considered individually. At the RTL level, potentially problematic expressions will almost always verify may_trap_p; for example, the above dereference can be emitted as (mem:SI (reg:P)) and this expression is may_trap_p for a generic register. However, suppose that foo is inlined in a caller that causes s->cp to point to a local character variable and guarantees that s->d is not set to 1; foo may have been effectively translated into pseudo-RTL as: if ((reg:SI) == 1) (set (reg:SI) (mem:SI (%fp - 7))) else (set (reg:QI) (mem:QI (%fp - 7))) Now (mem:SI (%fp - 7)) is considered as not may_trap_p since it is a memory reference to a stack slot, but it will certainly cause a fault on a strict alignment machine. */ int may_trap_or_fault_p (rtx x) { return may_trap_p_1 (x, MTP_UNALIGNED_MEMS); } /* Return nonzero if X contains a comparison that is not either EQ or NE, i.e., an inequality. */ int inequality_comparisons_p (rtx x) { const char *fmt; int len, i; enum rtx_code code = GET_CODE (x); switch (code) { case REG: case SCRATCH: case PC: case CC0: case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case CONST: case LABEL_REF: case SYMBOL_REF: return 0; case LT: case LTU: case GT: case GTU: case LE: case LEU: case GE: case GEU: return 1; default: break; } len = GET_RTX_LENGTH (code); fmt = GET_RTX_FORMAT (code); for (i = 0; i < len; i++) { if (fmt[i] == 'e') { if (inequality_comparisons_p (XEXP (x, i))) return 1; } else if (fmt[i] == 'E') { int j; for (j = XVECLEN (x, i) - 1; j >= 0; j--) if (inequality_comparisons_p (XVECEXP (x, i, j))) return 1; } } return 0; } /* Replace any occurrence of FROM in X with TO. The function does not enter into CONST_DOUBLE for the replace. Note that copying is not done so X must not be shared unless all copies are to be modified. */ rtx replace_rtx (rtx x, rtx from, rtx to) { int i, j; const char *fmt; /* The following prevents loops occurrence when we change MEM in CONST_DOUBLE onto the same CONST_DOUBLE. */ if (x != 0 && GET_CODE (x) == CONST_DOUBLE) return x; if (x == from) return to; /* Allow this function to make replacements in EXPR_LISTs. */ if (x == 0) return 0; if (GET_CODE (x) == SUBREG) { rtx new = replace_rtx (SUBREG_REG (x), from, to); if (GET_CODE (new) == CONST_INT) { x = simplify_subreg (GET_MODE (x), new, GET_MODE (SUBREG_REG (x)), SUBREG_BYTE (x)); gcc_assert (x); } else SUBREG_REG (x) = new; return x; } else if (GET_CODE (x) == ZERO_EXTEND) { rtx new = replace_rtx (XEXP (x, 0), from, to); if (GET_CODE (new) == CONST_INT) { x = simplify_unary_operation (ZERO_EXTEND, GET_MODE (x), new, GET_MODE (XEXP (x, 0))); gcc_assert (x); } else XEXP (x, 0) = new; return x; } fmt = GET_RTX_FORMAT (GET_CODE (x)); for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--) { if (fmt[i] == 'e') XEXP (x, i) = replace_rtx (XEXP (x, i), from, to); else if (fmt[i] == 'E') for (j = XVECLEN (x, i) - 1; j >= 0; j--) XVECEXP (x, i, j) = replace_rtx (XVECEXP (x, i, j), from, to); } return x; } /* Replace occurrences of the old label in *X with the new one. DATA is a REPLACE_LABEL_DATA containing the old and new labels. */ int replace_label (rtx *x, void *data) { rtx l = *x; rtx old_label = ((replace_label_data *) data)->r1; rtx new_label = ((replace_label_data *) data)->r2; bool update_label_nuses = ((replace_label_data *) data)->update_label_nuses; if (l == NULL_RTX) return 0; if (GET_CODE (l) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (l)) { rtx c = get_pool_constant (l); if (rtx_referenced_p (old_label, c)) { rtx new_c, new_l; replace_label_data *d = (replace_label_data *) data; /* Create a copy of constant C; replace the label inside but do not update LABEL_NUSES because uses in constant pool are not counted. */ new_c = copy_rtx (c); d->update_label_nuses = false; for_each_rtx (&new_c, replace_label, data); d->update_label_nuses = update_label_nuses; /* Add the new constant NEW_C to constant pool and replace the old reference to constant by new reference. */ new_l = XEXP (force_const_mem (get_pool_mode (l), new_c), 0); *x = replace_rtx (l, l, new_l); } return 0; } /* If this is a JUMP_INSN, then we also need to fix the JUMP_LABEL field. This is not handled by for_each_rtx because it doesn't handle unprinted ('0') fields. */ if (JUMP_P (l) && JUMP_LABEL (l) == old_label) JUMP_LABEL (l) = new_label; if ((GET_CODE (l) == LABEL_REF || GET_CODE (l) == INSN_LIST) && XEXP (l, 0) == old_label) { XEXP (l, 0) = new_label; if (update_label_nuses) { ++LABEL_NUSES (new_label); --LABEL_NUSES (old_label); } return 0; } return 0; } /* When *BODY is equal to X or X is directly referenced by *BODY return nonzero, thus FOR_EACH_RTX stops traversing and returns nonzero too, otherwise FOR_EACH_RTX continues traversing *BODY. */ static int rtx_referenced_p_1 (rtx *body, void *x) { rtx y = (rtx) x; if (*body == NULL_RTX) return y == NULL_RTX; /* Return true if a label_ref *BODY refers to label Y. */ if (GET_CODE (*body) == LABEL_REF && LABEL_P (y)) return XEXP (*body, 0) == y; /* If *BODY is a reference to pool constant traverse the constant. */ if (GET_CODE (*body) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (*body)) return rtx_referenced_p (y, get_pool_constant (*body)); /* By default, compare the RTL expressions. */ return rtx_equal_p (*body, y); } /* Return true if X is referenced in BODY. */ int rtx_referenced_p (rtx x, rtx body) { return for_each_rtx (&body, rtx_referenced_p_1, x); } /* If INSN is a tablejump return true and store the label (before jump table) to *LABELP and the jump table to *TABLEP. LABELP and TABLEP may be NULL. */ bool tablejump_p (rtx insn, rtx *labelp, rtx *tablep) { rtx label, table; if (JUMP_P (insn) && (label = JUMP_LABEL (insn)) != NULL_RTX && (table = next_active_insn (label)) != NULL_RTX && JUMP_P (table) && (GET_CODE (PATTERN (table)) == ADDR_VEC || GET_CODE (PATTERN (table)) == ADDR_DIFF_VEC)) { if (labelp) *labelp = label; if (tablep) *tablep = table; return true; } return false; } /* A subroutine of computed_jump_p, return 1 if X contains a REG or MEM or constant that is not in the constant pool and not in the condition of an IF_THEN_ELSE. */ static int computed_jump_p_1 (rtx x) { enum rtx_code code = GET_CODE (x); int i, j; const char *fmt; switch (code) { case LABEL_REF: case PC: return 0; case CONST: case CONST_INT: case CONST_DOUBLE: case CONST_VECTOR: case SYMBOL_REF: case REG: return 1; case MEM: return ! (GET_CODE (XEXP (x, 0)) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (XEXP (x, 0))); case IF_THEN_ELSE: return (computed_jump_p_1 (XEXP (x, 1)) || computed_jump_p_1 (XEXP (x, 2))); default: break; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e' && computed_jump_p_1 (XEXP (x, i))) return 1; else if (fmt[i] == 'E') for (j = 0; j < XVECLEN (x, i); j++) if (computed_jump_p_1 (XVECEXP (x, i, j))) return 1; } return 0; } /* Return nonzero if INSN is an indirect jump (aka computed jump). Tablejumps and casesi insns are not considered indirect jumps; we can recognize them by a (use (label_ref)). */ int computed_jump_p (rtx insn) { int i; if (JUMP_P (insn)) { rtx pat = PATTERN (insn); if (find_reg_note (insn, REG_LABEL, NULL_RTX)) return 0; else if (GET_CODE (pat) == PARALLEL) { int len = XVECLEN (pat, 0); int has_use_labelref = 0; for (i = len - 1; i >= 0; i--) if (GET_CODE (XVECEXP (pat, 0, i)) == USE && (GET_CODE (XEXP (XVECEXP (pat, 0, i), 0)) == LABEL_REF)) has_use_labelref = 1; if (! has_use_labelref) for (i = len - 1; i >= 0; i--) if (GET_CODE (XVECEXP (pat, 0, i)) == SET && SET_DEST (XVECEXP (pat, 0, i)) == pc_rtx && computed_jump_p_1 (SET_SRC (XVECEXP (pat, 0, i)))) return 1; } else if (GET_CODE (pat) == SET && SET_DEST (pat) == pc_rtx && computed_jump_p_1 (SET_SRC (pat))) return 1; } return 0; } /* Optimized loop of for_each_rtx, trying to avoid useless recursive calls. Processes the subexpressions of EXP and passes them to F. */ static int for_each_rtx_1 (rtx exp, int n, rtx_function f, void *data) { int result, i, j; const char *format = GET_RTX_FORMAT (GET_CODE (exp)); rtx *x; for (; format[n] != '\0'; n++) { switch (format[n]) { case 'e': /* Call F on X. */ x = &XEXP (exp, n); result = (*f) (x, data); if (result == -1) /* Do not traverse sub-expressions. */ continue; else if (result != 0) /* Stop the traversal. */ return result; if (*x == NULL_RTX) /* There are no sub-expressions. */ continue; i = non_rtx_starting_operands[GET_CODE (*x)]; if (i >= 0) { result = for_each_rtx_1 (*x, i, f, data); if (result != 0) return result; } break; case 'V': case 'E': if (XVEC (exp, n) == 0) continue; for (j = 0; j < XVECLEN (exp, n); ++j) { /* Call F on X. */ x = &XVECEXP (exp, n, j); result = (*f) (x, data); if (result == -1) /* Do not traverse sub-expressions. */ continue; else if (result != 0) /* Stop the traversal. */ return result; if (*x == NULL_RTX) /* There are no sub-expressions. */ continue; i = non_rtx_starting_operands[GET_CODE (*x)]; if (i >= 0) { result = for_each_rtx_1 (*x, i, f, data); if (result != 0) return result; } } break; default: /* Nothing to do. */ break; } } return 0; } /* Traverse X via depth-first search, calling F for each sub-expression (including X itself). F is also passed the DATA. If F returns -1, do not traverse sub-expressions, but continue traversing the rest of the tree. If F ever returns any other nonzero value, stop the traversal, and return the value returned by F. Otherwise, return 0. This function does not traverse inside tree structure that contains RTX_EXPRs, or into sub-expressions whose format code is `0' since it is not known whether or not those codes are actually RTL. This routine is very general, and could (should?) be used to implement many of the other routines in this file. */ int for_each_rtx (rtx *x, rtx_function f, void *data) { int result; int i; /* Call F on X. */ result = (*f) (x, data); if (result == -1) /* Do not traverse sub-expressions. */ return 0; else if (result != 0) /* Stop the traversal. */ return result; if (*x == NULL_RTX) /* There are no sub-expressions. */ return 0; i = non_rtx_starting_operands[GET_CODE (*x)]; if (i < 0) return 0; return for_each_rtx_1 (*x, i, f, data); } /* Searches X for any reference to REGNO, returning the rtx of the reference found if any. Otherwise, returns NULL_RTX. */ rtx regno_use_in (unsigned int regno, rtx x) { const char *fmt; int i, j; rtx tem; if (REG_P (x) && REGNO (x) == regno) return x; fmt = GET_RTX_FORMAT (GET_CODE (x)); for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--) { if (fmt[i] == 'e') { if ((tem = regno_use_in (regno, XEXP (x, i)))) return tem; } else if (fmt[i] == 'E') for (j = XVECLEN (x, i) - 1; j >= 0; j--) if ((tem = regno_use_in (regno , XVECEXP (x, i, j)))) return tem; } return NULL_RTX; } /* Return a value indicating whether OP, an operand of a commutative operation, is preferred as the first or second operand. The higher the value, the stronger the preference for being the first operand. We use negative values to indicate a preference for the first operand and positive values for the second operand. */ int commutative_operand_precedence (rtx op) { enum rtx_code code = GET_CODE (op); /* Constants always come the second operand. Prefer "nice" constants. */ if (code == CONST_INT) return -7; if (code == CONST_DOUBLE) return -6; op = avoid_constant_pool_reference (op); code = GET_CODE (op); switch (GET_RTX_CLASS (code)) { case RTX_CONST_OBJ: if (code == CONST_INT) return -5; if (code == CONST_DOUBLE) return -4; return -3; case RTX_EXTRA: /* SUBREGs of objects should come second. */ if (code == SUBREG && OBJECT_P (SUBREG_REG (op))) return -2; if (!CONSTANT_P (op)) return 0; else /* As for RTX_CONST_OBJ. */ return -3; case RTX_OBJ: /* Complex expressions should be the first, so decrease priority of objects. */ return -1; case RTX_COMM_ARITH: /* Prefer operands that are themselves commutative to be first. This helps to make things linear. In particular, (and (and (reg) (reg)) (not (reg))) is canonical. */ return 4; case RTX_BIN_ARITH: /* If only one operand is a binary expression, it will be the first operand. In particular, (plus (minus (reg) (reg)) (neg (reg))) is canonical, although it will usually be further simplified. */ return 2; case RTX_UNARY: /* Then prefer NEG and NOT. */ if (code == NEG || code == NOT) return 1; default: return 0; } } /* Return 1 iff it is necessary to swap operands of commutative operation in order to canonicalize expression. */ int swap_commutative_operands_p (rtx x, rtx y) { return (commutative_operand_precedence (x) < commutative_operand_precedence (y)); } /* Return 1 if X is an autoincrement side effect and the register is not the stack pointer. */ int auto_inc_p (rtx x) { switch (GET_CODE (x)) { case PRE_INC: case POST_INC: case PRE_DEC: case POST_DEC: case PRE_MODIFY: case POST_MODIFY: /* There are no REG_INC notes for SP. */ if (XEXP (x, 0) != stack_pointer_rtx) return 1; default: break; } return 0; } /* Return nonzero if IN contains a piece of rtl that has the address LOC. */ int loc_mentioned_in_p (rtx *loc, rtx in) { enum rtx_code code = GET_CODE (in); const char *fmt = GET_RTX_FORMAT (code); int i, j; for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (loc == &in->u.fld[i].rt_rtx) return 1; if (fmt[i] == 'e') { if (loc_mentioned_in_p (loc, XEXP (in, i))) return 1; } else if (fmt[i] == 'E') for (j = XVECLEN (in, i) - 1; j >= 0; j--) if (loc_mentioned_in_p (loc, XVECEXP (in, i, j))) return 1; } return 0; } /* Helper function for subreg_lsb. Given a subreg's OUTER_MODE, INNER_MODE, and SUBREG_BYTE, return the bit offset where the subreg begins (counting from the least significant bit of the operand). */ unsigned int subreg_lsb_1 (enum machine_mode outer_mode, enum machine_mode inner_mode, unsigned int subreg_byte) { unsigned int bitpos; unsigned int byte; unsigned int word; /* A paradoxical subreg begins at bit position 0. */ if (GET_MODE_BITSIZE (outer_mode) > GET_MODE_BITSIZE (inner_mode)) return 0; if (WORDS_BIG_ENDIAN != BYTES_BIG_ENDIAN) /* If the subreg crosses a word boundary ensure that it also begins and ends on a word boundary. */ gcc_assert (!((subreg_byte % UNITS_PER_WORD + GET_MODE_SIZE (outer_mode)) > UNITS_PER_WORD && (subreg_byte % UNITS_PER_WORD || GET_MODE_SIZE (outer_mode) % UNITS_PER_WORD))); if (WORDS_BIG_ENDIAN) word = (GET_MODE_SIZE (inner_mode) - (subreg_byte + GET_MODE_SIZE (outer_mode))) / UNITS_PER_WORD; else word = subreg_byte / UNITS_PER_WORD; bitpos = word * BITS_PER_WORD; if (BYTES_BIG_ENDIAN) byte = (GET_MODE_SIZE (inner_mode) - (subreg_byte + GET_MODE_SIZE (outer_mode))) % UNITS_PER_WORD; else byte = subreg_byte % UNITS_PER_WORD; bitpos += byte * BITS_PER_UNIT; return bitpos; } /* Given a subreg X, return the bit offset where the subreg begins (counting from the least significant bit of the reg). */ unsigned int subreg_lsb (rtx x) { return subreg_lsb_1 (GET_MODE (x), GET_MODE (SUBREG_REG (x)), SUBREG_BYTE (x)); } /* This function returns the regno offset of a subreg expression. xregno - A regno of an inner hard subreg_reg (or what will become one). xmode - The mode of xregno. offset - The byte offset. ymode - The mode of a top level SUBREG (or what may become one). RETURN - The regno offset which would be used. */ unsigned int subreg_regno_offset (unsigned int xregno, enum machine_mode xmode, unsigned int offset, enum machine_mode ymode) { int nregs_xmode, nregs_ymode; int mode_multiple, nregs_multiple; int y_offset; gcc_assert (xregno < FIRST_PSEUDO_REGISTER); /* Adjust nregs_xmode to allow for 'holes'. */ if (HARD_REGNO_NREGS_HAS_PADDING (xregno, xmode)) nregs_xmode = HARD_REGNO_NREGS_WITH_PADDING (xregno, xmode); else nregs_xmode = hard_regno_nregs[xregno][xmode]; nregs_ymode = hard_regno_nregs[xregno][ymode]; /* If this is a big endian paradoxical subreg, which uses more actual hard registers than the original register, we must return a negative offset so that we find the proper highpart of the register. */ if (offset == 0 && nregs_ymode > nregs_xmode && (GET_MODE_SIZE (ymode) > UNITS_PER_WORD ? WORDS_BIG_ENDIAN : BYTES_BIG_ENDIAN)) return nregs_xmode - nregs_ymode; if (offset == 0 || nregs_xmode == nregs_ymode) return 0; /* Size of ymode must not be greater than the size of xmode. */ mode_multiple = GET_MODE_SIZE (xmode) / GET_MODE_SIZE (ymode); gcc_assert (mode_multiple != 0); y_offset = offset / GET_MODE_SIZE (ymode); nregs_multiple = nregs_xmode / nregs_ymode; return (y_offset / (mode_multiple / nregs_multiple)) * nregs_ymode; } /* This function returns true when the offset is representable via subreg_offset in the given regno. xregno - A regno of an inner hard subreg_reg (or what will become one). xmode - The mode of xregno. offset - The byte offset. ymode - The mode of a top level SUBREG (or what may become one). RETURN - Whether the offset is representable. */ bool subreg_offset_representable_p (unsigned int xregno, enum machine_mode xmode, unsigned int offset, enum machine_mode ymode) { int nregs_xmode, nregs_ymode; int mode_multiple, nregs_multiple; int y_offset; int regsize_xmode, regsize_ymode; gcc_assert (xregno < FIRST_PSEUDO_REGISTER); /* If there are holes in a non-scalar mode in registers, we expect that it is made up of its units concatenated together. */ if (HARD_REGNO_NREGS_HAS_PADDING (xregno, xmode)) { enum machine_mode xmode_unit; nregs_xmode = HARD_REGNO_NREGS_WITH_PADDING (xregno, xmode); if (GET_MODE_INNER (xmode) == VOIDmode) xmode_unit = xmode; else xmode_unit = GET_MODE_INNER (xmode); gcc_assert (HARD_REGNO_NREGS_HAS_PADDING (xregno, xmode_unit)); gcc_assert (nregs_xmode == (GET_MODE_NUNITS (xmode) * HARD_REGNO_NREGS_WITH_PADDING (xregno, xmode_unit))); gcc_assert (hard_regno_nregs[xregno][xmode] == (hard_regno_nregs[xregno][xmode_unit] * GET_MODE_NUNITS (xmode))); /* You can only ask for a SUBREG of a value with holes in the middle if you don't cross the holes. (Such a SUBREG should be done by picking a different register class, or doing it in memory if necessary.) An example of a value with holes is XCmode on 32-bit x86 with -m128bit-long-double; it's represented in 6 32-bit registers, 3 for each part, but in memory it's two 128-bit parts. Padding is assumed to be at the end (not necessarily the 'high part') of each unit. */ if ((offset / GET_MODE_SIZE (xmode_unit) + 1 < GET_MODE_NUNITS (xmode)) && (offset / GET_MODE_SIZE (xmode_unit) != ((offset + GET_MODE_SIZE (ymode) - 1) / GET_MODE_SIZE (xmode_unit)))) return false; } else nregs_xmode = hard_regno_nregs[xregno][xmode]; nregs_ymode = hard_regno_nregs[xregno][ymode]; /* Paradoxical subregs are otherwise valid. */ if (offset == 0 && nregs_ymode > nregs_xmode && (GET_MODE_SIZE (ymode) > UNITS_PER_WORD ? WORDS_BIG_ENDIAN : BYTES_BIG_ENDIAN)) return true; /* If registers store different numbers of bits in the different modes, we cannot generally form this subreg. */ regsize_xmode = GET_MODE_SIZE (xmode) / nregs_xmode; regsize_ymode = GET_MODE_SIZE (ymode) / nregs_ymode; if (regsize_xmode > regsize_ymode && nregs_ymode > 1) return false; if (regsize_ymode > regsize_xmode && nregs_xmode > 1) return false; /* Lowpart subregs are otherwise valid. */ if (offset == subreg_lowpart_offset (ymode, xmode)) return true; /* This should always pass, otherwise we don't know how to verify the constraint. These conditions may be relaxed but subreg_regno_offset would need to be redesigned. */ gcc_assert ((GET_MODE_SIZE (xmode) % GET_MODE_SIZE (ymode)) == 0); gcc_assert ((nregs_xmode % nregs_ymode) == 0); /* The XMODE value can be seen as a vector of NREGS_XMODE values. The subreg must represent a lowpart of given field. Compute what field it is. */ offset -= subreg_lowpart_offset (ymode, mode_for_size (GET_MODE_BITSIZE (xmode) / nregs_xmode, MODE_INT, 0)); /* Size of ymode must not be greater than the size of xmode. */ mode_multiple = GET_MODE_SIZE (xmode) / GET_MODE_SIZE (ymode); gcc_assert (mode_multiple != 0); y_offset = offset / GET_MODE_SIZE (ymode); nregs_multiple = nregs_xmode / nregs_ymode; gcc_assert ((offset % GET_MODE_SIZE (ymode)) == 0); gcc_assert ((mode_multiple % nregs_multiple) == 0); return (!(y_offset % (mode_multiple / nregs_multiple))); } /* Return the final regno that a subreg expression refers to. */ unsigned int subreg_regno (rtx x) { unsigned int ret; rtx subreg = SUBREG_REG (x); int regno = REGNO (subreg); ret = regno + subreg_regno_offset (regno, GET_MODE (subreg), SUBREG_BYTE (x), GET_MODE (x)); return ret; } struct parms_set_data { int nregs; HARD_REG_SET regs; }; /* Helper function for noticing stores to parameter registers. */ static void parms_set (rtx x, rtx pat ATTRIBUTE_UNUSED, void *data) { struct parms_set_data *d = data; if (REG_P (x) && REGNO (x) < FIRST_PSEUDO_REGISTER && TEST_HARD_REG_BIT (d->regs, REGNO (x))) { CLEAR_HARD_REG_BIT (d->regs, REGNO (x)); d->nregs--; } } /* Look backward for first parameter to be loaded. Note that loads of all parameters will not necessarily be found if CSE has eliminated some of them (e.g., an argument to the outer function is passed down as a parameter). Do not skip BOUNDARY. */ rtx find_first_parameter_load (rtx call_insn, rtx boundary) { struct parms_set_data parm; rtx p, before, first_set; /* Since different machines initialize their parameter registers in different orders, assume nothing. Collect the set of all parameter registers. */ CLEAR_HARD_REG_SET (parm.regs); parm.nregs = 0; for (p = CALL_INSN_FUNCTION_USAGE (call_insn); p; p = XEXP (p, 1)) if (GET_CODE (XEXP (p, 0)) == USE && REG_P (XEXP (XEXP (p, 0), 0))) { gcc_assert (REGNO (XEXP (XEXP (p, 0), 0)) < FIRST_PSEUDO_REGISTER); /* We only care about registers which can hold function arguments. */ if (!FUNCTION_ARG_REGNO_P (REGNO (XEXP (XEXP (p, 0), 0)))) continue; SET_HARD_REG_BIT (parm.regs, REGNO (XEXP (XEXP (p, 0), 0))); parm.nregs++; } before = call_insn; first_set = call_insn; /* Search backward for the first set of a register in this set. */ while (parm.nregs && before != boundary) { before = PREV_INSN (before); /* It is possible that some loads got CSEed from one call to another. Stop in that case. */ if (CALL_P (before)) break; /* Our caller needs either ensure that we will find all sets (in case code has not been optimized yet), or take care for possible labels in a way by setting boundary to preceding CODE_LABEL. */ if (LABEL_P (before)) { gcc_assert (before == boundary); break; } if (INSN_P (before)) { int nregs_old = parm.nregs; note_stores (PATTERN (before), parms_set, &parm); /* If we found something that did not set a parameter reg, we're done. Do not keep going, as that might result in hoisting an insn before the setting of a pseudo that is used by the hoisted insn. */ if (nregs_old != parm.nregs) first_set = before; else break; } } return first_set; } /* Return true if we should avoid inserting code between INSN and preceding call instruction. */ bool keep_with_call_p (rtx insn) { rtx set; if (INSN_P (insn) && (set = single_set (insn)) != NULL) { if (REG_P (SET_DEST (set)) && REGNO (SET_DEST (set)) < FIRST_PSEUDO_REGISTER && fixed_regs[REGNO (SET_DEST (set))] && general_operand (SET_SRC (set), VOIDmode)) return true; if (REG_P (SET_SRC (set)) && FUNCTION_VALUE_REGNO_P (REGNO (SET_SRC (set))) && REG_P (SET_DEST (set)) && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER) return true; /* There may be a stack pop just after the call and before the store of the return register. Search for the actual store when deciding if we can break or not. */ if (SET_DEST (set) == stack_pointer_rtx) { rtx i2 = next_nonnote_insn (insn); if (i2 && keep_with_call_p (i2)) return true; } } return false; } /* Return true if LABEL is a target of JUMP_INSN. This applies only to non-complex jumps. That is, direct unconditional, conditional, and tablejumps, but not computed jumps or returns. It also does not apply to the fallthru case of a conditional jump. */ bool label_is_jump_target_p (rtx label, rtx jump_insn) { rtx tmp = JUMP_LABEL (jump_insn); if (label == tmp) return true; if (tablejump_p (jump_insn, NULL, &tmp)) { rtvec vec = XVEC (PATTERN (tmp), GET_CODE (PATTERN (tmp)) == ADDR_DIFF_VEC); int i, veclen = GET_NUM_ELEM (vec); for (i = 0; i < veclen; ++i) if (XEXP (RTVEC_ELT (vec, i), 0) == label) return true; } return false; } /* Return an estimate of the cost of computing rtx X. One use is in cse, to decide which expression to keep in the hash table. Another is in rtl generation, to pick the cheapest way to multiply. Other uses like the latter are expected in the future. */ int rtx_cost (rtx x, enum rtx_code outer_code ATTRIBUTE_UNUSED) { int i, j; enum rtx_code code; const char *fmt; int total; if (x == 0) return 0; /* Compute the default costs of certain things. Note that targetm.rtx_costs can override the defaults. */ code = GET_CODE (x); switch (code) { case MULT: total = COSTS_N_INSNS (5); break; case DIV: case UDIV: case MOD: case UMOD: total = COSTS_N_INSNS (7); break; case USE: /* Used in combine.c as a marker. */ total = 0; break; default: total = COSTS_N_INSNS (1); } switch (code) { case REG: return 0; case SUBREG: total = 0; /* If we can't tie these modes, make this expensive. The larger the mode, the more expensive it is. */ if (! MODES_TIEABLE_P (GET_MODE (x), GET_MODE (SUBREG_REG (x)))) return COSTS_N_INSNS (2 + GET_MODE_SIZE (GET_MODE (x)) / UNITS_PER_WORD); break; default: if (targetm.rtx_costs (x, code, outer_code, &total)) return total; break; } /* Sum the costs of the sub-rtx's, plus cost of this operation, which is already in total. */ fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) if (fmt[i] == 'e') total += rtx_cost (XEXP (x, i), code); else if (fmt[i] == 'E') for (j = 0; j < XVECLEN (x, i); j++) total += rtx_cost (XVECEXP (x, i, j), code); return total; } /* Return cost of address expression X. Expect that X is properly formed address reference. */ int address_cost (rtx x, enum machine_mode mode) { /* We may be asked for cost of various unusual addresses, such as operands of push instruction. It is not worthwhile to complicate writing of the target hook by such cases. */ if (!memory_address_p (mode, x)) return 1000; return targetm.address_cost (x); } /* If the target doesn't override, compute the cost as with arithmetic. */ int default_address_cost (rtx x) { return rtx_cost (x, MEM); } unsigned HOST_WIDE_INT nonzero_bits (rtx x, enum machine_mode mode) { return cached_nonzero_bits (x, mode, NULL_RTX, VOIDmode, 0); } unsigned int num_sign_bit_copies (rtx x, enum machine_mode mode) { return cached_num_sign_bit_copies (x, mode, NULL_RTX, VOIDmode, 0); } /* The function cached_nonzero_bits is a wrapper around nonzero_bits1. It avoids exponential behavior in nonzero_bits1 when X has identical subexpressions on the first or the second level. */ static unsigned HOST_WIDE_INT cached_nonzero_bits (rtx x, enum machine_mode mode, rtx known_x, enum machine_mode known_mode, unsigned HOST_WIDE_INT known_ret) { if (x == known_x && mode == known_mode) return known_ret; /* Try to find identical subexpressions. If found call nonzero_bits1 on X with the subexpressions as KNOWN_X and the precomputed value for the subexpression as KNOWN_RET. */ if (ARITHMETIC_P (x)) { rtx x0 = XEXP (x, 0); rtx x1 = XEXP (x, 1); /* Check the first level. */ if (x0 == x1) return nonzero_bits1 (x, mode, x0, mode, cached_nonzero_bits (x0, mode, known_x, known_mode, known_ret)); /* Check the second level. */ if (ARITHMETIC_P (x0) && (x1 == XEXP (x0, 0) || x1 == XEXP (x0, 1))) return nonzero_bits1 (x, mode, x1, mode, cached_nonzero_bits (x1, mode, known_x, known_mode, known_ret)); if (ARITHMETIC_P (x1) && (x0 == XEXP (x1, 0) || x0 == XEXP (x1, 1))) return nonzero_bits1 (x, mode, x0, mode, cached_nonzero_bits (x0, mode, known_x, known_mode, known_ret)); } return nonzero_bits1 (x, mode, known_x, known_mode, known_ret); } /* We let num_sign_bit_copies recur into nonzero_bits as that is useful. We don't let nonzero_bits recur into num_sign_bit_copies, because that is less useful. We can't allow both, because that results in exponential run time recursion. There is a nullstone testcase that triggered this. This macro avoids accidental uses of num_sign_bit_copies. */ #define cached_num_sign_bit_copies sorry_i_am_preventing_exponential_behavior /* Given an expression, X, compute which bits in X can be nonzero. We don't care about bits outside of those defined in MODE. For most X this is simply GET_MODE_MASK (GET_MODE (MODE)), but if X is an arithmetic operation, we can do better. */ static unsigned HOST_WIDE_INT nonzero_bits1 (rtx x, enum machine_mode mode, rtx known_x, enum machine_mode known_mode, unsigned HOST_WIDE_INT known_ret) { unsigned HOST_WIDE_INT nonzero = GET_MODE_MASK (mode); unsigned HOST_WIDE_INT inner_nz; enum rtx_code code; unsigned int mode_width = GET_MODE_BITSIZE (mode); /* For floating-point values, assume all bits are needed. */ if (FLOAT_MODE_P (GET_MODE (x)) || FLOAT_MODE_P (mode)) return nonzero; /* If X is wider than MODE, use its mode instead. */ if (GET_MODE_BITSIZE (GET_MODE (x)) > mode_width) { mode = GET_MODE (x); nonzero = GET_MODE_MASK (mode); mode_width = GET_MODE_BITSIZE (mode); } if (mode_width > HOST_BITS_PER_WIDE_INT) /* Our only callers in this case look for single bit values. So just return the mode mask. Those tests will then be false. */ return nonzero; #ifndef WORD_REGISTER_OPERATIONS /* If MODE is wider than X, but both are a single word for both the host and target machines, we can compute this from which bits of the object might be nonzero in its own mode, taking into account the fact that on many CISC machines, accessing an object in a wider mode causes the high-order bits to become undefined. So they are not known to be zero. */ if (GET_MODE (x) != VOIDmode && GET_MODE (x) != mode && GET_MODE_BITSIZE (GET_MODE (x)) <= BITS_PER_WORD && GET_MODE_BITSIZE (GET_MODE (x)) <= HOST_BITS_PER_WIDE_INT && GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (GET_MODE (x))) { nonzero &= cached_nonzero_bits (x, GET_MODE (x), known_x, known_mode, known_ret); nonzero |= GET_MODE_MASK (mode) & ~GET_MODE_MASK (GET_MODE (x)); return nonzero; } #endif code = GET_CODE (x); switch (code) { case REG: #if defined(POINTERS_EXTEND_UNSIGNED) && !defined(HAVE_ptr_extend) /* If pointers extend unsigned and this is a pointer in Pmode, say that all the bits above ptr_mode are known to be zero. */ if (POINTERS_EXTEND_UNSIGNED && GET_MODE (x) == Pmode && REG_POINTER (x)) nonzero &= GET_MODE_MASK (ptr_mode); #endif /* Include declared information about alignment of pointers. */ /* ??? We don't properly preserve REG_POINTER changes across pointer-to-integer casts, so we can't trust it except for things that we know must be pointers. See execute/960116-1.c. */ if ((x == stack_pointer_rtx || x == frame_pointer_rtx || x == arg_pointer_rtx) && REGNO_POINTER_ALIGN (REGNO (x))) { unsigned HOST_WIDE_INT alignment = REGNO_POINTER_ALIGN (REGNO (x)) / BITS_PER_UNIT; #ifdef PUSH_ROUNDING /* If PUSH_ROUNDING is defined, it is possible for the stack to be momentarily aligned only to that amount, so we pick the least alignment. */ if (x == stack_pointer_rtx && PUSH_ARGS) alignment = MIN ((unsigned HOST_WIDE_INT) PUSH_ROUNDING (1), alignment); #endif nonzero &= ~(alignment - 1); } { unsigned HOST_WIDE_INT nonzero_for_hook = nonzero; rtx new = rtl_hooks.reg_nonzero_bits (x, mode, known_x, known_mode, known_ret, &nonzero_for_hook); if (new) nonzero_for_hook &= cached_nonzero_bits (new, mode, known_x, known_mode, known_ret); return nonzero_for_hook; } case CONST_INT: #ifdef SHORT_IMMEDIATES_SIGN_EXTEND /* If X is negative in MODE, sign-extend the value. */ if (INTVAL (x) > 0 && mode_width < BITS_PER_WORD && 0 != (INTVAL (x) & ((HOST_WIDE_INT) 1 << (mode_width - 1)))) return (INTVAL (x) | ((HOST_WIDE_INT) (-1) << mode_width)); #endif return INTVAL (x); case MEM: #ifdef LOAD_EXTEND_OP /* In many, if not most, RISC machines, reading a byte from memory zeros the rest of the register. Noticing that fact saves a lot of extra zero-extends. */ if (LOAD_EXTEND_OP (GET_MODE (x)) == ZERO_EXTEND) nonzero &= GET_MODE_MASK (GET_MODE (x)); #endif break; case EQ: case NE: case UNEQ: case LTGT: case GT: case GTU: case UNGT: case LT: case LTU: case UNLT: case GE: case GEU: case UNGE: case LE: case LEU: case UNLE: case UNORDERED: case ORDERED: /* If this produces an integer result, we know which bits are set. Code here used to clear bits outside the mode of X, but that is now done above. */ /* Mind that MODE is the mode the caller wants to look at this operation in, and not the actual operation mode. We can wind up with (subreg:DI (gt:V4HI x y)), and we don't have anything that describes the results of a vector compare. */ if (GET_MODE_CLASS (GET_MODE (x)) == MODE_INT && mode_width <= HOST_BITS_PER_WIDE_INT) nonzero = STORE_FLAG_VALUE; break; case NEG: #if 0 /* Disabled to avoid exponential mutual recursion between nonzero_bits and num_sign_bit_copies. */ if (num_sign_bit_copies (XEXP (x, 0), GET_MODE (x)) == GET_MODE_BITSIZE (GET_MODE (x))) nonzero = 1; #endif if (GET_MODE_SIZE (GET_MODE (x)) < mode_width) nonzero |= (GET_MODE_MASK (mode) & ~GET_MODE_MASK (GET_MODE (x))); break; case ABS: #if 0 /* Disabled to avoid exponential mutual recursion between nonzero_bits and num_sign_bit_copies. */ if (num_sign_bit_copies (XEXP (x, 0), GET_MODE (x)) == GET_MODE_BITSIZE (GET_MODE (x))) nonzero = 1; #endif break; case TRUNCATE: nonzero &= (cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret) & GET_MODE_MASK (mode)); break; case ZERO_EXTEND: nonzero &= cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret); if (GET_MODE (XEXP (x, 0)) != VOIDmode) nonzero &= GET_MODE_MASK (GET_MODE (XEXP (x, 0))); break; case SIGN_EXTEND: /* If the sign bit is known clear, this is the same as ZERO_EXTEND. Otherwise, show all the bits in the outer mode but not the inner may be nonzero. */ inner_nz = cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret); if (GET_MODE (XEXP (x, 0)) != VOIDmode) { inner_nz &= GET_MODE_MASK (GET_MODE (XEXP (x, 0))); if (inner_nz & (((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) - 1)))) inner_nz |= (GET_MODE_MASK (mode) & ~GET_MODE_MASK (GET_MODE (XEXP (x, 0)))); } nonzero &= inner_nz; break; case AND: nonzero &= cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret) & cached_nonzero_bits (XEXP (x, 1), mode, known_x, known_mode, known_ret); break; case XOR: case IOR: case UMIN: case UMAX: case SMIN: case SMAX: { unsigned HOST_WIDE_INT nonzero0 = cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret); /* Don't call nonzero_bits for the second time if it cannot change anything. */ if ((nonzero & nonzero0) != nonzero) nonzero &= nonzero0 | cached_nonzero_bits (XEXP (x, 1), mode, known_x, known_mode, known_ret); } break; case PLUS: case MINUS: case MULT: case DIV: case UDIV: case MOD: case UMOD: /* We can apply the rules of arithmetic to compute the number of high- and low-order zero bits of these operations. We start by computing the width (position of the highest-order nonzero bit) and the number of low-order zero bits for each value. */ { unsigned HOST_WIDE_INT nz0 = cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret); unsigned HOST_WIDE_INT nz1 = cached_nonzero_bits (XEXP (x, 1), mode, known_x, known_mode, known_ret); int sign_index = GET_MODE_BITSIZE (GET_MODE (x)) - 1; int width0 = floor_log2 (nz0) + 1; int width1 = floor_log2 (nz1) + 1; int low0 = floor_log2 (nz0 & -nz0); int low1 = floor_log2 (nz1 & -nz1); HOST_WIDE_INT op0_maybe_minusp = (nz0 & ((HOST_WIDE_INT) 1 << sign_index)); HOST_WIDE_INT op1_maybe_minusp = (nz1 & ((HOST_WIDE_INT) 1 << sign_index)); unsigned int result_width = mode_width; int result_low = 0; switch (code) { case PLUS: result_width = MAX (width0, width1) + 1; result_low = MIN (low0, low1); break; case MINUS: result_low = MIN (low0, low1); break; case MULT: result_width = width0 + width1; result_low = low0 + low1; break; case DIV: if (width1 == 0) break; if (! op0_maybe_minusp && ! op1_maybe_minusp) result_width = width0; break; case UDIV: if (width1 == 0) break; result_width = width0; break; case MOD: if (width1 == 0) break; if (! op0_maybe_minusp && ! op1_maybe_minusp) result_width = MIN (width0, width1); result_low = MIN (low0, low1); break; case UMOD: if (width1 == 0) break; result_width = MIN (width0, width1); result_low = MIN (low0, low1); break; default: gcc_unreachable (); } if (result_width < mode_width) nonzero &= ((HOST_WIDE_INT) 1 << result_width) - 1; if (result_low > 0) nonzero &= ~(((HOST_WIDE_INT) 1 << result_low) - 1); #ifdef POINTERS_EXTEND_UNSIGNED /* If pointers extend unsigned and this is an addition or subtraction to a pointer in Pmode, all the bits above ptr_mode are known to be zero. */ if (POINTERS_EXTEND_UNSIGNED > 0 && GET_MODE (x) == Pmode && (code == PLUS || code == MINUS) && REG_P (XEXP (x, 0)) && REG_POINTER (XEXP (x, 0))) nonzero &= GET_MODE_MASK (ptr_mode); #endif } break; case ZERO_EXTRACT: if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT) nonzero &= ((HOST_WIDE_INT) 1 << INTVAL (XEXP (x, 1))) - 1; break; case SUBREG: /* If this is a SUBREG formed for a promoted variable that has been zero-extended, we know that at least the high-order bits are zero, though others might be too. */ if (SUBREG_PROMOTED_VAR_P (x) && SUBREG_PROMOTED_UNSIGNED_P (x) > 0) nonzero = GET_MODE_MASK (GET_MODE (x)) & cached_nonzero_bits (SUBREG_REG (x), GET_MODE (x), known_x, known_mode, known_ret); /* If the inner mode is a single word for both the host and target machines, we can compute this from which bits of the inner object might be nonzero. */ if (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))) <= BITS_PER_WORD && (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))) <= HOST_BITS_PER_WIDE_INT)) { nonzero &= cached_nonzero_bits (SUBREG_REG (x), mode, known_x, known_mode, known_ret); #if defined (WORD_REGISTER_OPERATIONS) && defined (LOAD_EXTEND_OP) /* If this is a typical RISC machine, we only have to worry about the way loads are extended. */ if ((LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (x))) == SIGN_EXTEND ? (((nonzero & (((unsigned HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))) - 1)))) != 0)) : LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (x))) != ZERO_EXTEND) || !MEM_P (SUBREG_REG (x))) #endif { /* On many CISC machines, accessing an object in a wider mode causes the high-order bits to become undefined. So they are not known to be zero. */ if (GET_MODE_SIZE (GET_MODE (x)) > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x)))) nonzero |= (GET_MODE_MASK (GET_MODE (x)) & ~GET_MODE_MASK (GET_MODE (SUBREG_REG (x)))); } } break; case ASHIFTRT: case LSHIFTRT: case ASHIFT: case ROTATE: /* The nonzero bits are in two classes: any bits within MODE that aren't in GET_MODE (x) are always significant. The rest of the nonzero bits are those that are significant in the operand of the shift when shifted the appropriate number of bits. This shows that high-order bits are cleared by the right shift and low-order bits by left shifts. */ if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) >= 0 && INTVAL (XEXP (x, 1)) < HOST_BITS_PER_WIDE_INT) { enum machine_mode inner_mode = GET_MODE (x); unsigned int width = GET_MODE_BITSIZE (inner_mode); int count = INTVAL (XEXP (x, 1)); unsigned HOST_WIDE_INT mode_mask = GET_MODE_MASK (inner_mode); unsigned HOST_WIDE_INT op_nonzero = cached_nonzero_bits (XEXP (x, 0), mode, known_x, known_mode, known_ret); unsigned HOST_WIDE_INT inner = op_nonzero & mode_mask; unsigned HOST_WIDE_INT outer = 0; if (mode_width > width) outer = (op_nonzero & nonzero & ~mode_mask); if (code == LSHIFTRT) inner >>= count; else if (code == ASHIFTRT) { inner >>= count; /* If the sign bit may have been nonzero before the shift, we need to mark all the places it could have been copied to by the shift as possibly nonzero. */ if (inner & ((HOST_WIDE_INT) 1 << (width - 1 - count))) inner |= (((HOST_WIDE_INT) 1 << count) - 1) << (width - count); } else if (code == ASHIFT) inner <<= count; else inner = ((inner << (count % width) | (inner >> (width - (count % width)))) & mode_mask); nonzero &= (outer | inner); } break; case FFS: case POPCOUNT: /* This is at most the number of bits in the mode. */ nonzero = ((HOST_WIDE_INT) 2 << (floor_log2 (mode_width))) - 1; break; case CLZ: /* If CLZ has a known value at zero, then the nonzero bits are that value, plus the number of bits in the mode minus one. */ if (CLZ_DEFINED_VALUE_AT_ZERO (mode, nonzero)) nonzero |= ((HOST_WIDE_INT) 1 << (floor_log2 (mode_width))) - 1; else nonzero = -1; break; case CTZ: /* If CTZ has a known value at zero, then the nonzero bits are that value, plus the number of bits in the mode minus one. */ if (CTZ_DEFINED_VALUE_AT_ZERO (mode, nonzero)) nonzero |= ((HOST_WIDE_INT) 1 << (floor_log2 (mode_width))) - 1; else nonzero = -1; break; case PARITY: nonzero = 1; break; case IF_THEN_ELSE: { unsigned HOST_WIDE_INT nonzero_true = cached_nonzero_bits (XEXP (x, 1), mode, known_x, known_mode, known_ret); /* Don't call nonzero_bits for the second time if it cannot change anything. */ if ((nonzero & nonzero_true) != nonzero) nonzero &= nonzero_true | cached_nonzero_bits (XEXP (x, 2), mode, known_x, known_mode, known_ret); } break; default: break; } return nonzero; } /* See the macro definition above. */ #undef cached_num_sign_bit_copies /* The function cached_num_sign_bit_copies is a wrapper around num_sign_bit_copies1. It avoids exponential behavior in num_sign_bit_copies1 when X has identical subexpressions on the first or the second level. */ static unsigned int cached_num_sign_bit_copies (rtx x, enum machine_mode mode, rtx known_x, enum machine_mode known_mode, unsigned int known_ret) { if (x == known_x && mode == known_mode) return known_ret; /* Try to find identical subexpressions. If found call num_sign_bit_copies1 on X with the subexpressions as KNOWN_X and the precomputed value for the subexpression as KNOWN_RET. */ if (ARITHMETIC_P (x)) { rtx x0 = XEXP (x, 0); rtx x1 = XEXP (x, 1); /* Check the first level. */ if (x0 == x1) return num_sign_bit_copies1 (x, mode, x0, mode, cached_num_sign_bit_copies (x0, mode, known_x, known_mode, known_ret)); /* Check the second level. */ if (ARITHMETIC_P (x0) && (x1 == XEXP (x0, 0) || x1 == XEXP (x0, 1))) return num_sign_bit_copies1 (x, mode, x1, mode, cached_num_sign_bit_copies (x1, mode, known_x, known_mode, known_ret)); if (ARITHMETIC_P (x1) && (x0 == XEXP (x1, 0) || x0 == XEXP (x1, 1))) return num_sign_bit_copies1 (x, mode, x0, mode, cached_num_sign_bit_copies (x0, mode, known_x, known_mode, known_ret)); } return num_sign_bit_copies1 (x, mode, known_x, known_mode, known_ret); } /* Return the number of bits at the high-order end of X that are known to be equal to the sign bit. X will be used in mode MODE; if MODE is VOIDmode, X will be used in its own mode. The returned value will always be between 1 and the number of bits in MODE. */ static unsigned int num_sign_bit_copies1 (rtx x, enum machine_mode mode, rtx known_x, enum machine_mode known_mode, unsigned int known_ret) { enum rtx_code code = GET_CODE (x); unsigned int bitwidth = GET_MODE_BITSIZE (mode); int num0, num1, result; unsigned HOST_WIDE_INT nonzero; /* If we weren't given a mode, use the mode of X. If the mode is still VOIDmode, we don't know anything. Likewise if one of the modes is floating-point. */ if (mode == VOIDmode) mode = GET_MODE (x); if (mode == VOIDmode || FLOAT_MODE_P (mode) || FLOAT_MODE_P (GET_MODE (x))) return 1; /* For a smaller object, just ignore the high bits. */ if (bitwidth < GET_MODE_BITSIZE (GET_MODE (x))) { num0 = cached_num_sign_bit_copies (x, GET_MODE (x), known_x, known_mode, known_ret); return MAX (1, num0 - (int) (GET_MODE_BITSIZE (GET_MODE (x)) - bitwidth)); } if (GET_MODE (x) != VOIDmode && bitwidth > GET_MODE_BITSIZE (GET_MODE (x))) { #ifndef WORD_REGISTER_OPERATIONS /* If this machine does not do all register operations on the entire register and MODE is wider than the mode of X, we can say nothing at all about the high-order bits. */ return 1; #else /* Likewise on machines that do, if the mode of the object is smaller than a word and loads of that size don't sign extend, we can say nothing about the high order bits. */ if (GET_MODE_BITSIZE (GET_MODE (x)) < BITS_PER_WORD #ifdef LOAD_EXTEND_OP && LOAD_EXTEND_OP (GET_MODE (x)) != SIGN_EXTEND #endif ) return 1; #endif } switch (code) { case REG: #if defined(POINTERS_EXTEND_UNSIGNED) && !defined(HAVE_ptr_extend) /* If pointers extend signed and this is a pointer in Pmode, say that all the bits above ptr_mode are known to be sign bit copies. */ if (! POINTERS_EXTEND_UNSIGNED && GET_MODE (x) == Pmode && mode == Pmode && REG_POINTER (x)) return GET_MODE_BITSIZE (Pmode) - GET_MODE_BITSIZE (ptr_mode) + 1; #endif { unsigned int copies_for_hook = 1, copies = 1; rtx new = rtl_hooks.reg_num_sign_bit_copies (x, mode, known_x, known_mode, known_ret, &copies_for_hook); if (new) copies = cached_num_sign_bit_copies (new, mode, known_x, known_mode, known_ret); if (copies > 1 || copies_for_hook > 1) return MAX (copies, copies_for_hook); /* Else, use nonzero_bits to guess num_sign_bit_copies (see below). */ } break; case MEM: #ifdef LOAD_EXTEND_OP /* Some RISC machines sign-extend all loads of smaller than a word. */ if (LOAD_EXTEND_OP (GET_MODE (x)) == SIGN_EXTEND) return MAX (1, ((int) bitwidth - (int) GET_MODE_BITSIZE (GET_MODE (x)) + 1)); #endif break; case CONST_INT: /* If the constant is negative, take its 1's complement and remask. Then see how many zero bits we have. */ nonzero = INTVAL (x) & GET_MODE_MASK (mode); if (bitwidth <= HOST_BITS_PER_WIDE_INT && (nonzero & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0) nonzero = (~nonzero) & GET_MODE_MASK (mode); return (nonzero == 0 ? bitwidth : bitwidth - floor_log2 (nonzero) - 1); case SUBREG: /* If this is a SUBREG for a promoted object that is sign-extended and we are looking at it in a wider mode, we know that at least the high-order bits are known to be sign bit copies. */ if (SUBREG_PROMOTED_VAR_P (x) && ! SUBREG_PROMOTED_UNSIGNED_P (x)) { num0 = cached_num_sign_bit_copies (SUBREG_REG (x), mode, known_x, known_mode, known_ret); return MAX ((int) bitwidth - (int) GET_MODE_BITSIZE (GET_MODE (x)) + 1, num0); } /* For a smaller object, just ignore the high bits. */ if (bitwidth <= GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x)))) { num0 = cached_num_sign_bit_copies (SUBREG_REG (x), VOIDmode, known_x, known_mode, known_ret); return MAX (1, (num0 - (int) (GET_MODE_BITSIZE (GET_MODE (SUBREG_REG (x))) - bitwidth))); } #ifdef WORD_REGISTER_OPERATIONS #ifdef LOAD_EXTEND_OP /* For paradoxical SUBREGs on machines where all register operations affect the entire register, just look inside. Note that we are passing MODE to the recursive call, so the number of sign bit copies will remain relative to that mode, not the inner mode. */ /* This works only if loads sign extend. Otherwise, if we get a reload for the inner part, it may be loaded from the stack, and then we lose all sign bit copies that existed before the store to the stack. */ if ((GET_MODE_SIZE (GET_MODE (x)) > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x)))) && LOAD_EXTEND_OP (GET_MODE (SUBREG_REG (x))) == SIGN_EXTEND && MEM_P (SUBREG_REG (x))) return cached_num_sign_bit_copies (SUBREG_REG (x), mode, known_x, known_mode, known_ret); #endif #endif break; case SIGN_EXTRACT: if (GET_CODE (XEXP (x, 1)) == CONST_INT) return MAX (1, (int) bitwidth - INTVAL (XEXP (x, 1))); break; case SIGN_EXTEND: return (bitwidth - GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) + cached_num_sign_bit_copies (XEXP (x, 0), VOIDmode, known_x, known_mode, known_ret)); case TRUNCATE: /* For a smaller object, just ignore the high bits. */ num0 = cached_num_sign_bit_copies (XEXP (x, 0), VOIDmode, known_x, known_mode, known_ret); return MAX (1, (num0 - (int) (GET_MODE_BITSIZE (GET_MODE (XEXP (x, 0))) - bitwidth))); case NOT: return cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); case ROTATE: case ROTATERT: /* If we are rotating left by a number of bits less than the number of sign bit copies, we can just subtract that amount from the number. */ if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) >= 0 && INTVAL (XEXP (x, 1)) < (int) bitwidth) { num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); return MAX (1, num0 - (code == ROTATE ? INTVAL (XEXP (x, 1)) : (int) bitwidth - INTVAL (XEXP (x, 1)))); } break; case NEG: /* In general, this subtracts one sign bit copy. But if the value is known to be positive, the number of sign bit copies is the same as that of the input. Finally, if the input has just one bit that might be nonzero, all the bits are copies of the sign bit. */ num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); if (bitwidth > HOST_BITS_PER_WIDE_INT) return num0 > 1 ? num0 - 1 : 1; nonzero = nonzero_bits (XEXP (x, 0), mode); if (nonzero == 1) return bitwidth; if (num0 > 1 && (((HOST_WIDE_INT) 1 << (bitwidth - 1)) & nonzero)) num0--; return num0; case IOR: case AND: case XOR: case SMIN: case SMAX: case UMIN: case UMAX: /* Logical operations will preserve the number of sign-bit copies. MIN and MAX operations always return one of the operands. */ num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); num1 = cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); return MIN (num0, num1); case PLUS: case MINUS: /* For addition and subtraction, we can have a 1-bit carry. However, if we are subtracting 1 from a positive number, there will not be such a carry. Furthermore, if the positive number is known to be 0 or 1, we know the result is either -1 or 0. */ if (code == PLUS && XEXP (x, 1) == constm1_rtx && bitwidth <= HOST_BITS_PER_WIDE_INT) { nonzero = nonzero_bits (XEXP (x, 0), mode); if ((((HOST_WIDE_INT) 1 << (bitwidth - 1)) & nonzero) == 0) return (nonzero == 1 || nonzero == 0 ? bitwidth : bitwidth - floor_log2 (nonzero) - 1); } num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); num1 = cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); result = MAX (1, MIN (num0, num1) - 1); #ifdef POINTERS_EXTEND_UNSIGNED /* If pointers extend signed and this is an addition or subtraction to a pointer in Pmode, all the bits above ptr_mode are known to be sign bit copies. */ if (! POINTERS_EXTEND_UNSIGNED && GET_MODE (x) == Pmode && (code == PLUS || code == MINUS) && REG_P (XEXP (x, 0)) && REG_POINTER (XEXP (x, 0))) result = MAX ((int) (GET_MODE_BITSIZE (Pmode) - GET_MODE_BITSIZE (ptr_mode) + 1), result); #endif return result; case MULT: /* The number of bits of the product is the sum of the number of bits of both terms. However, unless one of the terms if known to be positive, we must allow for an additional bit since negating a negative number can remove one sign bit copy. */ num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); num1 = cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); result = bitwidth - (bitwidth - num0) - (bitwidth - num1); if (result > 0 && (bitwidth > HOST_BITS_PER_WIDE_INT || (((nonzero_bits (XEXP (x, 0), mode) & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0) && ((nonzero_bits (XEXP (x, 1), mode) & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)))) result--; return MAX (1, result); case UDIV: /* The result must be <= the first operand. If the first operand has the high bit set, we know nothing about the number of sign bit copies. */ if (bitwidth > HOST_BITS_PER_WIDE_INT) return 1; else if ((nonzero_bits (XEXP (x, 0), mode) & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0) return 1; else return cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); case UMOD: /* The result must be <= the second operand. */ return cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); case DIV: /* Similar to unsigned division, except that we have to worry about the case where the divisor is negative, in which case we have to add 1. */ result = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); if (result > 1 && (bitwidth > HOST_BITS_PER_WIDE_INT || (nonzero_bits (XEXP (x, 1), mode) & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)) result--; return result; case MOD: result = cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); if (result > 1 && (bitwidth > HOST_BITS_PER_WIDE_INT || (nonzero_bits (XEXP (x, 1), mode) & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0)) result--; return result; case ASHIFTRT: /* Shifts by a constant add to the number of bits equal to the sign bit. */ num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); if (GET_CODE (XEXP (x, 1)) == CONST_INT && INTVAL (XEXP (x, 1)) > 0) num0 = MIN ((int) bitwidth, num0 + INTVAL (XEXP (x, 1))); return num0; case ASHIFT: /* Left shifts destroy copies. */ if (GET_CODE (XEXP (x, 1)) != CONST_INT || INTVAL (XEXP (x, 1)) < 0 || INTVAL (XEXP (x, 1)) >= (int) bitwidth) return 1; num0 = cached_num_sign_bit_copies (XEXP (x, 0), mode, known_x, known_mode, known_ret); return MAX (1, num0 - INTVAL (XEXP (x, 1))); case IF_THEN_ELSE: num0 = cached_num_sign_bit_copies (XEXP (x, 1), mode, known_x, known_mode, known_ret); num1 = cached_num_sign_bit_copies (XEXP (x, 2), mode, known_x, known_mode, known_ret); return MIN (num0, num1); case EQ: case NE: case GE: case GT: case LE: case LT: case UNEQ: case LTGT: case UNGE: case UNGT: case UNLE: case UNLT: case GEU: case GTU: case LEU: case LTU: case UNORDERED: case ORDERED: /* If the constant is negative, take its 1's complement and remask. Then see how many zero bits we have. */ nonzero = STORE_FLAG_VALUE; if (bitwidth <= HOST_BITS_PER_WIDE_INT && (nonzero & ((HOST_WIDE_INT) 1 << (bitwidth - 1))) != 0) nonzero = (~nonzero) & GET_MODE_MASK (mode); return (nonzero == 0 ? bitwidth : bitwidth - floor_log2 (nonzero) - 1); default: break; } /* If we haven't been able to figure it out by one of the above rules, see if some of the high-order bits are known to be zero. If so, count those bits and return one less than that amount. If we can't safely compute the mask for this mode, always return BITWIDTH. */ bitwidth = GET_MODE_BITSIZE (mode); if (bitwidth > HOST_BITS_PER_WIDE_INT) return 1; nonzero = nonzero_bits (x, mode); return nonzero & ((HOST_WIDE_INT) 1 << (bitwidth - 1)) ? 1 : bitwidth - floor_log2 (nonzero) - 1; } /* Calculate the rtx_cost of a single instruction. A return value of zero indicates an instruction pattern without a known cost. */ int insn_rtx_cost (rtx pat) { int i, cost; rtx set; /* Extract the single set rtx from the instruction pattern. We can't use single_set since we only have the pattern. */ if (GET_CODE (pat) == SET) set = pat; else if (GET_CODE (pat) == PARALLEL) { set = NULL_RTX; for (i = 0; i < XVECLEN (pat, 0); i++) { rtx x = XVECEXP (pat, 0, i); if (GET_CODE (x) == SET) { if (set) return 0; set = x; } } if (!set) return 0; } else return 0; cost = rtx_cost (SET_SRC (set), SET); return cost > 0 ? cost : COSTS_N_INSNS (1); } /* Given an insn INSN and condition COND, return the condition in a canonical form to simplify testing by callers. Specifically: (1) The code will always be a comparison operation (EQ, NE, GT, etc.). (2) Both operands will be machine operands; (cc0) will have been replaced. (3) If an operand is a constant, it will be the second operand. (4) (LE x const) will be replaced with (LT x ) and similarly for GE, GEU, and LEU. If the condition cannot be understood, or is an inequality floating-point comparison which needs to be reversed, 0 will be returned. If REVERSE is nonzero, then reverse the condition prior to canonizing it. If EARLIEST is nonzero, it is a pointer to a place where the earliest insn used in locating the condition was found. If a replacement test of the condition is desired, it should be placed in front of that insn and we will be sure that the inputs are still valid. If WANT_REG is nonzero, we wish the condition to be relative to that register, if possible. Therefore, do not canonicalize the condition further. If ALLOW_CC_MODE is nonzero, allow the condition returned to be a compare to a CC mode register. If VALID_AT_INSN_P, the condition must be valid at both *EARLIEST and at INSN. */ rtx canonicalize_condition (rtx insn, rtx cond, int reverse, rtx *earliest, rtx want_reg, int allow_cc_mode, int valid_at_insn_p) { enum rtx_code code; rtx prev = insn; rtx set; rtx tem; rtx op0, op1; int reverse_code = 0; enum machine_mode mode; basic_block bb = BLOCK_FOR_INSN (insn); code = GET_CODE (cond); mode = GET_MODE (cond); op0 = XEXP (cond, 0); op1 = XEXP (cond, 1); if (reverse) code = reversed_comparison_code (cond, insn); if (code == UNKNOWN) return 0; if (earliest) *earliest = insn; /* If we are comparing a register with zero, see if the register is set in the previous insn to a COMPARE or a comparison operation. Perform the same tests as a function of STORE_FLAG_VALUE as find_comparison_args in cse.c */ while ((GET_RTX_CLASS (code) == RTX_COMPARE || GET_RTX_CLASS (code) == RTX_COMM_COMPARE) && op1 == CONST0_RTX (GET_MODE (op0)) && op0 != want_reg) { /* Set nonzero when we find something of interest. */ rtx x = 0; #ifdef HAVE_cc0 /* If comparison with cc0, import actual comparison from compare insn. */ if (op0 == cc0_rtx) { if ((prev = prev_nonnote_insn (prev)) == 0 || !NONJUMP_INSN_P (prev) || (set = single_set (prev)) == 0 || SET_DEST (set) != cc0_rtx) return 0; op0 = SET_SRC (set); op1 = CONST0_RTX (GET_MODE (op0)); if (earliest) *earliest = prev; } #endif /* If this is a COMPARE, pick up the two things being compared. */ if (GET_CODE (op0) == COMPARE) { op1 = XEXP (op0, 1); op0 = XEXP (op0, 0); continue; } else if (!REG_P (op0)) break; /* Go back to the previous insn. Stop if it is not an INSN. We also stop if it isn't a single set or if it has a REG_INC note because we don't want to bother dealing with it. */ if ((prev = prev_nonnote_insn (prev)) == 0 || !NONJUMP_INSN_P (prev) || FIND_REG_INC_NOTE (prev, NULL_RTX) /* In cfglayout mode, there do not have to be labels at the beginning of a block, or jumps at the end, so the previous conditions would not stop us when we reach bb boundary. */ || BLOCK_FOR_INSN (prev) != bb) break; set = set_of (op0, prev); if (set && (GET_CODE (set) != SET || !rtx_equal_p (SET_DEST (set), op0))) break; /* If this is setting OP0, get what it sets it to if it looks relevant. */ if (set) { enum machine_mode inner_mode = GET_MODE (SET_DEST (set)); #ifdef FLOAT_STORE_FLAG_VALUE REAL_VALUE_TYPE fsfv; #endif /* ??? We may not combine comparisons done in a CCmode with comparisons not done in a CCmode. This is to aid targets like Alpha that have an IEEE compliant EQ instruction, and a non-IEEE compliant BEQ instruction. The use of CCmode is actually artificial, simply to prevent the combination, but should not affect other platforms. However, we must allow VOIDmode comparisons to match either CCmode or non-CCmode comparison, because some ports have modeless comparisons inside branch patterns. ??? This mode check should perhaps look more like the mode check in simplify_comparison in combine. */ if ((GET_CODE (SET_SRC (set)) == COMPARE || (((code == NE || (code == LT && GET_MODE_CLASS (inner_mode) == MODE_INT && (GET_MODE_BITSIZE (inner_mode) <= HOST_BITS_PER_WIDE_INT) && (STORE_FLAG_VALUE & ((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (inner_mode) - 1)))) #ifdef FLOAT_STORE_FLAG_VALUE || (code == LT && SCALAR_FLOAT_MODE_P (inner_mode) && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode), REAL_VALUE_NEGATIVE (fsfv))) #endif )) && COMPARISON_P (SET_SRC (set)))) && (((GET_MODE_CLASS (mode) == MODE_CC) == (GET_MODE_CLASS (inner_mode) == MODE_CC)) || mode == VOIDmode || inner_mode == VOIDmode)) x = SET_SRC (set); else if (((code == EQ || (code == GE && (GET_MODE_BITSIZE (inner_mode) <= HOST_BITS_PER_WIDE_INT) && GET_MODE_CLASS (inner_mode) == MODE_INT && (STORE_FLAG_VALUE & ((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (inner_mode) - 1)))) #ifdef FLOAT_STORE_FLAG_VALUE || (code == GE && SCALAR_FLOAT_MODE_P (inner_mode) && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode), REAL_VALUE_NEGATIVE (fsfv))) #endif )) && COMPARISON_P (SET_SRC (set)) && (((GET_MODE_CLASS (mode) == MODE_CC) == (GET_MODE_CLASS (inner_mode) == MODE_CC)) || mode == VOIDmode || inner_mode == VOIDmode)) { reverse_code = 1; x = SET_SRC (set); } else break; } else if (reg_set_p (op0, prev)) /* If this sets OP0, but not directly, we have to give up. */ break; if (x) { /* If the caller is expecting the condition to be valid at INSN, make sure X doesn't change before INSN. */ if (valid_at_insn_p) if (modified_in_p (x, prev) || modified_between_p (x, prev, insn)) break; if (COMPARISON_P (x)) code = GET_CODE (x); if (reverse_code) { code = reversed_comparison_code (x, prev); if (code == UNKNOWN) return 0; reverse_code = 0; } op0 = XEXP (x, 0), op1 = XEXP (x, 1); if (earliest) *earliest = prev; } } /* If constant is first, put it last. */ if (CONSTANT_P (op0)) code = swap_condition (code), tem = op0, op0 = op1, op1 = tem; /* If OP0 is the result of a comparison, we weren't able to find what was really being compared, so fail. */ if (!allow_cc_mode && GET_MODE_CLASS (GET_MODE (op0)) == MODE_CC) return 0; /* Canonicalize any ordered comparison with integers involving equality if we can do computations in the relevant mode and we do not overflow. */ if (GET_MODE_CLASS (GET_MODE (op0)) != MODE_CC && GET_CODE (op1) == CONST_INT && GET_MODE (op0) != VOIDmode && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT) { HOST_WIDE_INT const_val = INTVAL (op1); unsigned HOST_WIDE_INT uconst_val = const_val; unsigned HOST_WIDE_INT max_val = (unsigned HOST_WIDE_INT) GET_MODE_MASK (GET_MODE (op0)); switch (code) { case LE: if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1) code = LT, op1 = gen_int_mode (const_val + 1, GET_MODE (op0)); break; /* When cross-compiling, const_val might be sign-extended from BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */ case GE: if ((HOST_WIDE_INT) (const_val & max_val) != (((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1)))) code = GT, op1 = gen_int_mode (const_val - 1, GET_MODE (op0)); break; case LEU: if (uconst_val < max_val) code = LTU, op1 = gen_int_mode (uconst_val + 1, GET_MODE (op0)); break; case GEU: if (uconst_val != 0) code = GTU, op1 = gen_int_mode (uconst_val - 1, GET_MODE (op0)); break; default: break; } } /* Never return CC0; return zero instead. */ if (CC0_P (op0)) return 0; return gen_rtx_fmt_ee (code, VOIDmode, op0, op1); } /* Given a jump insn JUMP, return the condition that will cause it to branch to its JUMP_LABEL. If the condition cannot be understood, or is an inequality floating-point comparison which needs to be reversed, 0 will be returned. If EARLIEST is nonzero, it is a pointer to a place where the earliest insn used in locating the condition was found. If a replacement test of the condition is desired, it should be placed in front of that insn and we will be sure that the inputs are still valid. If EARLIEST is null, the returned condition will be valid at INSN. If ALLOW_CC_MODE is nonzero, allow the condition returned to be a compare CC mode register. VALID_AT_INSN_P is the same as for canonicalize_condition. */ rtx get_condition (rtx jump, rtx *earliest, int allow_cc_mode, int valid_at_insn_p) { rtx cond; int reverse; rtx set; /* If this is not a standard conditional jump, we can't parse it. */ if (!JUMP_P (jump) || ! any_condjump_p (jump)) return 0; set = pc_set (jump); cond = XEXP (SET_SRC (set), 0); /* If this branches to JUMP_LABEL when the condition is false, reverse the condition. */ reverse = GET_CODE (XEXP (SET_SRC (set), 2)) == LABEL_REF && XEXP (XEXP (SET_SRC (set), 2), 0) == JUMP_LABEL (jump); return canonicalize_condition (jump, cond, reverse, earliest, NULL_RTX, allow_cc_mode, valid_at_insn_p); } /* Initialize the table NUM_SIGN_BIT_COPIES_IN_REP based on TARGET_MODE_REP_EXTENDED. Note that we assume that the property of TARGET_MODE_REP_EXTENDED(B, C) is sticky to the integral modes narrower than mode B. I.e., if A is a mode narrower than B then in order to be able to operate on it in mode B, mode A needs to satisfy the requirements set by the representation of mode B. */ static void init_num_sign_bit_copies_in_rep (void) { enum machine_mode mode, in_mode; for (in_mode = GET_CLASS_NARROWEST_MODE (MODE_INT); in_mode != VOIDmode; in_mode = GET_MODE_WIDER_MODE (mode)) for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != in_mode; mode = GET_MODE_WIDER_MODE (mode)) { enum machine_mode i; /* Currently, it is assumed that TARGET_MODE_REP_EXTENDED extends to the next widest mode. */ gcc_assert (targetm.mode_rep_extended (mode, in_mode) == UNKNOWN || GET_MODE_WIDER_MODE (mode) == in_mode); /* We are in in_mode. Count how many bits outside of mode have to be copies of the sign-bit. */ for (i = mode; i != in_mode; i = GET_MODE_WIDER_MODE (i)) { enum machine_mode wider = GET_MODE_WIDER_MODE (i); if (targetm.mode_rep_extended (i, wider) == SIGN_EXTEND /* We can only check sign-bit copies starting from the top-bit. In order to be able to check the bits we have already seen we pretend that subsequent bits have to be sign-bit copies too. */ || num_sign_bit_copies_in_rep [in_mode][mode]) num_sign_bit_copies_in_rep [in_mode][mode] += GET_MODE_BITSIZE (wider) - GET_MODE_BITSIZE (i); } } } /* Suppose that truncation from the machine mode of X to MODE is not a no-op. See if there is anything special about X so that we can assume it already contains a truncated value of MODE. */ bool truncated_to_mode (enum machine_mode mode, rtx x) { /* This register has already been used in MODE without explicit truncation. */ if (REG_P (x) && rtl_hooks.reg_truncated_to_mode (mode, x)) return true; /* See if we already satisfy the requirements of MODE. If yes we can just switch to MODE. */ if (num_sign_bit_copies_in_rep[GET_MODE (x)][mode] && (num_sign_bit_copies (x, GET_MODE (x)) >= num_sign_bit_copies_in_rep[GET_MODE (x)][mode] + 1)) return true; return false; } /* Initialize non_rtx_starting_operands, which is used to speed up for_each_rtx. */ void init_rtlanal (void) { int i; for (i = 0; i < NUM_RTX_CODE; i++) { const char *format = GET_RTX_FORMAT (i); const char *first = strpbrk (format, "eEV"); non_rtx_starting_operands[i] = first ? first - format : -1; } init_num_sign_bit_copies_in_rep (); } /* Check whether this is a constant pool constant. */ bool constant_pool_constant_p (rtx x) { x = avoid_constant_pool_reference (x); return GET_CODE (x) == CONST_DOUBLE; }