| /* Expands front end tree to back end RTL for GCC. |
| Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, |
| 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005 |
| Free Software Foundation, Inc. |
| |
| This file is part of GCC. |
| |
| GCC is free software; you can redistribute it and/or modify it under |
| the terms of the GNU General Public License as published by the Free |
| Software Foundation; either version 2, or (at your option) any later |
| version. |
| |
| GCC is distributed in the hope that it will be useful, but WITHOUT ANY |
| WARRANTY; without even the implied warranty of MERCHANTABILITY or |
| FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
| for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with GCC; see the file COPYING. If not, write to the Free |
| Software Foundation, 59 Temple Place - Suite 330, Boston, MA |
| 02111-1307, USA. */ |
| |
| /* This file handles the generation of rtl code from tree structure |
| at the level of the function as a whole. |
| It creates the rtl expressions for parameters and auto variables |
| and has full responsibility for allocating stack slots. |
| |
| `expand_function_start' is called at the beginning of a function, |
| before the function body is parsed, and `expand_function_end' is |
| called after parsing the body. |
| |
| Call `assign_stack_local' to allocate a stack slot for a local variable. |
| This is usually done during the RTL generation for the function body, |
| but it can also be done in the reload pass when a pseudo-register does |
| not get a hard register. */ |
| |
| #include "config.h" |
| #include "system.h" |
| #include "coretypes.h" |
| #include "tm.h" |
| #include "rtl.h" |
| #include "tree.h" |
| #include "flags.h" |
| #include "except.h" |
| #include "function.h" |
| #include "expr.h" |
| #include "optabs.h" |
| #include "libfuncs.h" |
| #include "regs.h" |
| #include "hard-reg-set.h" |
| #include "insn-config.h" |
| #include "recog.h" |
| #include "output.h" |
| #include "basic-block.h" |
| #include "toplev.h" |
| #include "hashtab.h" |
| #include "ggc.h" |
| #include "tm_p.h" |
| #include "integrate.h" |
| #include "langhooks.h" |
| #include "target.h" |
| #include "cfglayout.h" |
| #include "tree-gimple.h" |
| /* APPLE LOCAL mainline */ |
| #include "predict.h" |
| |
/* Unless the target overrides it, LOCAL_ALIGNMENT leaves the requested
   ALIGNMENT untouched.  */
#ifndef LOCAL_ALIGNMENT
#define LOCAL_ALIGNMENT(TYPE, ALIGNMENT) ALIGNMENT
#endif

/* Unless the target overrides it, stack slots always get their frame
   offset rounded to the requested alignment.  */
#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

/* STACK_BOUNDARY (given in bits) expressed in storage units.  */
#define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)

/* Some systems use __main in a way incompatible with its use in gcc; in
   these cases use the macros NAME__MAIN to give a quoted symbol and
   SYMBOL__MAIN to give the same symbol without quotes for an alternative
   entry point.  You must define both, or neither.  */
#ifndef NAME__MAIN
#define NAME__MAIN "__main"
#endif

/* Round VALUE down to the greatest multiple of ALIGN that does not exceed
   it.  A mask is used instead of division so that negative values are
   handled; ALIGN must be a power of two.

   The mask has the type of ALIGN.  When VALUE is wider than an unsigned
   ALIGN, cast ALIGN to VALUE's width first, otherwise the high bits of
   VALUE are cleared.  */
#define FLOOR_ROUND(VALUE,ALIGN) ((VALUE) & ~((ALIGN) - 1))

/* Likewise, but round VALUE up to the least multiple of ALIGN that is
   not smaller than it.  */
#define CEIL_ROUND(VALUE,ALIGN) (((VALUE) + (ALIGN) - 1) & ~((ALIGN) - 1))
| |
| /* Nonzero if function being compiled doesn't contain any calls |
| (ignoring the prologue and epilogue). This is set prior to |
| local register allocation and is valid for the remaining |
| compiler passes. */ |
| int current_function_is_leaf; |
| |
| /* Nonzero if function being compiled doesn't modify the stack pointer |
| (ignoring the prologue and epilogue). This is only valid after |
| life_analysis has run. */ |
| int current_function_sp_is_unchanging; |
| |
| /* Nonzero if the function being compiled is a leaf function which only |
| uses leaf registers. This is valid after reload (specifically after |
| sched2) and is useful only if the port defines LEAF_REGISTERS. */ |
| int current_function_uses_only_leaf_regs; |
| |
| /* Nonzero once virtual register instantiation has been done. |
| assign_stack_local uses frame_pointer_rtx when this is nonzero. |
| calls.c:emit_library_call_value_1 uses it to set up |
| post-instantiation libcalls. */ |
| int virtuals_instantiated; |
| |
| /* Assign unique numbers to labels generated for profiling, debugging, etc. */ |
| static GTY(()) int funcdef_no; |
| |
| /* These variables hold pointers to functions to create and destroy |
| target specific, per-function data structures. */ |
| struct machine_function * (*init_machine_status) (void); |
| |
| /* The currently compiled function. */ |
| struct function *cfun = 0; |
| |
| /* These arrays record the INSN_UIDs of the prologue and epilogue insns. */ |
| static GTY(()) varray_type prologue; |
| static GTY(()) varray_type epilogue; |
| |
| /* Array of INSN_UIDs to hold the INSN_UIDs for each sibcall epilogue |
| in this function. */ |
| static GTY(()) varray_type sibcall_epilogue; |
| |
| /* In order to evaluate some expressions, such as function calls returning |
| structures in memory, we need to temporarily allocate stack locations. |
| We record each allocated temporary in the following structure. |
| |
| Associated with each temporary slot is a nesting level. When we pop up |
| one level, all temporaries associated with the previous level are freed. |
| Normally, all temporaries are freed after the execution of the statement |
| in which they were created. However, if we are inside a ({...}) grouping, |
| the result may be in a temporary and hence must be preserved. If the |
| result could be in a temporary, we preserve it if we can determine which |
| one it is in. If we cannot determine which temporary may contain the |
| result, all temporaries are preserved. A temporary is preserved by |
| pretending it was allocated at the previous nesting level. |
| |
| Automatic variables are also assigned temporary slots, at the nesting |
| level where they are defined. They are marked a "kept" so that |
| free_temp_slots will not free them. */ |
| |
| struct temp_slot GTY(()) |
| { |
| /* Points to next temporary slot. */ |
| struct temp_slot *next; |
| /* Points to previous temporary slot. */ |
| struct temp_slot *prev; |
| |
| /* The rtx to used to reference the slot. */ |
| rtx slot; |
| /* The rtx used to represent the address if not the address of the |
| slot above. May be an EXPR_LIST if multiple addresses exist. */ |
| rtx address; |
| /* The alignment (in bits) of the slot. */ |
| unsigned int align; |
| /* The size, in units, of the slot. */ |
| HOST_WIDE_INT size; |
| /* The type of the object in the slot, or zero if it doesn't correspond |
| to a type. We use this to determine whether a slot can be reused. |
| It can be reused if objects of the type of the new slot will always |
| conflict with objects of the type of the old slot. */ |
| tree type; |
| /* Nonzero if this temporary is currently in use. */ |
| char in_use; |
| /* Nonzero if this temporary has its address taken. */ |
| char addr_taken; |
| /* Nesting level at which this slot is being used. */ |
| int level; |
| /* Nonzero if this should survive a call to free_temp_slots. */ |
| int keep; |
| /* The offset of the slot from the frame_pointer, including extra space |
| for alignment. This info is for combine_temp_slots. */ |
| HOST_WIDE_INT base_offset; |
| /* The size of the slot, including extra space for alignment. This |
| info is for combine_temp_slots. */ |
| HOST_WIDE_INT full_size; |
| }; |
| |
| /* Forward declarations. */ |
| |
| static rtx assign_stack_local_1 (enum machine_mode, HOST_WIDE_INT, int, |
| struct function *); |
| static struct temp_slot *find_temp_slot_from_address (rtx); |
| static void instantiate_decls (tree, int); |
| static void instantiate_decls_1 (tree, int); |
| static void instantiate_decl (rtx, HOST_WIDE_INT, int); |
| static rtx instantiate_new_reg (rtx, HOST_WIDE_INT *); |
| static int instantiate_virtual_regs_1 (rtx *, rtx, int); |
| static void pad_to_arg_alignment (struct args_size *, int, struct args_size *); |
| static void pad_below (struct args_size *, enum machine_mode, tree); |
| static void reorder_blocks_1 (rtx, tree, varray_type *); |
| static void reorder_fix_fragments (tree); |
| static int all_blocks (tree, tree *); |
| static tree *get_block_vector (tree, int *); |
| extern tree debug_find_var_in_block_tree (tree, tree); |
| /* We always define `record_insns' even if it's not used so that we |
| can always export `prologue_epilogue_contains'. */ |
| static void record_insns (rtx, varray_type *) ATTRIBUTE_UNUSED; |
| static int contains (rtx, varray_type); |
| #ifdef HAVE_return |
| static void emit_return_into_block (basic_block, rtx); |
| #endif |
| #if defined(HAVE_epilogue) && defined(INCOMING_RETURN_ADDR_RTX) |
| static rtx keep_stack_depressed (rtx); |
| #endif |
| static void prepare_function_start (tree); |
| static void do_clobber_return_reg (rtx, void *); |
| static void do_use_return_reg (rtx, void *); |
| static void instantiate_virtual_regs_lossage (rtx); |
| static void set_insn_locators (rtx, int) ATTRIBUTE_UNUSED; |
| |
| /* Pointer to chain of `struct function' for containing functions. */ |
| struct function *outer_function_chain; |
| |
| /* Given a function decl for a containing function, |
| return the `struct function' for it. */ |
| |
| struct function * |
| find_function_data (tree decl) |
| { |
| struct function *p; |
| |
| for (p = outer_function_chain; p; p = p->outer) |
| if (p->decl == decl) |
| return p; |
| |
| gcc_unreachable (); |
| } |
| |
| /* Save the current context for compilation of a nested function. |
| This is called from language-specific code. The caller should use |
| the enter_nested langhook to save any language-specific state, |
| since this function knows only about language-independent |
| variables. */ |
| |
| void |
| push_function_context_to (tree context) |
| { |
| struct function *p; |
| |
| if (context) |
| { |
| if (context == current_function_decl) |
| cfun->contains_functions = 1; |
| else |
| { |
| struct function *containing = find_function_data (context); |
| containing->contains_functions = 1; |
| } |
| } |
| |
| if (cfun == 0) |
| init_dummy_function_start (); |
| p = cfun; |
| |
| p->outer = outer_function_chain; |
| outer_function_chain = p; |
| |
| lang_hooks.function.enter_nested (p); |
| |
| cfun = 0; |
| } |
| |
| void |
| push_function_context (void) |
| { |
| push_function_context_to (current_function_decl); |
| } |
| |
| /* Restore the last saved context, at the end of a nested function. |
| This function is called from language-specific code. */ |
| |
| void |
| pop_function_context_from (tree context ATTRIBUTE_UNUSED) |
| { |
| struct function *p = outer_function_chain; |
| |
| cfun = p; |
| outer_function_chain = p->outer; |
| |
| current_function_decl = p->decl; |
| |
| lang_hooks.function.leave_nested (p); |
| |
| /* Reset variables that have known state during rtx generation. */ |
| virtuals_instantiated = 0; |
| generating_concat_p = 1; |
| } |
| |
| void |
| pop_function_context (void) |
| { |
| pop_function_context_from (current_function_decl); |
| } |
| |
| /* Clear out all parts of the state in F that can safely be discarded |
| after the function has been parsed, but not compiled, to let |
| garbage collection reclaim the memory. */ |
| |
| void |
| free_after_parsing (struct function *f) |
| { |
| /* f->expr->forced_labels is used by code generation. */ |
| /* f->emit->regno_reg_rtx is used by code generation. */ |
| /* f->varasm is used by code generation. */ |
| /* f->eh->eh_return_stub_label is used by code generation. */ |
| |
| lang_hooks.function.final (f); |
| } |
| |
| /* Clear out all parts of the state in F that can safely be discarded |
| after the function has been compiled, to let garbage collection |
| reclaim the memory. */ |
| |
| void |
| free_after_compilation (struct function *f) |
| { |
| f->eh = NULL; |
| f->expr = NULL; |
| f->emit = NULL; |
| f->varasm = NULL; |
| f->machine = NULL; |
| |
| f->x_avail_temp_slots = NULL; |
| f->x_used_temp_slots = NULL; |
| f->arg_offset_rtx = NULL; |
| f->return_rtx = NULL; |
| f->internal_arg_pointer = NULL; |
| f->x_nonlocal_goto_handler_labels = NULL; |
| f->x_return_label = NULL; |
| f->x_naked_return_label = NULL; |
| f->x_stack_slot_list = NULL; |
| f->x_tail_recursion_reentry = NULL; |
| f->x_arg_pointer_save_area = NULL; |
| f->x_parm_birth_insn = NULL; |
| f->original_arg_vector = NULL; |
| f->original_decl_initial = NULL; |
| f->epilogue_delay_list = NULL; |
| } |
| |
| /* Allocate fixed slots in the stack frame of the current function. */ |
| |
| /* Return size needed for stack frame based on slots so far allocated in |
| function F. |
| This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY; |
| the caller may have to do that. */ |
| |
| HOST_WIDE_INT |
| get_func_frame_size (struct function *f) |
| { |
| /* APPLE LOCAL begin mainline */ |
| if (FRAME_GROWS_DOWNWARD) |
| return -f->x_frame_offset; |
| else |
| return f->x_frame_offset; |
| /* APPLE LOCAL end mainline */ |
| } |
| |
| /* Return size needed for stack frame based on slots so far allocated. |
| This size counts from zero. It is not rounded to PREFERRED_STACK_BOUNDARY; |
| the caller may have to do that. */ |
| HOST_WIDE_INT |
| get_frame_size (void) |
| { |
| return get_func_frame_size (cfun); |
| } |
| |
| /* Allocate a stack slot of SIZE bytes and return a MEM rtx for it |
| with machine mode MODE. |
| |
| ALIGN controls the amount of alignment for the address of the slot: |
| 0 means according to MODE, |
| -1 means use BIGGEST_ALIGNMENT and round size to multiple of that, |
| -2 means use BITS_PER_UNIT, |
| positive specifies alignment boundary in bits. |
| |
| We do not round to stack_boundary here. |
| |
| FUNCTION specifies the function to allocate in. */ |
| |
| static rtx |
| assign_stack_local_1 (enum machine_mode mode, HOST_WIDE_INT size, int align, |
| struct function *function) |
| { |
| rtx x, addr; |
| int bigend_correction = 0; |
| unsigned int alignment; |
| int frame_off, frame_alignment, frame_phase; |
| |
| if (align == 0) |
| { |
| tree type; |
| |
| if (mode == BLKmode) |
| alignment = BIGGEST_ALIGNMENT; |
| else |
| alignment = GET_MODE_ALIGNMENT (mode); |
| |
| /* Allow the target to (possibly) increase the alignment of this |
| stack slot. */ |
| type = lang_hooks.types.type_for_mode (mode, 0); |
| if (type) |
| alignment = LOCAL_ALIGNMENT (type, alignment); |
| |
| alignment /= BITS_PER_UNIT; |
| } |
| else if (align == -1) |
| { |
| alignment = BIGGEST_ALIGNMENT / BITS_PER_UNIT; |
| size = CEIL_ROUND (size, alignment); |
| } |
| else if (align == -2) |
| alignment = 1; /* BITS_PER_UNIT / BITS_PER_UNIT */ |
| else |
| alignment = align / BITS_PER_UNIT; |
| |
| /* APPLE LOCAL begin mainline */ |
| if (FRAME_GROWS_DOWNWARD) |
| function->x_frame_offset -= size; |
| /* APPLE LOCAL end mainline */ |
| |
| /* Ignore alignment we can't do with expected alignment of the boundary. */ |
| if (alignment * BITS_PER_UNIT > PREFERRED_STACK_BOUNDARY) |
| alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT; |
| |
| if (function->stack_alignment_needed < alignment * BITS_PER_UNIT) |
| function->stack_alignment_needed = alignment * BITS_PER_UNIT; |
| |
| /* Calculate how many bytes the start of local variables is off from |
| stack alignment. */ |
| frame_alignment = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT; |
| frame_off = STARTING_FRAME_OFFSET % frame_alignment; |
| frame_phase = frame_off ? frame_alignment - frame_off : 0; |
| |
| /* Round the frame offset to the specified alignment. The default is |
| to always honor requests to align the stack but a port may choose to |
| do its own stack alignment by defining STACK_ALIGNMENT_NEEDED. */ |
| if (STACK_ALIGNMENT_NEEDED |
| || mode != BLKmode |
| || size != 0) |
| { |
| /* We must be careful here, since FRAME_OFFSET might be negative and |
| division with a negative dividend isn't as well defined as we might |
| like. So we instead assume that ALIGNMENT is a power of two and |
| use logical operations which are unambiguous. */ |
| /* APPLE LOCAL begin mainline */ |
| if (FRAME_GROWS_DOWNWARD) |
| function->x_frame_offset |
| = (FLOOR_ROUND (function->x_frame_offset - frame_phase, |
| (unsigned HOST_WIDE_INT) alignment) |
| + frame_phase); |
| else |
| function->x_frame_offset |
| = (CEIL_ROUND (function->x_frame_offset - frame_phase, |
| (unsigned HOST_WIDE_INT) alignment) |
| + frame_phase); |
| /* APPLE LOCAL end mainline */ |
| } |
| |
| /* On a big-endian machine, if we are allocating more space than we will use, |
| use the least significant bytes of those that are allocated. */ |
| if (BYTES_BIG_ENDIAN && mode != BLKmode) |
| bigend_correction = size - GET_MODE_SIZE (mode); |
| |
| /* If we have already instantiated virtual registers, return the actual |
| address relative to the frame pointer. */ |
| if (function == cfun && virtuals_instantiated) |
| addr = plus_constant (frame_pointer_rtx, |
| trunc_int_for_mode |
| (frame_offset + bigend_correction |
| + STARTING_FRAME_OFFSET, Pmode)); |
| else |
| addr = plus_constant (virtual_stack_vars_rtx, |
| trunc_int_for_mode |
| (function->x_frame_offset + bigend_correction, |
| Pmode)); |
| |
| /* APPLE LOCAL begin mainline */ |
| if (!FRAME_GROWS_DOWNWARD) |
| function->x_frame_offset += size; |
| /* APPLE LOCAL end mainline */ |
| |
| x = gen_rtx_MEM (mode, addr); |
| |
| function->x_stack_slot_list |
| = gen_rtx_EXPR_LIST (VOIDmode, x, function->x_stack_slot_list); |
| |
| return x; |
| } |
| |
| /* Wrapper around assign_stack_local_1; assign a local stack slot for the |
| current function. */ |
| |
| rtx |
| assign_stack_local (enum machine_mode mode, HOST_WIDE_INT size, int align) |
| { |
| return assign_stack_local_1 (mode, size, align, cfun); |
| } |
| |
| /* APPLE LOCAL begin new function for rs6000 consumption */ |
| /* Wrapper around assign_stack_local_1; assign a local stack slot for the |
| current function, then set the mem_alias to a new alias set. |
| This can be used only in situations where the target code can |
| guarantee that the slot is used in a way that cannot conflict |
| with anything else. */ |
| |
| rtx |
| assign_stack_local_with_alias (enum machine_mode mode, HOST_WIDE_INT size, |
| int align) |
| { |
| rtx mem = assign_stack_local_1 (mode, size, align, cfun); |
| set_mem_alias_set (mem, new_alias_set ()); |
| return mem; |
| } |
| /* APPLE LOCAL end new function for rs6000 consumption */ |
| |
| |
| /* Removes temporary slot TEMP from LIST. */ |
| |
| static void |
| cut_slot_from_list (struct temp_slot *temp, struct temp_slot **list) |
| { |
| if (temp->next) |
| temp->next->prev = temp->prev; |
| if (temp->prev) |
| temp->prev->next = temp->next; |
| else |
| *list = temp->next; |
| |
| temp->prev = temp->next = NULL; |
| } |
| |
| /* Inserts temporary slot TEMP to LIST. */ |
| |
| static void |
| insert_slot_to_list (struct temp_slot *temp, struct temp_slot **list) |
| { |
| temp->next = *list; |
| if (*list) |
| (*list)->prev = temp; |
| temp->prev = NULL; |
| *list = temp; |
| } |
| |
| /* Returns the list of used temp slots at LEVEL. */ |
| |
| static struct temp_slot ** |
| temp_slots_at_level (int level) |
| { |
| |
| if (!used_temp_slots) |
| VARRAY_GENERIC_PTR_INIT (used_temp_slots, 3, "used_temp_slots"); |
| |
| while (level >= (int) VARRAY_ACTIVE_SIZE (used_temp_slots)) |
| VARRAY_PUSH_GENERIC_PTR (used_temp_slots, NULL); |
| |
| return (struct temp_slot **) &VARRAY_GENERIC_PTR (used_temp_slots, level); |
| } |
| |
| /* Returns the maximal temporary slot level. */ |
| |
| static int |
| max_slot_level (void) |
| { |
| if (!used_temp_slots) |
| return -1; |
| |
| return VARRAY_ACTIVE_SIZE (used_temp_slots) - 1; |
| } |
| |
| /* Moves temporary slot TEMP to LEVEL. */ |
| |
| static void |
| move_slot_to_level (struct temp_slot *temp, int level) |
| { |
| cut_slot_from_list (temp, temp_slots_at_level (temp->level)); |
| insert_slot_to_list (temp, temp_slots_at_level (level)); |
| temp->level = level; |
| } |
| |
| /* Make temporary slot TEMP available. */ |
| |
| static void |
| make_slot_available (struct temp_slot *temp) |
| { |
| cut_slot_from_list (temp, temp_slots_at_level (temp->level)); |
| insert_slot_to_list (temp, &avail_temp_slots); |
| temp->in_use = 0; |
| temp->level = -1; |
| } |
| |
| /* Allocate a temporary stack slot and record it for possible later |
| reuse. |
| |
| MODE is the machine mode to be given to the returned rtx. |
| |
| SIZE is the size in units of the space required. We do no rounding here |
| since assign_stack_local will do any required rounding. |
| |
| KEEP is 1 if this slot is to be retained after a call to |
| free_temp_slots. Automatic variables for a block are allocated |
| with this flag. KEEP values of 2 or 3 were needed respectively |
| for variables whose lifetime is controlled by CLEANUP_POINT_EXPRs |
| or for SAVE_EXPRs, but they are now unused and will abort. |
| |
| TYPE is the type that will be used for the stack slot. */ |
| |
| rtx |
| assign_stack_temp_for_type (enum machine_mode mode, HOST_WIDE_INT size, int keep, |
| tree type) |
| { |
| unsigned int align; |
| struct temp_slot *p, *best_p = 0, *selected = NULL, **pp; |
| rtx slot; |
| |
| /* If SIZE is -1 it means that somebody tried to allocate a temporary |
| of a variable size. */ |
| gcc_assert (size != -1); |
| |
| /* These are now unused. */ |
| gcc_assert (keep <= 1); |
| |
| if (mode == BLKmode) |
| align = BIGGEST_ALIGNMENT; |
| else |
| align = GET_MODE_ALIGNMENT (mode); |
| |
| if (! type) |
| type = lang_hooks.types.type_for_mode (mode, 0); |
| |
| if (type) |
| align = LOCAL_ALIGNMENT (type, align); |
| |
| /* Try to find an available, already-allocated temporary of the proper |
| mode which meets the size and alignment requirements. Choose the |
| smallest one with the closest alignment. */ |
| for (p = avail_temp_slots; p; p = p->next) |
| { |
| if (p->align >= align && p->size >= size && GET_MODE (p->slot) == mode |
| && objects_must_conflict_p (p->type, type) |
| && (best_p == 0 || best_p->size > p->size |
| || (best_p->size == p->size && best_p->align > p->align))) |
| { |
| if (p->align == align && p->size == size) |
| { |
| selected = p; |
| cut_slot_from_list (selected, &avail_temp_slots); |
| best_p = 0; |
| break; |
| } |
| best_p = p; |
| } |
| } |
| |
| /* Make our best, if any, the one to use. */ |
| if (best_p) |
| { |
| selected = best_p; |
| cut_slot_from_list (selected, &avail_temp_slots); |
| |
| /* If there are enough aligned bytes left over, make them into a new |
| temp_slot so that the extra bytes don't get wasted. Do this only |
| for BLKmode slots, so that we can be sure of the alignment. */ |
| if (GET_MODE (best_p->slot) == BLKmode) |
| { |
| int alignment = best_p->align / BITS_PER_UNIT; |
| HOST_WIDE_INT rounded_size = CEIL_ROUND (size, alignment); |
| |
| if (best_p->size - rounded_size >= alignment) |
| { |
| p = ggc_alloc (sizeof (struct temp_slot)); |
| p->in_use = p->addr_taken = 0; |
| p->size = best_p->size - rounded_size; |
| p->base_offset = best_p->base_offset + rounded_size; |
| p->full_size = best_p->full_size - rounded_size; |
| p->slot = gen_rtx_MEM (BLKmode, |
| plus_constant (XEXP (best_p->slot, 0), |
| rounded_size)); |
| p->align = best_p->align; |
| p->address = 0; |
| p->type = best_p->type; |
| insert_slot_to_list (p, &avail_temp_slots); |
| |
| stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, p->slot, |
| stack_slot_list); |
| |
| best_p->size = rounded_size; |
| best_p->full_size = rounded_size; |
| } |
| } |
| } |
| |
| /* If we still didn't find one, make a new temporary. */ |
| if (selected == 0) |
| { |
| HOST_WIDE_INT frame_offset_old = frame_offset; |
| |
| p = ggc_alloc (sizeof (struct temp_slot)); |
| |
| /* We are passing an explicit alignment request to assign_stack_local. |
| One side effect of that is assign_stack_local will not round SIZE |
| to ensure the frame offset remains suitably aligned. |
| |
| So for requests which depended on the rounding of SIZE, we go ahead |
| and round it now. We also make sure ALIGNMENT is at least |
| BIGGEST_ALIGNMENT. */ |
| gcc_assert (mode != BLKmode || align == BIGGEST_ALIGNMENT); |
| p->slot = assign_stack_local (mode, |
| (mode == BLKmode |
| ? CEIL_ROUND (size, (int) align / BITS_PER_UNIT) |
| : size), |
| align); |
| |
| p->align = align; |
| |
| /* The following slot size computation is necessary because we don't |
| know the actual size of the temporary slot until assign_stack_local |
| has performed all the frame alignment and size rounding for the |
| requested temporary. Note that extra space added for alignment |
| can be either above or below this stack slot depending on which |
| way the frame grows. We include the extra space if and only if it |
| is above this slot. */ |
| /* APPLE LOCAL begin mainline */ |
| if (FRAME_GROWS_DOWNWARD) |
| p->size = frame_offset_old - frame_offset; |
| else |
| p->size = size; |
| |
| /* Now define the fields used by combine_temp_slots. */ |
| if (FRAME_GROWS_DOWNWARD) |
| { |
| p->base_offset = frame_offset; |
| p->full_size = frame_offset_old - frame_offset; |
| } |
| else |
| { |
| p->base_offset = frame_offset_old; |
| p->full_size = frame_offset - frame_offset_old; |
| } |
| /* APPLE LOCAL end mainline */ |
| p->address = 0; |
| |
| selected = p; |
| } |
| |
| p = selected; |
| p->in_use = 1; |
| p->addr_taken = 0; |
| p->type = type; |
| p->level = temp_slot_level; |
| p->keep = keep; |
| |
| pp = temp_slots_at_level (p->level); |
| insert_slot_to_list (p, pp); |
| |
| /* Create a new MEM rtx to avoid clobbering MEM flags of old slots. */ |
| slot = gen_rtx_MEM (mode, XEXP (p->slot, 0)); |
| stack_slot_list = gen_rtx_EXPR_LIST (VOIDmode, slot, stack_slot_list); |
| |
| /* If we know the alias set for the memory that will be used, use |
| it. If there's no TYPE, then we don't know anything about the |
| alias set for the memory. */ |
| set_mem_alias_set (slot, type ? get_alias_set (type) : 0); |
| set_mem_align (slot, align); |
| |
| /* If a type is specified, set the relevant flags. */ |
| if (type != 0) |
| { |
| MEM_VOLATILE_P (slot) = TYPE_VOLATILE (type); |
| MEM_SET_IN_STRUCT_P (slot, AGGREGATE_TYPE_P (type)); |
| } |
| |
| return slot; |
| } |
| |
| /* Allocate a temporary stack slot and record it for possible later |
| reuse. First three arguments are same as in preceding function. */ |
| |
| rtx |
| assign_stack_temp (enum machine_mode mode, HOST_WIDE_INT size, int keep) |
| { |
| return assign_stack_temp_for_type (mode, size, keep, NULL_TREE); |
| } |
| |
| /* Assign a temporary. |
| If TYPE_OR_DECL is a decl, then we are doing it on behalf of the decl |
| and so that should be used in error messages. In either case, we |
| allocate of the given type. |
| KEEP is as for assign_stack_temp. |
| MEMORY_REQUIRED is 1 if the result must be addressable stack memory; |
| it is 0 if a register is OK. |
| DONT_PROMOTE is 1 if we should not promote values in register |
| to wider modes. */ |
| |
| rtx |
| assign_temp (tree type_or_decl, int keep, int memory_required, |
| int dont_promote ATTRIBUTE_UNUSED) |
| { |
| tree type, decl; |
| enum machine_mode mode; |
| #ifdef PROMOTE_MODE |
| int unsignedp; |
| #endif |
| |
| if (DECL_P (type_or_decl)) |
| decl = type_or_decl, type = TREE_TYPE (decl); |
| else |
| decl = NULL, type = type_or_decl; |
| |
| mode = TYPE_MODE (type); |
| #ifdef PROMOTE_MODE |
| unsignedp = TYPE_UNSIGNED (type); |
| #endif |
| |
| if (mode == BLKmode || memory_required) |
| { |
| HOST_WIDE_INT size = int_size_in_bytes (type); |
| tree size_tree; |
| rtx tmp; |
| |
| /* Zero sized arrays are GNU C extension. Set size to 1 to avoid |
| problems with allocating the stack space. */ |
| if (size == 0) |
| size = 1; |
| |
| /* Unfortunately, we don't yet know how to allocate variable-sized |
| temporaries. However, sometimes we have a fixed upper limit on |
| the size (which is stored in TYPE_ARRAY_MAX_SIZE) and can use that |
| instead. This is the case for Chill variable-sized strings. */ |
| if (size == -1 && TREE_CODE (type) == ARRAY_TYPE |
| && TYPE_ARRAY_MAX_SIZE (type) != NULL_TREE |
| && host_integerp (TYPE_ARRAY_MAX_SIZE (type), 1)) |
| size = tree_low_cst (TYPE_ARRAY_MAX_SIZE (type), 1); |
| |
| /* If we still haven't been able to get a size, see if the language |
| can compute a maximum size. */ |
| if (size == -1 |
| && (size_tree = lang_hooks.types.max_size (type)) != 0 |
| && host_integerp (size_tree, 1)) |
| size = tree_low_cst (size_tree, 1); |
| |
| /* The size of the temporary may be too large to fit into an integer. */ |
| /* ??? Not sure this should happen except for user silliness, so limit |
| this to things that aren't compiler-generated temporaries. The |
| rest of the time we'll abort in assign_stack_temp_for_type. */ |
| if (decl && size == -1 |
| && TREE_CODE (TYPE_SIZE_UNIT (type)) == INTEGER_CST) |
| { |
| error ("%Jsize of variable %qD is too large", decl, decl); |
| size = 1; |
| } |
| |
| tmp = assign_stack_temp_for_type (mode, size, keep, type); |
| return tmp; |
| } |
| |
| #ifdef PROMOTE_MODE |
| if (! dont_promote) |
| mode = promote_mode (type, mode, &unsignedp, 0); |
| #endif |
| |
| return gen_reg_rtx (mode); |
| } |
| |
| /* Combine temporary stack slots which are adjacent on the stack. |
| |
| This allows for better use of already allocated stack space. This is only |
| done for BLKmode slots because we can be sure that we won't have alignment |
| problems in this case. */ |
| |
| static void |
| combine_temp_slots (void) |
| { |
| struct temp_slot *p, *q, *next, *next_q; |
| int num_slots; |
| |
| /* We can't combine slots, because the information about which slot |
| is in which alias set will be lost. */ |
| if (flag_strict_aliasing) |
| return; |
| |
| /* If there are a lot of temp slots, don't do anything unless |
| high levels of optimization. */ |
| if (! flag_expensive_optimizations) |
| for (p = avail_temp_slots, num_slots = 0; p; p = p->next, num_slots++) |
| if (num_slots > 100 || (num_slots > 10 && optimize == 0)) |
| return; |
| |
| for (p = avail_temp_slots; p; p = next) |
| { |
| int delete_p = 0; |
| |
| next = p->next; |
| |
| if (GET_MODE (p->slot) != BLKmode) |
| continue; |
| |
| for (q = p->next; q; q = next_q) |
| { |
| int delete_q = 0; |
| |
| next_q = q->next; |
| |
| if (GET_MODE (q->slot) != BLKmode) |
| continue; |
| |
| if (p->base_offset + p->full_size == q->base_offset) |
| { |
| /* Q comes after P; combine Q into P. */ |
| p->size += q->size; |
| p->full_size += q->full_size; |
| delete_q = 1; |
| } |
| else if (q->base_offset + q->full_size == p->base_offset) |
| { |
| /* P comes after Q; combine P into Q. */ |
| q->size += p->size; |
| q->full_size += p->full_size; |
| delete_p = 1; |
| break; |
| } |
| if (delete_q) |
| cut_slot_from_list (q, &avail_temp_slots); |
| } |
| |
| /* Either delete P or advance past it. */ |
| if (delete_p) |
| cut_slot_from_list (p, &avail_temp_slots); |
| } |
| } |
| |
| /* Find the temp slot corresponding to the object at address X. */ |
| |
| static struct temp_slot * |
| find_temp_slot_from_address (rtx x) |
| { |
| struct temp_slot *p; |
| rtx next; |
| int i; |
| |
| for (i = max_slot_level (); i >= 0; i--) |
| for (p = *temp_slots_at_level (i); p; p = p->next) |
| { |
| if (XEXP (p->slot, 0) == x |
| || p->address == x |
| || (GET_CODE (x) == PLUS |
| && XEXP (x, 0) == virtual_stack_vars_rtx |
| && GET_CODE (XEXP (x, 1)) == CONST_INT |
| && INTVAL (XEXP (x, 1)) >= p->base_offset |
| && INTVAL (XEXP (x, 1)) < p->base_offset + p->full_size)) |
| return p; |
| |
| else if (p->address != 0 && GET_CODE (p->address) == EXPR_LIST) |
| for (next = p->address; next; next = XEXP (next, 1)) |
| if (XEXP (next, 0) == x) |
| return p; |
| } |
| |
| /* If we have a sum involving a register, see if it points to a temp |
| slot. */ |
| if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 0)) |
| && (p = find_temp_slot_from_address (XEXP (x, 0))) != 0) |
| return p; |
| else if (GET_CODE (x) == PLUS && REG_P (XEXP (x, 1)) |
| && (p = find_temp_slot_from_address (XEXP (x, 1))) != 0) |
| return p; |
| |
| return 0; |
| } |
| |
| /* Indicate that NEW is an alternate way of referring to the temp slot |
| that previously was known by OLD. */ |
| |
| void |
| update_temp_slot_address (rtx old, rtx new) |
| { |
| struct temp_slot *p; |
| |
| if (rtx_equal_p (old, new)) |
| return; |
| |
| p = find_temp_slot_from_address (old); |
| |
| /* If we didn't find one, see if both OLD is a PLUS. If so, and NEW |
| is a register, see if one operand of the PLUS is a temporary |
| location. If so, NEW points into it. Otherwise, if both OLD and |
| NEW are a PLUS and if there is a register in common between them. |
| If so, try a recursive call on those values. */ |
| if (p == 0) |
| { |
| if (GET_CODE (old) != PLUS) |
| return; |
| |
| if (REG_P (new)) |
| { |
| update_temp_slot_address (XEXP (old, 0), new); |
| update_temp_slot_address (XEXP (old, 1), new); |
| return; |
| } |
| else if (GET_CODE (new) != PLUS) |
| return; |
| |
| if (rtx_equal_p (XEXP (old, 0), XEXP (new, 0))) |
| update_temp_slot_address (XEXP (old, 1), XEXP (new, 1)); |
| else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 0))) |
| update_temp_slot_address (XEXP (old, 0), XEXP (new, 1)); |
| else if (rtx_equal_p (XEXP (old, 0), XEXP (new, 1))) |
| update_temp_slot_address (XEXP (old, 1), XEXP (new, 0)); |
| else if (rtx_equal_p (XEXP (old, 1), XEXP (new, 1))) |
| update_temp_slot_address (XEXP (old, 0), XEXP (new, 0)); |
| |
| return; |
| } |
| |
| /* Otherwise add an alias for the temp's address. */ |
| else if (p->address == 0) |
| p->address = new; |
| else |
| { |
| if (GET_CODE (p->address) != EXPR_LIST) |
| p->address = gen_rtx_EXPR_LIST (VOIDmode, p->address, NULL_RTX); |
| |
| p->address = gen_rtx_EXPR_LIST (VOIDmode, new, p->address); |
| } |
| } |
| |
| /* If X could be a reference to a temporary slot, mark the fact that its |
| address was taken. */ |
| |
| void |
| mark_temp_addr_taken (rtx x) |
| { |
| struct temp_slot *p; |
| |
| if (x == 0) |
| return; |
| |
| /* If X is not in memory or is at a constant address, it cannot be in |
| a temporary slot. */ |
| if (!MEM_P (x) || CONSTANT_P (XEXP (x, 0))) |
| return; |
| |
| p = find_temp_slot_from_address (XEXP (x, 0)); |
| if (p != 0) |
| p->addr_taken = 1; |
| } |
| |
| /* If X could be a reference to a temporary slot, mark that slot as |
| belonging to the to one level higher than the current level. If X |
| matched one of our slots, just mark that one. Otherwise, we can't |
| easily predict which it is, so upgrade all of them. Kept slots |
| need not be touched. |
| |
| This is called when an ({...}) construct occurs and a statement |
| returns a value in memory. */ |
| |
| void |
| preserve_temp_slots (rtx x) |
| { |
| struct temp_slot *p = 0, *next; |
| |
| /* If there is no result, we still might have some objects whose address |
| were taken, so we need to make sure they stay around. */ |
| if (x == 0) |
| { |
| for (p = *temp_slots_at_level (temp_slot_level); p; p = next) |
| { |
| next = p->next; |
| |
| if (p->addr_taken) |
| move_slot_to_level (p, temp_slot_level - 1); |
| } |
| |
| return; |
| } |
| |
| /* If X is a register that is being used as a pointer, see if we have |
| a temporary slot we know it points to. To be consistent with |
| the code below, we really should preserve all non-kept slots |
| if we can't find a match, but that seems to be much too costly. */ |
| if (REG_P (x) && REG_POINTER (x)) |
| p = find_temp_slot_from_address (x); |
| |
| /* If X is not in memory or is at a constant address, it cannot be in |
| a temporary slot, but it can contain something whose address was |
| taken. */ |
| if (p == 0 && (!MEM_P (x) || CONSTANT_P (XEXP (x, 0)))) |
| { |
| for (p = *temp_slots_at_level (temp_slot_level); p; p = next) |
| { |
| next = p->next; |
| |
| if (p->addr_taken) |
| move_slot_to_level (p, temp_slot_level - 1); |
| } |
| |
| return; |
| } |
| |
| /* First see if we can find a match. */ |
| if (p == 0) |
| p = find_temp_slot_from_address (XEXP (x, 0)); |
| |
| if (p != 0) |
| { |
| /* Move everything at our level whose address was taken to our new |
| level in case we used its address. */ |
| struct temp_slot *q; |
| |
| if (p->level == temp_slot_level) |
| { |
| for (q = *temp_slots_at_level (temp_slot_level); q; q = next) |
| { |
| next = q->next; |
| |
| if (p != q && q->addr_taken) |
| move_slot_to_level (q, temp_slot_level - 1); |
| } |
| |
| move_slot_to_level (p, temp_slot_level - 1); |
| p->addr_taken = 0; |
| } |
| return; |
| } |
| |
| /* Otherwise, preserve all non-kept slots at this level. */ |
| for (p = *temp_slots_at_level (temp_slot_level); p; p = next) |
| { |
| next = p->next; |
| |
| if (!p->keep) |
| move_slot_to_level (p, temp_slot_level - 1); |
| } |
| } |
| |
| /* Free all temporaries used so far. This is normally called at the |
| end of generating code for a statement. */ |
| |
| void |
| free_temp_slots (void) |
| { |
| struct temp_slot *p, *next; |
| |
| for (p = *temp_slots_at_level (temp_slot_level); p; p = next) |
| { |
| next = p->next; |
| |
| if (!p->keep) |
| make_slot_available (p); |
| } |
| |
| combine_temp_slots (); |
| } |
| |
| /* Push deeper into the nesting level for stack temporaries. */ |
| |
| void |
| push_temp_slots (void) |
| { |
| temp_slot_level++; |
| } |
| |
| /* Pop a temporary nesting level. All slots in use in the current level |
| are freed. */ |
| |
| void |
| pop_temp_slots (void) |
| { |
| struct temp_slot *p, *next; |
| |
| for (p = *temp_slots_at_level (temp_slot_level); p; p = next) |
| { |
| next = p->next; |
| make_slot_available (p); |
| } |
| |
| combine_temp_slots (); |
| |
| temp_slot_level--; |
| } |
| |
| /* Initialize temporary slots. */ |
| |
| void |
| init_temp_slots (void) |
| { |
| /* We have not allocated any temporaries yet. */ |
| avail_temp_slots = 0; |
| used_temp_slots = 0; |
| temp_slot_level = 0; |
| } |
| |
/* These routines are responsible for converting virtual register references
   to the actual hard register references once RTL generation is complete.

   The following five variables are used for communication between the
   routines.  They contain the offsets of the virtual registers from their
   respective hard registers.  They are set by instantiate_virtual_regs
   and read by instantiate_new_reg.  */

/* Offset used when virtual_incoming_args_rtx becomes arg_pointer_rtx.  */
static int in_arg_offset;
/* Offset used when virtual_stack_vars_rtx becomes frame_pointer_rtx.  */
static int var_offset;
/* Offset used when virtual_stack_dynamic_rtx becomes stack_pointer_rtx.  */
static int dynamic_offset;
/* Offset used when virtual_outgoing_args_rtx becomes stack_pointer_rtx.  */
static int out_arg_offset;
/* Offset used when virtual_cfa_rtx becomes arg_pointer_rtx.  */
static int cfa_offset;
| |
/* On most machines, the stack pointer register is equivalent to the bottom
   of the stack, so the default offset is zero.  */

#ifndef STACK_POINTER_OFFSET
#define STACK_POINTER_OFFSET 0
#endif

/* If not defined, pick an appropriate default for the offset of dynamically
   allocated memory depending on the value of ACCUMULATE_OUTGOING_ARGS,
   REG_PARM_STACK_SPACE, and OUTGOING_REG_PARM_STACK_SPACE.  */

#ifndef STACK_DYNAMIC_OFFSET

/* The bottom of the stack points to the actual arguments.  If
   REG_PARM_STACK_SPACE is defined, this includes the space for the register
   parameters.  However, if OUTGOING_REG_PARM_STACK_SPACE is not defined,
   stack space for register parameters is not pushed by the caller, but
   rather part of the fixed stack areas and hence not included in
   `current_function_outgoing_args_size'.  Nevertheless, we must allow
   for it when allocating stack dynamic objects.  */

/* Note: the last line of each definition must not end in a backslash;
   a trailing continuation would splice the following line into the
   macro body.  */
#if defined(REG_PARM_STACK_SPACE) && ! defined(OUTGOING_REG_PARM_STACK_SPACE)
#define STACK_DYNAMIC_OFFSET(FNDECL) \
 ((ACCUMULATE_OUTGOING_ARGS \
   ? (current_function_outgoing_args_size + REG_PARM_STACK_SPACE (FNDECL)) : 0)\
  + (STACK_POINTER_OFFSET))

#else
#define STACK_DYNAMIC_OFFSET(FNDECL) \
 ((ACCUMULATE_OUTGOING_ARGS ? current_function_outgoing_args_size : 0) \
  + (STACK_POINTER_OFFSET))
#endif
#endif

/* On most machines, the CFA coincides with the first incoming parm.  */

#ifndef ARG_POINTER_CFA_OFFSET
#define ARG_POINTER_CFA_OFFSET(FNDECL) FIRST_PARM_OFFSET (FNDECL)
#endif
| |
| |
| /* Pass through the INSNS of function FNDECL and convert virtual register |
| references to hard register references. */ |
| |
| void |
| instantiate_virtual_regs (void) |
| { |
| rtx insn; |
| |
| /* Compute the offsets to use for this function. */ |
| in_arg_offset = FIRST_PARM_OFFSET (current_function_decl); |
| var_offset = STARTING_FRAME_OFFSET; |
| dynamic_offset = STACK_DYNAMIC_OFFSET (current_function_decl); |
| out_arg_offset = STACK_POINTER_OFFSET; |
| cfa_offset = ARG_POINTER_CFA_OFFSET (current_function_decl); |
| |
| /* Scan all variables and parameters of this function. For each that is |
| in memory, instantiate all virtual registers if the result is a valid |
| address. If not, we do it later. That will handle most uses of virtual |
| regs on many machines. */ |
| instantiate_decls (current_function_decl, 1); |
| |
| /* Initialize recognition, indicating that volatile is OK. */ |
| init_recog (); |
| |
| /* Scan through all the insns, instantiating every virtual register still |
| present. */ |
| for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) |
| if (GET_CODE (insn) == INSN || GET_CODE (insn) == JUMP_INSN |
| || GET_CODE (insn) == CALL_INSN) |
| { |
| instantiate_virtual_regs_1 (&PATTERN (insn), insn, 1); |
| if (INSN_DELETED_P (insn)) |
| continue; |
| instantiate_virtual_regs_1 (®_NOTES (insn), NULL_RTX, 0); |
| /* Instantiate any virtual registers in CALL_INSN_FUNCTION_USAGE. */ |
| if (GET_CODE (insn) == CALL_INSN) |
| instantiate_virtual_regs_1 (&CALL_INSN_FUNCTION_USAGE (insn), |
| NULL_RTX, 0); |
| |
| /* Past this point all ASM statements should match. Verify that |
| to avoid failures later in the compilation process. */ |
| if (asm_noperands (PATTERN (insn)) >= 0 |
| && ! check_asm_operands (PATTERN (insn))) |
| instantiate_virtual_regs_lossage (insn); |
| } |
| |
| /* Now instantiate the remaining register equivalences for debugging info. |
| These will not be valid addresses. */ |
| instantiate_decls (current_function_decl, 0); |
| |
| /* Indicate that, from now on, assign_stack_local should use |
| frame_pointer_rtx. */ |
| virtuals_instantiated = 1; |
| } |
| |
| /* Scan all decls in FNDECL (both variables and parameters) and instantiate |
| all virtual registers in their DECL_RTL's. |
| |
| If VALID_ONLY, do this only if the resulting address is still valid. |
| Otherwise, always do it. */ |
| |
| static void |
| instantiate_decls (tree fndecl, int valid_only) |
| { |
| tree decl; |
| |
| /* Process all parameters of the function. */ |
| for (decl = DECL_ARGUMENTS (fndecl); decl; decl = TREE_CHAIN (decl)) |
| { |
| HOST_WIDE_INT size = int_size_in_bytes (TREE_TYPE (decl)); |
| HOST_WIDE_INT size_rtl; |
| |
| instantiate_decl (DECL_RTL (decl), size, valid_only); |
| |
| /* If the parameter was promoted, then the incoming RTL mode may be |
| larger than the declared type size. We must use the larger of |
| the two sizes. */ |
| size_rtl = GET_MODE_SIZE (GET_MODE (DECL_INCOMING_RTL (decl))); |
| size = MAX (size_rtl, size); |
| instantiate_decl (DECL_INCOMING_RTL (decl), size, valid_only); |
| } |
| |
| /* Now process all variables defined in the function or its subblocks. */ |
| instantiate_decls_1 (DECL_INITIAL (fndecl), valid_only); |
| } |
| |
| /* Subroutine of instantiate_decls: Process all decls in the given |
| BLOCK node and all its subblocks. */ |
| |
| static void |
| instantiate_decls_1 (tree let, int valid_only) |
| { |
| tree t; |
| |
| for (t = BLOCK_VARS (let); t; t = TREE_CHAIN (t)) |
| if (DECL_RTL_SET_P (t)) |
| instantiate_decl (DECL_RTL (t), |
| int_size_in_bytes (TREE_TYPE (t)), |
| valid_only); |
| |
| /* Process all subblocks. */ |
| for (t = BLOCK_SUBBLOCKS (let); t; t = TREE_CHAIN (t)) |
| instantiate_decls_1 (t, valid_only); |
| } |
| |
| /* Subroutine of the preceding procedures: Given RTL representing a |
| decl and the size of the object, do any instantiation required. |
| |
| If VALID_ONLY is nonzero, it means that the RTL should only be |
| changed if the new address is valid. */ |
| |
| static void |
| instantiate_decl (rtx x, HOST_WIDE_INT size, int valid_only) |
| { |
| enum machine_mode mode; |
| rtx addr; |
| |
| if (x == 0) |
| return; |
| |
| /* If this is a CONCAT, recurse for the pieces. */ |
| if (GET_CODE (x) == CONCAT) |
| { |
| instantiate_decl (XEXP (x, 0), size / 2, valid_only); |
| instantiate_decl (XEXP (x, 1), size / 2, valid_only); |
| return; |
| } |
| |
| /* If this is not a MEM, no need to do anything. Similarly if the |
| address is a constant or a register that is not a virtual register. */ |
| if (!MEM_P (x)) |
| return; |
| |
| addr = XEXP (x, 0); |
| if (CONSTANT_P (addr) |
| || (REG_P (addr) |
| && (REGNO (addr) < FIRST_VIRTUAL_REGISTER |
| || REGNO (addr) > LAST_VIRTUAL_REGISTER))) |
| return; |
| |
| /* If we should only do this if the address is valid, copy the address. |
| We need to do this so we can undo any changes that might make the |
| address invalid. This copy is unfortunate, but probably can't be |
| avoided. */ |
| |
| if (valid_only) |
| addr = copy_rtx (addr); |
| |
| instantiate_virtual_regs_1 (&addr, NULL_RTX, 0); |
| |
| if (valid_only && size >= 0) |
| { |
| unsigned HOST_WIDE_INT decl_size = size; |
| |
| /* Now verify that the resulting address is valid for every integer or |
| floating-point mode up to and including SIZE bytes long. We do this |
| since the object might be accessed in any mode and frame addresses |
| are shared. */ |
| |
| for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); |
| mode != VOIDmode && GET_MODE_SIZE (mode) <= decl_size; |
| mode = GET_MODE_WIDER_MODE (mode)) |
| if (! memory_address_p (mode, addr)) |
| return; |
| |
| for (mode = GET_CLASS_NARROWEST_MODE (MODE_FLOAT); |
| mode != VOIDmode && GET_MODE_SIZE (mode) <= decl_size; |
| mode = GET_MODE_WIDER_MODE (mode)) |
| if (! memory_address_p (mode, addr)) |
| return; |
| } |
| |
| /* Put back the address now that we have updated it and we either know |
| it is valid or we don't care whether it is valid. */ |
| |
| XEXP (x, 0) = addr; |
| } |
| |
| /* Given a piece of RTX and a pointer to a HOST_WIDE_INT, if the RTX |
| is a virtual register, return the equivalent hard register and set the |
| offset indirectly through the pointer. Otherwise, return 0. */ |
| |
| static rtx |
| instantiate_new_reg (rtx x, HOST_WIDE_INT *poffset) |
| { |
| rtx new; |
| HOST_WIDE_INT offset; |
| |
| if (x == virtual_incoming_args_rtx) |
| new = arg_pointer_rtx, offset = in_arg_offset; |
| else if (x == virtual_stack_vars_rtx) |
| new = frame_pointer_rtx, offset = var_offset; |
| else if (x == virtual_stack_dynamic_rtx) |
| new = stack_pointer_rtx, offset = dynamic_offset; |
| else if (x == virtual_outgoing_args_rtx) |
| new = stack_pointer_rtx, offset = out_arg_offset; |
| else if (x == virtual_cfa_rtx) |
| new = arg_pointer_rtx, offset = cfa_offset; |
| else |
| return 0; |
| |
| *poffset = offset; |
| return new; |
| } |
| |
| |
| /* Called when instantiate_virtual_regs has failed to update the instruction. |
| Usually this means that non-matching instruction has been emit, however for |
| asm statements it may be the problem in the constraints. */ |
| static void |
| instantiate_virtual_regs_lossage (rtx insn) |
| { |
| gcc_assert (asm_noperands (PATTERN (insn)) >= 0); |
| error_for_asm (insn, "impossible constraint in %<asm%>"); |
| delete_insn (insn); |
| } |
/* Given a pointer to a piece of rtx and an optional pointer to the
   containing object, instantiate any virtual registers present in it.

   LOC points at the rtx to process.  OBJECT is what gets passed to
   validate_change when a replacement is attempted and is the insn before
   which any extra insns are emitted; it may be null.

   If EXTRA_INSNS is nonzero, we always do the replacement and generate
   any extra insns before OBJECT.  If it is zero, we do nothing if
   replacement is not valid.

   Return 1 if we either had nothing to do or if we were able to do the
   needed replacement.  Return 0 otherwise; we only return zero if
   EXTRA_INSNS is zero.

   We first try some simple transformations to avoid the creation of extra
   pseudos.  */

static int
instantiate_virtual_regs_1 (rtx *loc, rtx object, int extra_insns)
{
  rtx x;
  RTX_CODE code;
  rtx new = 0;
  HOST_WIDE_INT offset = 0;
  rtx temp;
  rtx seq;
  int i, j;
  const char *fmt;

  /* Re-start here to avoid recursion in common cases.  Callers of the
     label set LOC to the next sub-rtx to process and jump back.  */
 restart:

  x = *loc;
  if (x == 0)
    return 1;

  /* We may have detected and deleted invalid asm statements.  */
  if (object && INSN_P (object) && INSN_DELETED_P (object))
    return 1;

  code = GET_CODE (x);

  /* Check for some special cases.  */
  switch (code)
    {
    /* These codes are returned as-is; nothing inside them is
       examined.  */
    case CONST_INT:
    case CONST_DOUBLE:
    case CONST_VECTOR:
    case CONST:
    case SYMBOL_REF:
    case CODE_LABEL:
    case PC:
    case CC0:
    case ASM_INPUT:
    case ADDR_VEC:
    case ADDR_DIFF_VEC:
    case RETURN:
      return 1;

    case SET:
      /* We are allowed to set the virtual registers.  This means that
         the actual register should receive the source minus the
         appropriate offset.  This is used, for example, in the handling
         of non-local gotos.  */
      if ((new = instantiate_new_reg (SET_DEST (x), &offset)) != 0)
        {
          rtx src = SET_SRC (x);

          /* We are setting the register, not using it, so the relevant
             offset is the negative of the offset to use were we using
             the register.  */
          offset = - offset;
          instantiate_virtual_regs_1 (&src, NULL_RTX, 0);

          /* The only valid sources here are PLUS or REG.  Just do
             the simplest possible thing to handle them.  */
          if (!REG_P (src) && GET_CODE (src) != PLUS)
            {
              instantiate_virtual_regs_lossage (object);
              return 1;
            }

          /* Compute SRC + OFFSET in a separate sequence, which is then
             emitted in front of OBJECT.  */
          start_sequence ();
          if (!REG_P (src))
            temp = force_operand (src, NULL_RTX);
          else
            temp = src;
          temp = force_operand (plus_constant (temp, offset), NULL_RTX);
          seq = get_insns ();
          end_sequence ();

          emit_insn_before (seq, object);
          SET_DEST (x) = new;

          if (! validate_change (object, &SET_SRC (x), temp, 0)
              || ! extra_insns)
            instantiate_virtual_regs_lossage (object);

          return 1;
        }

      /* Ordinary SET: handle the destination recursively, then loop on
         the source.  */
      instantiate_virtual_regs_1 (&SET_DEST (x), object, extra_insns);
      loc = &SET_SRC (x);
      goto restart;

    case PLUS:
      /* Handle special case of virtual register plus constant.  */
      if (CONSTANT_P (XEXP (x, 1)))
        {
          rtx old, new_offset;

          /* Check for (plus (plus VIRT foo) (const_int)) first.  */
          if (GET_CODE (XEXP (x, 0)) == PLUS)
            {
              if ((new = instantiate_new_reg (XEXP (XEXP (x, 0), 0), &offset)))
                {
                  instantiate_virtual_regs_1 (&XEXP (XEXP (x, 0), 1), object,
                                              extra_insns);
                  new = gen_rtx_PLUS (Pmode, new, XEXP (XEXP (x, 0), 1));
                }
              else
                {
                  loc = &XEXP (x, 0);
                  goto restart;
                }
            }

#ifdef POINTERS_EXTEND_UNSIGNED
          /* If we have (plus (subreg (virtual-reg)) (const_int)), we know
             we can commute the PLUS and SUBREG because pointers into the
             frame are well-behaved.  */
          else if (GET_CODE (XEXP (x, 0)) == SUBREG && GET_MODE (x) == ptr_mode
                   && GET_CODE (XEXP (x, 1)) == CONST_INT
                   && 0 != (new
                            = instantiate_new_reg (SUBREG_REG (XEXP (x, 0)),
                                                   &offset))
                   && validate_change (object, loc,
                                       plus_constant (gen_lowpart (ptr_mode,
                                                                   new),
                                                      offset
                                                      + INTVAL (XEXP (x, 1))),
                                       0))
            return 1;
#endif
          else if ((new = instantiate_new_reg (XEXP (x, 0), &offset)) == 0)
            {
              /* We know the second operand is a constant.  Unless the
                 first operand is a REG (which has been already checked),
                 it needs to be checked.  */
              if (!REG_P (XEXP (x, 0)))
                {
                  loc = &XEXP (x, 0);
                  goto restart;
                }
              return 1;
            }

          /* Fold the virtual register's offset into the constant
             operand.  */
          new_offset = plus_constant (XEXP (x, 1), offset);

          /* If the new constant is zero, try to replace the sum with just
             the register.  */
          if (new_offset == const0_rtx
              && validate_change (object, loc, new, 0))
            return 1;

          /* Next try to replace the register and new offset.
             There are two changes to validate here and we can't assume that
             in the case of old offset equals new just changing the register
             will yield a valid insn.  In the interests of a little efficiency,
             however, we only call validate change once (we don't queue up the
             changes and then call apply_change_group).  */

          old = XEXP (x, 0);
          if (offset == 0
              ? ! validate_change (object, &XEXP (x, 0), new, 0)
              : (XEXP (x, 0) = new,
                 ! validate_change (object, &XEXP (x, 1), new_offset, 0)))
            {
              if (! extra_insns)
                {
                  /* Undo the direct store of NEW made above and report
                     failure.  */
                  XEXP (x, 0) = old;
                  return 0;
                }

              /* Otherwise copy the new constant into a register and replace
                 constant with that register.  */
              temp = gen_reg_rtx (Pmode);
              XEXP (x, 0) = new;
              if (validate_change (object, &XEXP (x, 1), temp, 0))
                emit_insn_before (gen_move_insn (temp, new_offset), object);
              else
                {
                  /* If that didn't work, replace this expression with a
                     register containing the sum.  */

                  XEXP (x, 0) = old;
                  new = gen_rtx_PLUS (Pmode, new, new_offset);

                  start_sequence ();
                  temp = force_operand (new, NULL_RTX);
                  seq = get_insns ();
                  end_sequence ();

                  emit_insn_before (seq, object);
                  if (! validate_change (object, loc, temp, 0)
                      && ! validate_replace_rtx (x, temp, object))
                    {
                      instantiate_virtual_regs_lossage (object);
                      return 1;
                    }
                }
            }

          return 1;
        }

      /* Fall through to generic two-operand expression case.  */
    case EXPR_LIST:
    case CALL:
    case COMPARE:
    case MINUS:
    case MULT:
    case DIV:      case UDIV:
    case MOD:      case UMOD:
    case AND:      case IOR:      case XOR:
    case ROTATERT: case ROTATE:
    case ASHIFTRT: case LSHIFTRT: case ASHIFT:
    case NE:       case EQ:
    case GE:       case GT:       case GEU:    case GTU:
    case LE:       case LT:       case LEU:    case LTU:
      /* Recurse on operand 1 unless it is absent or constant, then loop
         on operand 0.  */
      if (XEXP (x, 1) && ! CONSTANT_P (XEXP (x, 1)))
        instantiate_virtual_regs_1 (&XEXP (x, 1), object, extra_insns);
      loc = &XEXP (x, 0);
      goto restart;

    case MEM:
      /* Most cases of MEM that convert to valid addresses have already been
         handled by our scan of decls.  The only special handling we
         need here is to make a copy of the rtx to ensure it isn't being
         shared if we have to change it to a pseudo.

         If the rtx is a simple reference to an address via a virtual register,
         it can potentially be shared.  In such cases, first try to make it
         a valid address, which can also be shared.  Otherwise, copy it and
         proceed normally.

         First check for common cases that need no processing.  These are
         usually due to instantiation already being done on a previous instance
         of a shared rtx.  */

      temp = XEXP (x, 0);
      if (CONSTANT_ADDRESS_P (temp)
#if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
          || temp == arg_pointer_rtx
#endif
#if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
          || temp == hard_frame_pointer_rtx
#endif
          || temp == frame_pointer_rtx)
        return 1;

      if (GET_CODE (temp) == PLUS
          && CONSTANT_ADDRESS_P (XEXP (temp, 1))
          && (XEXP (temp, 0) == frame_pointer_rtx
#if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
              || XEXP (temp, 0) == hard_frame_pointer_rtx
#endif
#if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
              || XEXP (temp, 0) == arg_pointer_rtx
#endif
              ))
        return 1;

      if (temp == virtual_stack_vars_rtx
          || temp == virtual_incoming_args_rtx
          || (GET_CODE (temp) == PLUS
              && CONSTANT_ADDRESS_P (XEXP (temp, 1))
              && (XEXP (temp, 0) == virtual_stack_vars_rtx
                  || XEXP (temp, 0) == virtual_incoming_args_rtx)))
        {
          /* This MEM may be shared.  If the substitution can be done without
             the need to generate new pseudos, we want to do it in place
             so all copies of the shared rtx benefit.  The call below will
             only make substitutions if the resulting address is still
             valid.

             Note that we cannot pass X as the object in the recursive call
             since the insn being processed may not allow all valid
             addresses.  However, if we were not passed an object, we can
             only modify X without copying it if X will have a valid
             address.

             ??? Also note that this can still lose if OBJECT is an insn that
             has fewer restrictions on an address than some other insn.
             In that case, we will modify the shared address.  This case
             doesn't seem very likely, though.  One case where this could
             happen is in the case of a USE or CLOBBER reference, but we
             take care of that below.  */

          if (instantiate_virtual_regs_1 (&XEXP (x, 0),
                                          object ? object : x, 0))
            return 1;

          /* Otherwise make a copy and process that copy.  We copy the entire
             RTL expression since it might be a PLUS which could also be
             shared.  */
          *loc = x = copy_rtx (x);
        }

      /* Fall through to generic unary operation case.  */
    case PREFETCH:
    case SUBREG:
    case STRICT_LOW_PART:
    case NEG:          case NOT:
    case PRE_DEC:      case PRE_INC:      case POST_DEC:    case POST_INC:
    case SIGN_EXTEND:  case ZERO_EXTEND:
    case TRUNCATE:     case FLOAT_EXTEND: case FLOAT_TRUNCATE:
    case FLOAT:        case FIX:
    case UNSIGNED_FIX: case UNSIGNED_FLOAT:
    case ABS:
    case SQRT:
    case FFS:
    case CLZ:          case CTZ:
    case POPCOUNT:     case PARITY:
      /* These cases either have just one operand or we know that we need
         not check the rest of the operands.  */
      loc = &XEXP (x, 0);
      goto restart;

    case USE:
    case CLOBBER:
      /* If the operand is a MEM, see if the change is a valid MEM.  If not,
         go ahead and make the invalid one, but do it to a copy.  For a REG,
         just make the recursive call, since there's no chance of a problem.  */

      if ((MEM_P (XEXP (x, 0))
           && instantiate_virtual_regs_1 (&XEXP (XEXP (x, 0), 0), XEXP (x, 0),
                                          0))
          || (REG_P (XEXP (x, 0))
              && instantiate_virtual_regs_1 (&XEXP (x, 0), object, 0)))
        return 1;

      XEXP (x, 0) = copy_rtx (XEXP (x, 0));
      loc = &XEXP (x, 0);
      goto restart;

    case REG:
      /* Try to replace with a PLUS.  If that doesn't work, compute the sum
         in front of this insn and substitute the temporary.  */
      if ((new = instantiate_new_reg (x, &offset)) != 0)
        {
          temp = plus_constant (new, offset);
          if (!validate_change (object, loc, temp, 0))
            {
              if (! extra_insns)
                return 0;

              start_sequence ();
              temp = force_operand (temp, NULL_RTX);
              seq = get_insns ();
              end_sequence ();

              emit_insn_before (seq, object);
              if (! validate_change (object, loc, temp, 0)
                  && ! validate_replace_rtx (x, temp, object))
                instantiate_virtual_regs_lossage (object);
            }
        }

      return 1;

    default:
      break;
    }

  /* Scan all subexpressions.  Operands with format 'e' are single
     expressions and those with format 'E' are vectors of expressions;
     the scan stops at the first one that reports failure.  */
  fmt = GET_RTX_FORMAT (code);
  for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
    if (*fmt == 'e')
      {
        if (!instantiate_virtual_regs_1 (&XEXP (x, i), object, extra_insns))
          return 0;
      }
    else if (*fmt == 'E')
      for (j = 0; j < XVECLEN (x, i); j++)
        if (! instantiate_virtual_regs_1 (&XVECEXP (x, i, j), object,
                                          extra_insns))
          return 0;

  return 1;
}
| |
| /* Return 1 if EXP is an aggregate type (or a value with aggregate type). |
| This means a type for which function calls must pass an address to the |
| function or get an address back from the function. |
| EXP may be a type node or an expression (whose type is tested). */ |
| |
| int |
| aggregate_value_p (tree exp, tree fntype) |
| { |
| int i, regno, nregs; |
| rtx reg; |
| |
| tree type = (TYPE_P (exp)) ? exp : TREE_TYPE (exp); |
| |
| if (fntype) |
| switch (TREE_CODE (fntype)) |
| { |
| case CALL_EXPR: |
| fntype = get_callee_fndecl (fntype); |
| fntype = fntype ? TREE_TYPE (fntype) : 0; |
| break; |
| case FUNCTION_DECL: |
| fntype = TREE_TYPE (fntype); |
| break; |
| case FUNCTION_TYPE: |
| case METHOD_TYPE: |
| break; |
| case IDENTIFIER_NODE: |
| fntype = 0; |
| break; |
| default: |
| /* We don't expect other rtl types here. */ |
| gcc_unreachable (); |
| } |
| |
| if (TREE_CODE (type) == VOID_TYPE) |
| return 0; |
| /* If the front end has decided that this needs to be passed by |
| reference, do so. */ |
| if ((TREE_CODE (exp) == PARM_DECL || TREE_CODE (exp) == RESULT_DECL) |
| && DECL_BY_REFERENCE (exp)) |
| return 1; |
| if (targetm.calls.return_in_memory (type, fntype)) |
| return 1; |
| /* Types that are TREE_ADDRESSABLE must be constructed in memory, |
| and thus can't be returned in registers. */ |
| if (TREE_ADDRESSABLE (type)) |
| return 1; |
| if (flag_pcc_struct_return && AGGREGATE_TYPE_P (type)) |
| return 1; |
| /* Make sure we have suitable call-clobbered regs to return |
| the value in; if not, we must return it in memory. */ |
| reg = hard_function_value (type, 0, 0); |
| |
| /* If we have something other than a REG (e.g. a PARALLEL), then assume |
| it is OK. */ |
| if (!REG_P (reg)) |
| return 0; |
| |
| regno = REGNO (reg); |
| nregs = hard_regno_nregs[regno][TYPE_MODE (type)]; |
| for (i = 0; i < nregs; i++) |
| if (! call_used_regs[regno + i]) |
| return 1; |
| return 0; |
| } |
| |
| /* Return true if we should assign DECL a pseudo register; false if it |
| should live on the local stack. */ |
| |
| bool |
| use_register_for_decl (tree decl) |
| { |
| /* Honor volatile. */ |
| if (TREE_SIDE_EFFECTS (decl)) |
| return false; |
| |
| /* Honor addressability. */ |
| if (TREE_ADDRESSABLE (decl)) |
| return false; |
| |
| /* Only register-like things go in registers. */ |
| if (DECL_MODE (decl) == BLKmode) |
| return false; |
| |
| /* If -ffloat-store specified, don't put explicit float variables |
| into registers. */ |
| /* ??? This should be checked after DECL_ARTIFICIAL, but tree-ssa |
| propagates values across these stores, and it probably shouldn't. */ |
| if (flag_float_store && FLOAT_TYPE_P (TREE_TYPE (decl))) |
| return false; |
| |
| /* If we're not interested in tracking debugging information for |
| this decl, then we can certainly put it in a register. */ |
| if (DECL_IGNORED_P (decl)) |
| return true; |
| |
| return (optimize || DECL_REGISTER (decl)); |
| } |
| |
| /* Return true if TYPE should be passed by invisible reference. */ |
| |
| bool |
| pass_by_reference (CUMULATIVE_ARGS *ca, enum machine_mode mode, |
| tree type, bool named_arg) |
| { |
| if (type) |
| { |
| /* If this type contains non-trivial constructors, then it is |
| forbidden for the middle-end to create any new copies. */ |
| if (TREE_ADDRESSABLE (type)) |
| return true; |
| |
| /* GCC post 3.4 passes *all* variable sized types by reference. */ |
| if (!TYPE_SIZE (type) || TREE_CODE (TYPE_SIZE (type)) != INTEGER_CST) |
| return true; |
| } |
| |
| return targetm.calls.pass_by_reference (ca, mode, type, named_arg); |
| } |
| |
| /* Return true if TYPE, which is passed by reference, should be callee |
| copied instead of caller copied. */ |
| |
| bool |
| reference_callee_copied (CUMULATIVE_ARGS *ca, enum machine_mode mode, |
| tree type, bool named_arg) |
| { |
| if (type && TREE_ADDRESSABLE (type)) |
| return false; |
| return targetm.calls.callee_copies (ca, mode, type, named_arg); |
| } |
| |
/* Structures to communicate between the subroutines of assign_parms.
   The first holds data persistent across all parameters, the second
   is cleared out for each parameter.  */

/* Data persistent across all parameters.  The whole structure is zeroed
   by assign_parms_initialize_all before the fields noted below are set.  */
struct assign_parm_data_all
{
  /* Initialized by assign_parms_initialize_all with
     INIT_CUMULATIVE_INCOMING_ARGS or INIT_CUMULATIVE_ARGS.  */
  CUMULATIVE_ARGS args_so_far;
  struct args_size stack_args_size;
  tree function_result_decl;
  tree orig_fnargs;
  rtx conversion_insns;
  HOST_WIDE_INT pretend_args_size;
  HOST_WIDE_INT extra_pretend_bytes;
  /* Set to REG_PARM_STACK_SPACE (current_function_decl) when that macro
     is defined; otherwise left at zero.  */
  int reg_parm_stack_space;
};
| |
/* Per-parameter data for the subroutines of assign_parms; cleared out for
   each parameter.  */
struct assign_parm_data_one
{
  tree nominal_type;
  tree passed_type;
  rtx entry_parm;
  rtx stack_parm;
  enum machine_mode nominal_mode;
  enum machine_mode passed_mode;
  enum machine_mode promoted_mode;
  struct locate_and_pad_arg_data locate;
  int partial;
  /* One-bit flags.  */
  BOOL_BITFIELD named_arg : 1;
  BOOL_BITFIELD passed_pointer : 1;
  BOOL_BITFIELD on_stack : 1;
  BOOL_BITFIELD loaded_in_reg : 1;
};
| |
| /* A subroutine of assign_parms. Initialize ALL. */ |
| |
| static void |
| assign_parms_initialize_all (struct assign_parm_data_all *all) |
| { |
| tree fntype; |
| |
| memset (all, 0, sizeof (*all)); |
| |
| fntype = TREE_TYPE (current_function_decl); |
| |
| #ifdef INIT_CUMULATIVE_INCOMING_ARGS |
| INIT_CUMULATIVE_INCOMING_ARGS (all->args_so_far, fntype, NULL_RTX); |
| #else |
| INIT_CUMULATIVE_ARGS (all->args_so_far, fntype, NULL_RTX, |
| current_function_decl, -1); |
| #endif |
| |
| #ifdef REG_PARM_STACK_SPACE |
| all->reg_parm_stack_space = REG_PARM_STACK_SPACE (current_function_decl); |
| #endif |
| } |
| |
| /* If ARGS contains entries with complex types, split the entry into two |
| entries of the component type. Return a new list of substitutions are |
| needed, else the old list. */ |
| |
| static tree |
| split_complex_args (tree args) |
| { |
| tree p; |
| |
| /* Before allocating memory, check for the common case of no complex. */ |
| for (p = args; p; p = TREE_CHAIN (p)) |
| { |
| tree type = TREE_TYPE (p); |
| if (TREE_CODE (type) == COMPLEX_TYPE |
| && targetm.calls.split_complex_arg (type)) |
| goto found; |
| } |
| return args; |
| |
| found: |
| args = copy_list (args); |
| |
| for (p = args; p; p = TREE_CHAIN (p)) |
| { |
| tree type = TREE_TYPE (p); |
| if (TREE_CODE (type) == COMPLEX_TYPE |
| && targetm.calls.split_complex_arg (type)) |
| { |
| tree decl; |
| tree subtype = TREE_TYPE (type); |
| bool addressable = TREE_ADDRESSABLE (p); |
| |
| /* Rewrite the PARM_DECL's type with its component. */ |
| TREE_TYPE (p) = subtype; |
| DECL_ARG_TYPE (p) = TREE_TYPE (DECL_ARG_TYPE (p)); |
| DECL_MODE (p) = VOIDmode; |
| DECL_SIZE (p) = NULL; |
| DECL_SIZE_UNIT (p) = NULL; |
| /* If this arg must go in memory, put it in a pseudo here. |
| We can't allow it to go in memory as per normal parms, |
| because the usual place might not have the imag part |
| adjacent to the real part. */ |
| DECL_ARTIFICIAL (p) = addressable; |
| DECL_IGNORED_P (p) = addressable; |
| TREE_ADDRESSABLE (p) = 0; |
| layout_decl (p, 0); |
| |
| /* Build a second synthetic decl. */ |
| decl = build_decl (PARM_DECL, NULL_TREE, subtype); |
| DECL_ARG_TYPE (decl) = DECL_ARG_TYPE (p); |
| DECL_ARTIFICIAL (decl) = addressable; |
| DECL_IGNORED_P (decl) = addressable; |
| layout_decl (decl, 0); |
| |
| /* Splice it in; skip the new decl. */ |
| TREE_CHAIN (decl) = TREE_CHAIN (p); |
| TREE_CHAIN (p) = decl; |
| p = decl; |
| } |
| } |
| |
| return args; |
| } |
| |
| /* A subroutine of assign_parms. Adjust the parameter list to incorporate |
| the hidden struct return argument, and (abi willing) complex args. |
| Return the new parameter list. */ |
| |
| static tree |
| assign_parms_augmented_arg_list (struct assign_parm_data_all *all) |
| { |
| tree fndecl = current_function_decl; |
| tree fntype = TREE_TYPE (fndecl); |
| tree fnargs = DECL_ARGUMENTS (fndecl); |
| |
| /* If struct value address is treated as the first argument, make it so. */ |
| if (aggregate_value_p (DECL_RESULT (fndecl), fndecl) |
| && ! current_function_returns_pcc_struct |
| && targetm.calls.struct_value_rtx (TREE_TYPE (fndecl), 1) == 0) |
| { |
| tree type = build_pointer_type (TREE_TYPE (fntype)); |
| tree decl; |
| |
| decl = build_decl (PARM_DECL, NULL_TREE, type); |
| DECL_ARG_TYPE (decl) = type; |
| DECL_ARTIFICIAL (decl) = 1; |
| DECL_IGNORED_P (decl) = 1; |
| |
| TREE_CHAIN (decl) = fnargs; |
| fnargs = decl; |
| all->function_result_decl = decl; |
| } |
| |
| all->orig_fnargs = fnargs; |
| |
| /* If the target wants to split complex arguments into scalars, do so. */ |
| if (targetm.calls.split_complex_arg) |
| fnargs = split_complex_args (fnargs); |
| |
| return fnargs; |
| } |
| |
| /* A subroutine of assign_parms. Examine PARM and pull out type and mode |
| data for the parameter. Incorporate ABI specifics such as pass-by- |
| reference and type promotion. */ |
| |
| static void |
| assign_parm_find_data_types (struct assign_parm_data_all *all, tree parm, |
| struct assign_parm_data_one *data) |
| { |
| tree nominal_type, passed_type; |
| enum machine_mode nominal_mode, passed_mode, promoted_mode; |
| |
| memset (data, 0, sizeof (*data)); |
| |
| /* NAMED_ARG is a mis-nomer. We really mean 'non-varadic'. */ |
| if (!current_function_stdarg) |
| data->named_arg = 1; /* No varadic parms. */ |
| else if (TREE_CHAIN (parm)) |
| data->named_arg = 1; /* Not the last non-varadic parm. */ |
| else if (targetm.calls.strict_argument_naming (&all->args_so_far)) |
| data->named_arg = 1; /* Only varadic ones are unnamed. */ |
| else |
| data->named_arg = 0; /* Treat as varadic. */ |
| |
| nominal_type = TREE_TYPE (parm); |
| passed_type = DECL_ARG_TYPE (parm); |
| |
| /* Look out for errors propagating this far. Also, if the parameter's |
| type is void then its value doesn't matter. */ |
| if (TREE_TYPE (parm) == error_mark_node |
| /* This can happen after weird syntax errors |
| or if an enum type is defined among the parms. */ |
| || TREE_CODE (parm) != PARM_DECL |
| || passed_type == NULL |
| || VOID_TYPE_P (nominal_type)) |
| { |
| nominal_type = passed_type = void_type_node; |
| nominal_mode = passed_mode = promoted_mode = VOIDmode; |
| goto egress; |
| } |
| |
| /* Find mode of arg as it is passed, and mode of arg as it should be |
| during execution of this function. */ |
| passed_mode = TYPE_MODE (passed_type); |
| nominal_mode = TYPE_MODE (nominal_type); |
| |
| /* If the parm is to be passed as a transparent union, use the type of |
| the first field for the tests below. We have already verified that |
| the modes are the same. */ |
| if (DECL_TRANSPARENT_UNION (parm) |
| || (TREE_CODE (passed_type) == UNION_TYPE |
| && TYPE_TRANSPARENT_UNION (passed_type))) |
| passed_type = TREE_TYPE (TYPE_FIELDS (passed_type)); |
| |
| /* See if this arg was passed by invisible reference. */ |
| if (pass_by_reference (&all->args_so_far, passed_mode, |
| passed_type, data->named_arg)) |
| { |
| passed_type = nominal_type = build_pointer_type (passed_type); |
| data->passed_pointer = true; |
| passed_mode = nominal_mode = Pmode; |
| } |
| |
| /* Find mode as it is passed by the ABI. */ |
| promoted_mode = passed_mode; |
| if (targetm.calls.promote_function_args (TREE_TYPE (current_function_decl))) |
| { |
| int unsignedp = TYPE_UNSIGNED (passed_type); |
| promoted_mode = promote_mode (passed_type, promoted_mode, |
| &unsignedp, 1); |
| } |
| |
| egress: |
| data->nominal_type = nominal_type; |
| data->passed_type = passed_type; |
| data->nominal_mode = nominal_mode; |
| data->passed_mode = passed_mode; |
| data->promoted_mode = promoted_mode; |
| } |
| |
| /* A subroutine of assign_parms. Invoke setup_incoming_varargs. */ |
| |
| static void |
| assign_parms_setup_varargs (struct assign_parm_data_all *all, |
| struct assign_parm_data_one *data, bool no_rtl) |
| { |
| int varargs_pretend_bytes = 0; |
| |
| targetm.calls.setup_incoming_varargs (&all->args_so_far, |
| data->promoted_mode, |
| data->passed_type, |
| &varargs_pretend_bytes, no_rtl); |
| |
| /* If the back-end has requested extra stack space, record how much is |
| needed. Do not change pretend_args_size otherwise since it may be |
| nonzero from an earlier partial argument. */ |
| if (varargs_pretend_bytes > 0) |
| all->pretend_args_size = varargs_pretend_bytes; |
| } |
| |
| /* A subroutine of assign_parms. Set DATA->ENTRY_PARM corresponding to |
| the incoming location of the current parameter. */ |
| |
| static void |
| assign_parm_find_entry_rtl (struct assign_parm_data_all *all, |
| struct assign_parm_data_one *data) |
| { |
| HOST_WIDE_INT pretend_bytes = 0; |
| rtx entry_parm; |
| bool in_regs; |
| |
| if (data->promoted_mode == VOIDmode) |
| { |
| data->entry_parm = data->stack_parm = const0_rtx; |
| return; |
| } |
| |
| #ifdef FUNCTION_INCOMING_ARG |
| entry_parm = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode, |
| data->passed_type, data->named_arg); |
| #else |
| entry_parm = FUNCTION_ARG (all->args_so_far, data->promoted_mode, |
| data->passed_type, data->named_arg); |
| #endif |
| |
| if (entry_parm == 0) |
| data->promoted_mode = data->passed_mode; |
| |
| /* Determine parm's home in the stack, in case it arrives in the stack |
| or we should pretend it did. Compute the stack position and rtx where |
| the argument arrives and its size. |
| |
| There is one complexity here: If this was a parameter that would |
| have been passed in registers, but wasn't only because it is |
| __builtin_va_alist, we want locate_and_pad_parm to treat it as if |
| it came in a register so that REG_PARM_STACK_SPACE isn't skipped. |
| In this case, we call FUNCTION_ARG with NAMED set to 1 instead of 0 |
| as it was the previous time. */ |
| in_regs = entry_parm != 0; |
| #ifdef STACK_PARMS_IN_REG_PARM_AREA |
| in_regs = true; |
| #endif |
| if (!in_regs && !data->named_arg) |
| { |
| if (targetm.calls.pretend_outgoing_varargs_named (&all->args_so_far)) |
| { |
| rtx tem; |
| #ifdef FUNCTION_INCOMING_ARG |
| tem = FUNCTION_INCOMING_ARG (all->args_so_far, data->promoted_mode, |
| data->passed_type, true); |
| #else |
| tem = FUNCTION_ARG (all->args_so_far, data->promoted_mode, |
| data->passed_type, true); |
| #endif |
| in_regs = tem != NULL; |
| } |
| } |
| |
| /* If this parameter was passed both in registers and in the stack, use |
| the copy on the stack. */ |
| if (targetm.calls.must_pass_in_stack (data->promoted_mode, |
| data->passed_type)) |
| entry_parm = 0; |
| |
| if (entry_parm) |
| { |
| int partial; |
| |
| partial = targetm.calls.arg_partial_bytes (&all->args_so_far, |
| data->promoted_mode, |
| data->passed_type, |
| data->named_arg); |
| data->partial = partial; |
| |
| /* The caller might already have allocated stack space for the |
| register parameters. */ |
| if (partial != 0 && all->reg_parm_stack_space == 0) |
| { |
| /* Part of this argument is passed in registers and part |
| is passed on the stack. Ask the prologue code to extend |
| the stack part so that we can recreate the full value. |
| |
| PRETEND_BYTES is the size of the registers we need to store. |
| CURRENT_FUNCTION_PRETEND_ARGS_SIZE is the amount of extra |
| stack space that the prologue should allocate. |
| |
| Internally, gcc assumes that the argument pointer is aligned |
| to STACK_BOUNDARY bits. This is used both for alignment |
| optimizations (see init_emit) and to locate arguments that are |
| aligned to more than PARM_BOUNDARY bits. We must preserve this |
| invariant by rounding CURRENT_FUNCTION_PRETEND_ARGS_SIZE up to |
| a stack boundary. */ |
| |
| /* We assume at most one partial arg, and it must be the first |
| argument on the stack. */ |
| gcc_assert (!all->extra_pretend_bytes && !all->pretend_args_size); |
| |
| pretend_bytes = partial; |
| all->pretend_args_size = CEIL_ROUND (pretend_bytes, STACK_BYTES); |
| |
| /* We want to align relative to the actual stack pointer, so |
| don't include this in the stack size until later. */ |
| all->extra_pretend_bytes = all->pretend_args_size; |
| } |
| } |
| |
| locate_and_pad_parm (data->promoted_mode, data->passed_type, in_regs, |
| entry_parm ? data->partial : 0, current_function_decl, |
| &all->stack_args_size, &data->locate); |
| |
| /* Adjust offsets to include the pretend args. */ |
| pretend_bytes = all->extra_pretend_bytes - pretend_bytes; |
| data->locate.slot_offset.constant += pretend_bytes; |
| data->locate.offset.constant += pretend_bytes; |
| |
| data->entry_parm = entry_parm; |
| } |
| |
| /* A subroutine of assign_parms. If there is actually space on the stack |
| for this parm, count it in stack_args_size and return true. */ |
| |
| static bool |
| assign_parm_is_stack_parm (struct assign_parm_data_all *all, |
| struct assign_parm_data_one *data) |
| { |
| /* Trivially true if we've no incoming register. */ |
| if (data->entry_parm == NULL) |
| ; |
| /* Also true if we're partially in registers and partially not, |
| since we've arranged to drop the entire argument on the stack. */ |
| else if (data->partial != 0) |
| ; |
| /* Also true if the target says that it's passed in both registers |
| and on the stack. */ |
| else if (GET_CODE (data->entry_parm) == PARALLEL |
| && XEXP (XVECEXP (data->entry_parm, 0, 0), 0) == NULL_RTX) |
| ; |
| /* Also true if the target says that there's stack allocated for |
| all register parameters. */ |
| else if (all->reg_parm_stack_space > 0) |
| ; |
| /* Otherwise, no, this parameter has no ABI defined stack slot. */ |
| else |
| return false; |
| |
| all->stack_args_size.constant += data->locate.size.constant; |
| if (data->locate.size.var) |
| ADD_PARM_SIZE (all->stack_args_size, data->locate.size.var); |
| |
| return true; |
| } |
| |
| /* A subroutine of assign_parms. Given that this parameter is allocated |
| stack space by the ABI, find it. */ |
| |
| static void |
| assign_parm_find_stack_rtl (tree parm, struct assign_parm_data_one *data) |
| { |
| rtx offset_rtx, stack_parm; |
| unsigned int align, boundary; |
| |
| /* If we're passing this arg using a reg, make its stack home the |
| aligned stack slot. */ |
| if (data->entry_parm) |
| offset_rtx = ARGS_SIZE_RTX (data->locate.slot_offset); |
| else |
| offset_rtx = ARGS_SIZE_RTX (data->locate.offset); |
| |
| stack_parm = current_function_internal_arg_pointer; |
| if (offset_rtx != const0_rtx) |
| stack_parm = gen_rtx_PLUS (Pmode, stack_parm, offset_rtx); |
| stack_parm = gen_rtx_MEM (data->promoted_mode, stack_parm); |
| |
| set_mem_attributes (stack_parm, parm, 1); |
| |
| boundary = data->locate.boundary; |
| align = BITS_PER_UNIT; |
| |
| /* If we're padding upward, we know that the alignment of the slot |
| is FUNCTION_ARG_BOUNDARY. If we're using slot_offset, we're |
| intentionally forcing upward padding. Otherwise we have to come |
| up with a guess at the alignment based on OFFSET_RTX. */ |
| if (data->locate.where_pad != downward || data->entry_parm) |
| align = boundary; |
| else if (GET_CODE (offset_rtx) == CONST_INT) |
| { |
| align = INTVAL (offset_rtx) * BITS_PER_UNIT | boundary; |
| align = align & -align; |
| } |
| set_mem_align (stack_parm, align); |
| |
| if (data->entry_parm) |
| set_reg_attrs_for_parm (data->entry_parm, stack_parm); |
| |
| data->stack_parm = stack_parm; |
| } |
| |
| /* A subroutine of assign_parms. Adjust DATA->ENTRY_RTL such that it's |
| always valid and contiguous. */ |
| |
| static void |
| assign_parm_adjust_entry_rtl (struct assign_parm_data_one *data) |
| { |
| rtx entry_parm = data->entry_parm; |
| rtx stack_parm = data->stack_parm; |
| |
| /* If this parm was passed part in regs and part in memory, pretend it |
| arrived entirely in memory by pushing the register-part onto the stack. |
| In the special case of a DImode or DFmode that is split, we could put |
| it together in a pseudoreg directly, but for now that's not worth |
| bothering with. */ |
| if (data->partial != 0) |
| { |
| /* Handle calls that pass values in multiple non-contiguous |
| locations. The Irix 6 ABI has examples of this. */ |
| if (GET_CODE (entry_parm) == PARALLEL) |
| emit_group_store (validize_mem (stack_parm), entry_parm, |
| data->passed_type, |
| int_size_in_bytes (data->passed_type)); |
| else |
| { |
| gcc_assert (data->partial % UNITS_PER_WORD == 0); |
| move_block_from_reg (REGNO (entry_parm), validize_mem (stack_parm), |
| data->partial / UNITS_PER_WORD); |
| } |
| |
| entry_parm = stack_parm; |
| } |
| |
| /* If we didn't decide this parm came in a register, by default it came |
| on the stack. */ |
| else if (entry_parm == NULL) |
| entry_parm = stack_parm; |
| |
| /* When an argument is passed in multiple locations, we can't make use |
| of this information, but we can save some copying if the whole argument |
| is passed in a single register. */ |
| else if (GET_CODE (entry_parm) == PARALLEL |
| && data->nominal_mode != BLKmode |
| && data->passed_mode != BLKmode) |
| { |
| size_t i, len = XVECLEN (entry_parm, 0); |
| |
| for (i = 0; i < len; i++) |
| if (XEXP (XVECEXP (entry_parm, 0, i), 0) != NULL_RTX |
| && REG_P (XEXP (XVECEXP (entry_parm, 0, i), 0)) |
| && (GET_MODE (XEXP (XVECEXP (entry_parm, 0, i), 0)) |
| == data->passed_mode) |
| && INTVAL (XEXP (XVECEXP (entry_parm, 0, i), 1)) == 0) |
| { |
| entry_parm = XEXP (XVECEXP (entry_parm, 0, i), 0); |
| break; |
| } |
| } |
| |
| data->entry_parm = entry_parm; |
| } |
| |
| /* A subroutine of assign_parms. Adjust DATA->STACK_RTL such that it's |
| always valid and properly aligned. */ |
| |
| static void |
| assign_parm_adjust_stack_rtl (struct assign_parm_data_one *data) |
| { |
| rtx stack_parm = data->stack_parm; |
| |
| /* If we can't trust the parm stack slot to be aligned enough for its |
| ultimate type, don't use that slot after entry. We'll make another |
| stack slot, if we need one. */ |
| if (stack_parm |
| && ((STRICT_ALIGNMENT |
| && GET_MODE_ALIGNMENT (data->nominal_mode) > MEM_ALIGN (stack_parm)) |
| || (data->nominal_type |
| && TYPE_ALIGN (data->nominal_type) > MEM_ALIGN (stack_parm) |
| && MEM_ALIGN (stack_parm) < PREFERRED_STACK_BOUNDARY))) |
| stack_parm = NULL; |
| |
| /* If parm was passed in memory, and we need to convert it on entry, |
| don't store it back in that same slot. */ |
| else if (data->entry_parm == stack_parm |
| && data->nominal_mode != BLKmode |
| && data->nominal_mode != data->passed_mode) |
| stack_parm = NULL; |
| /* APPLE LOCAL begin mainline */ |
| /* If stack protection is in effect for this function, don't leave any |
| pointers in their passed stack slots. */ |
| else if (cfun->stack_protect_guard |
| && (flag_stack_protect == 2 |
| || data->passed_pointer |
| || POINTER_TYPE_P (data->nominal_type))) |
| stack_parm = NULL; |
| /* APPLE LOCAL end mainline */ |
| |
| data->stack_parm = stack_parm; |
| } |
| |
| /* A subroutine of assign_parms. Return true if the current parameter |
| should be stored as a BLKmode in the current frame. */ |
| |
| static bool |
| assign_parm_setup_block_p (struct assign_parm_data_one *data) |
| { |
| if (data->nominal_mode == BLKmode) |
| return true; |
| if (GET_CODE (data->entry_parm) == PARALLEL) |
| return true; |
| |
| #ifdef BLOCK_REG_PADDING |
| /* Only assign_parm_setup_block knows how to deal with register arguments |
| that are padded at the least significant end. */ |
| if (REG_P (data->entry_parm) |
| && GET_MODE_SIZE (data->promoted_mode) < UNITS_PER_WORD |
| && (BLOCK_REG_PADDING (data->passed_mode, data->passed_type, 1) |
| == (BYTES_BIG_ENDIAN ? upward : downward))) |
| return true; |
| #endif |
| |
| return false; |
| } |
| |
| /* A subroutine of assign_parms. Arrange for the parameter to be |
| present and valid in DATA->STACK_RTL. */ |
| |
| static void |
| assign_parm_setup_block (struct assign_parm_data_all *all, |
| tree parm, struct assign_parm_data_one *data) |
| { |
| rtx entry_parm = data->entry_parm; |
| rtx stack_parm = data->stack_parm; |
| HOST_WIDE_INT size; |
| HOST_WIDE_INT size_stored; |
| rtx orig_entry_parm = entry_parm; |
| |
| if (GET_CODE (entry_parm) == PARALLEL) |
| entry_parm = emit_group_move_into_temps (entry_parm); |
| |
| /* If we've a non-block object that's nevertheless passed in parts, |
| reconstitute it in register operations rather than on the stack. */ |
| if (GET_CODE (entry_parm) == PARALLEL |
| && data->nominal_mode != BLKmode) |
| { |
| rtx elt0 = XEXP (XVECEXP (orig_entry_parm, 0, 0), 0); |
| |
| if ((XVECLEN (entry_parm, 0) > 1 |
| || hard_regno_nregs[REGNO (elt0)][GET_MODE (elt0)] > 1) |
| && use_register_for_decl (parm)) |
| { |
| rtx parmreg = gen_reg_rtx (data->nominal_mode); |
| |
| push_to_sequence (all->conversion_insns); |
| |
| /* For values returned in multiple registers, handle possible |
| incompatible calls to emit_group_store. |
| |
| For example, the following would be invalid, and would have to |
| be fixed by the conditional below: |
| |
| emit_group_store ((reg:SF), (parallel:DF)) |
| emit_group_store ((reg:SI), (parallel:DI)) |
| |
| An example of this are doubles in e500 v2: |
| (parallel:DF (expr_list (reg:SI) (const_int 0)) |
| (expr_list (reg:SI) (const_int 4))). */ |
| if (data->nominal_mode != data->passed_mode) |
| { |
| rtx t = gen_reg_rtx (GET_MODE (entry_parm)); |
| emit_group_store (t, entry_parm, NULL_TREE, |
| GET_MODE_SIZE (GET_MODE (entry_parm))); |
| convert_move (parmreg, t, 0); |
| } |
| else |
| emit_group_store (parmreg, entry_parm, data->nominal_type, |
| int_size_in_bytes (data->nominal_type)); |
| |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| |
| SET_DECL_RTL (parm, parmreg); |
| return; |
| } |
| } |
| |
| size = int_size_in_bytes (data->passed_type); |
| size_stored = CEIL_ROUND (size, UNITS_PER_WORD); |
| if (stack_parm == 0) |
| { |
| DECL_ALIGN (parm) = MAX (DECL_ALIGN (parm), BITS_PER_WORD); |
| stack_parm = assign_stack_local (BLKmode, size_stored, |
| DECL_ALIGN (parm)); |
| if (GET_MODE_SIZE (GET_MODE (entry_parm)) == size) |
| PUT_MODE (stack_parm, GET_MODE (entry_parm)); |
| set_mem_attributes (stack_parm, parm, 1); |
| } |
| |
| /* If a BLKmode arrives in registers, copy it to a stack slot. Handle |
| calls that pass values in multiple non-contiguous locations. */ |
| if (REG_P (entry_parm) || GET_CODE (entry_parm) == PARALLEL) |
| { |
| rtx mem; |
| |
| /* Note that we will be storing an integral number of words. |
| So we have to be careful to ensure that we allocate an |
| integral number of words. We do this above when we call |
| assign_stack_local if space was not allocated in the argument |
| list. If it was, this will not work if PARM_BOUNDARY is not |
| a multiple of BITS_PER_WORD. It isn't clear how to fix this |
| if it becomes a problem. Exception is when BLKmode arrives |
| with arguments not conforming to word_mode. */ |
| |
| if (data->stack_parm == 0) |
| ; |
| else if (GET_CODE (entry_parm) == PARALLEL) |
| ; |
| else |
| gcc_assert (!size || !(PARM_BOUNDARY % BITS_PER_WORD)); |
| |
| mem = validize_mem (stack_parm); |
| |
| /* Handle values in multiple non-contiguous locations. */ |
| if (GET_CODE (entry_parm) == PARALLEL) |
| { |
| push_to_sequence (all->conversion_insns); |
| emit_group_store (mem, entry_parm, data->passed_type, size); |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| } |
| |
| else if (size == 0) |
| ; |
| |
| /* If SIZE is that of a mode no bigger than a word, just use |
| that mode's store operation. */ |
| else if (size <= UNITS_PER_WORD) |
| { |
| enum machine_mode mode |
| = mode_for_size (size * BITS_PER_UNIT, MODE_INT, 0); |
| |
| if (mode != BLKmode |
| #ifdef BLOCK_REG_PADDING |
| && (size == UNITS_PER_WORD |
| || (BLOCK_REG_PADDING (mode, data->passed_type, 1) |
| != (BYTES_BIG_ENDIAN ? upward : downward))) |
| #endif |
| ) |
| { |
| rtx reg = gen_rtx_REG (mode, REGNO (entry_parm)); |
| emit_move_insn (change_address (mem, mode, 0), reg); |
| } |
| |
| /* Blocks smaller than a word on a BYTES_BIG_ENDIAN |
| machine must be aligned to the left before storing |
| to memory. Note that the previous test doesn't |
| handle all cases (e.g. SIZE == 3). */ |
| else if (size != UNITS_PER_WORD |
| #ifdef BLOCK_REG_PADDING |
| && (BLOCK_REG_PADDING (mode, data->passed_type, 1) |
| == downward) |
| #else |
| && BYTES_BIG_ENDIAN |
| #endif |
| ) |
| { |
| rtx tem, x; |
| int by = (UNITS_PER_WORD - size) * BITS_PER_UNIT; |
| rtx reg = gen_rtx_REG (word_mode, REGNO (entry_parm)); |
| |
| x = expand_shift (LSHIFT_EXPR, word_mode, reg, |
| build_int_cst (NULL_TREE, by), |
| NULL_RTX, 1); |
| tem = change_address (mem, word_mode, 0); |
| emit_move_insn (tem, x); |
| } |
| else |
| move_block_from_reg (REGNO (entry_parm), mem, |
| size_stored / UNITS_PER_WORD); |
| } |
| else |
| move_block_from_reg (REGNO (entry_parm), mem, |
| size_stored / UNITS_PER_WORD); |
| } |
| else if (data->stack_parm == 0) |
| { |
| push_to_sequence (all->conversion_insns); |
| emit_block_move (stack_parm, data->entry_parm, GEN_INT (size), |
| BLOCK_OP_NORMAL); |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| } |
| |
| data->stack_parm = stack_parm; |
| SET_DECL_RTL (parm, stack_parm); |
| } |
| |
| /* A subroutine of assign_parms. Allocate a pseudo to hold the current |
| parameter. Get it there. Perform all ABI specified conversions. */ |
| |
| static void |
| assign_parm_setup_reg (struct assign_parm_data_all *all, tree parm, |
| struct assign_parm_data_one *data) |
| { |
| rtx parmreg; |
| enum machine_mode promoted_nominal_mode; |
| int unsignedp = TYPE_UNSIGNED (TREE_TYPE (parm)); |
| bool did_conversion = false; |
| |
| /* Store the parm in a pseudoregister during the function, but we may |
| need to do it in a wider mode. */ |
| |
| promoted_nominal_mode |
| = promote_mode (data->nominal_type, data->nominal_mode, &unsignedp, 0); |
| |
| /* APPLE LOCAL begin CW asm blocks */ |
| /* In asm functions with no stack frame, leave it in the register. */ |
| if (cfun->iasm_frame_size == -2 |
| && cfun->iasm_noreturn) |
| { |
| parmreg = DECL_INCOMING_RTL (parm); |
| if (promoted_nominal_mode != GET_MODE (parmreg)) |
| warning ("wrong mode for arg %qD", parm); |
| } |
| else |
| /* APPLE LOCAL end CW asm blocks */ |
| parmreg = gen_reg_rtx (promoted_nominal_mode); |
| |
| if (!DECL_ARTIFICIAL (parm)) |
| mark_user_reg (parmreg); |
| |
| /* If this was an item that we received a pointer to, |
| set DECL_RTL appropriately. */ |
| if (data->passed_pointer) |
| { |
| rtx x = gen_rtx_MEM (TYPE_MODE (TREE_TYPE (data->passed_type)), parmreg); |
| set_mem_attributes (x, parm, 1); |
| SET_DECL_RTL (parm, x); |
| } |
| else |
| SET_DECL_RTL (parm, parmreg); |
| |
| /* Copy the value into the register. */ |
| if (data->nominal_mode != data->passed_mode |
| || promoted_nominal_mode != data->promoted_mode) |
| { |
| int save_tree_used; |
| |
| /* ENTRY_PARM has been converted to PROMOTED_MODE, its |
| mode, by the caller. We now have to convert it to |
| NOMINAL_MODE, if different. However, PARMREG may be in |
| a different mode than NOMINAL_MODE if it is being stored |
| promoted. |
| |
| If ENTRY_PARM is a hard register, it might be in a register |
| not valid for operating in its mode (e.g., an odd-numbered |
| register for a DFmode). In that case, moves are the only |
| thing valid, so we can't do a convert from there. This |
| occurs when the calling sequence allow such misaligned |
| usages. |
| |
| In addition, the conversion may involve a call, which could |
| clobber parameters which haven't been copied to pseudo |
| registers yet. Therefore, we must first copy the parm to |
| a pseudo reg here, and save the conversion until after all |
| parameters have been moved. */ |
| |
| rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm)); |
| |
| emit_move_insn (tempreg, validize_mem (data->entry_parm)); |
| |
| push_to_sequence (all->conversion_insns); |
| tempreg = convert_to_mode (data->nominal_mode, tempreg, unsignedp); |
| |
| if (GET_CODE (tempreg) == SUBREG |
| && GET_MODE (tempreg) == data->nominal_mode |
| && REG_P (SUBREG_REG (tempreg)) |
| && data->nominal_mode == data->passed_mode |
| && GET_MODE (SUBREG_REG (tempreg)) == GET_MODE (data->entry_parm) |
| && GET_MODE_SIZE (GET_MODE (tempreg)) |
| < GET_MODE_SIZE (GET_MODE (data->entry_parm))) |
| { |
| /* The argument is already sign/zero extended, so note it |
| into the subreg. */ |
| SUBREG_PROMOTED_VAR_P (tempreg) = 1; |
| SUBREG_PROMOTED_UNSIGNED_SET (tempreg, unsignedp); |
| } |
| |
| /* TREE_USED gets set erroneously during expand_assignment. */ |
| save_tree_used = TREE_USED (parm); |
| expand_assignment (parm, make_tree (data->nominal_type, tempreg)); |
| TREE_USED (parm) = save_tree_used; |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| |
| did_conversion = true; |
| } |
| else |
| emit_move_insn (parmreg, validize_mem (data->entry_parm)); |
| |
| /* If we were passed a pointer but the actual value can safely live |
| in a register, put it in one. */ |
| if (data->passed_pointer |
| && TYPE_MODE (TREE_TYPE (parm)) != BLKmode |
| /* If by-reference argument was promoted, demote it. */ |
| && (TYPE_MODE (TREE_TYPE (parm)) != GET_MODE (DECL_RTL (parm)) |
| || use_register_for_decl (parm))) |
| { |
| /* We can't use nominal_mode, because it will have been set to |
| Pmode above. We must use the actual mode of the parm. */ |
| parmreg = gen_reg_rtx (TYPE_MODE (TREE_TYPE (parm))); |
| mark_user_reg (parmreg); |
| |
| if (GET_MODE (parmreg) != GET_MODE (DECL_RTL (parm))) |
| { |
| rtx tempreg = gen_reg_rtx (GET_MODE (DECL_RTL (parm))); |
| int unsigned_p = TYPE_UNSIGNED (TREE_TYPE (parm)); |
| |
| push_to_sequence (all->conversion_insns); |
| emit_move_insn (tempreg, DECL_RTL (parm)); |
| tempreg = convert_to_mode (GET_MODE (parmreg), tempreg, unsigned_p); |
| emit_move_insn (parmreg, tempreg); |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| |
| did_conversion = true; |
| } |
| else |
| emit_move_insn (parmreg, DECL_RTL (parm)); |
| |
| SET_DECL_RTL (parm, parmreg); |
| |
| /* STACK_PARM is the pointer, not the parm, and PARMREG is |
| now the parm. */ |
| data->stack_parm = NULL; |
| } |
| |
| /* Mark the register as eliminable if we did no conversion and it was |
| copied from memory at a fixed offset, and the arg pointer was not |
| copied to a pseudo-reg. If the arg pointer is a pseudo reg or the |
| offset formed an invalid address, such memory-equivalences as we |
| make here would screw up life analysis for it. */ |
| if (data->nominal_mode == data->passed_mode |
| && !did_conversion |
| && data->stack_parm != 0 |
| && MEM_P (data->stack_parm) |
| && data->locate.offset.var == 0 |
| && reg_mentioned_p (virtual_incoming_args_rtx, |
| XEXP (data->stack_parm, 0))) |
| { |
| rtx linsn = get_last_insn (); |
| rtx sinsn, set; |
| |
| /* Mark complex types separately. */ |
| if (GET_CODE (parmreg) == CONCAT) |
| { |
| enum machine_mode submode |
| = GET_MODE_INNER (GET_MODE (parmreg)); |
| int regnor = REGNO (XEXP (parmreg, 0)); |
| int regnoi = REGNO (XEXP (parmreg, 1)); |
| rtx stackr = adjust_address_nv (data->stack_parm, submode, 0); |
| rtx stacki = adjust_address_nv (data->stack_parm, submode, |
| GET_MODE_SIZE (submode)); |
| |
| /* Scan backwards for the set of the real and |
| imaginary parts. */ |
| for (sinsn = linsn; sinsn != 0; |
| sinsn = prev_nonnote_insn (sinsn)) |
| { |
| set = single_set (sinsn); |
| if (set == 0) |
| continue; |
| |
| if (SET_DEST (set) == regno_reg_rtx [regnoi]) |
| REG_NOTES (sinsn) |
| = gen_rtx_EXPR_LIST (REG_EQUIV, stacki, |
| REG_NOTES (sinsn)); |
| else if (SET_DEST (set) == regno_reg_rtx [regnor]) |
| REG_NOTES (sinsn) |
| = gen_rtx_EXPR_LIST (REG_EQUIV, stackr, |
| REG_NOTES (sinsn)); |
| } |
| } |
| else if ((set = single_set (linsn)) != 0 |
| && SET_DEST (set) == parmreg) |
| REG_NOTES (linsn) |
| = gen_rtx_EXPR_LIST (REG_EQUIV, |
| data->stack_parm, REG_NOTES (linsn)); |
| } |
| |
| /* For pointer data type, suggest pointer register. */ |
| if (POINTER_TYPE_P (TREE_TYPE (parm))) |
| mark_reg_pointer (parmreg, |
| TYPE_ALIGN (TREE_TYPE (TREE_TYPE (parm)))); |
| } |
| |
| /* A subroutine of assign_parms. Allocate stack space to hold the current |
| parameter. Get it there. Perform all ABI specified conversions. */ |
| |
| static void |
| assign_parm_setup_stack (struct assign_parm_data_all *all, tree parm, |
| struct assign_parm_data_one *data) |
| { |
| /* Value must be stored in the stack slot STACK_PARM during function |
| execution. */ |
| bool to_conversion = false; |
| |
| if (data->promoted_mode != data->nominal_mode) |
| { |
| /* Conversion is required. */ |
| rtx tempreg = gen_reg_rtx (GET_MODE (data->entry_parm)); |
| |
| emit_move_insn (tempreg, validize_mem (data->entry_parm)); |
| |
| push_to_sequence (all->conversion_insns); |
| to_conversion = true; |
| |
| data->entry_parm = convert_to_mode (data->nominal_mode, tempreg, |
| TYPE_UNSIGNED (TREE_TYPE (parm))); |
| |
| if (data->stack_parm) |
| /* ??? This may need a big-endian conversion on sparc64. */ |
| data->stack_parm |
| = adjust_address (data->stack_parm, data->nominal_mode, 0); |
| } |
| |
| if (data->entry_parm != data->stack_parm) |
| { |
| rtx src, dest; |
| |
| if (data->stack_parm == 0) |
| { |
| data->stack_parm |
| = assign_stack_local (GET_MODE (data->entry_parm), |
| GET_MODE_SIZE (GET_MODE (data->entry_parm)), |
| TYPE_ALIGN (data->passed_type)); |
| set_mem_attributes (data->stack_parm, parm, 1); |
| } |
| |
| dest = validize_mem (data->stack_parm); |
| src = validize_mem (data->entry_parm); |
| |
| if (MEM_P (src)) |
| { |
| /* Use a block move to handle potentially misaligned entry_parm. */ |
| if (!to_conversion) |
| push_to_sequence (all->conversion_insns); |
| to_conversion = true; |
| |
| emit_block_move (dest, src, |
| GEN_INT (int_size_in_bytes (data->passed_type)), |
| BLOCK_OP_NORMAL); |
| } |
| else |
| emit_move_insn (dest, src); |
| } |
| |
| if (to_conversion) |
| { |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| } |
| |
| SET_DECL_RTL (parm, data->stack_parm); |
| } |
| |
| /* A subroutine of assign_parms. If the ABI splits complex arguments, then |
| undo the frobbing that we did in assign_parms_augmented_arg_list. */ |
| |
| static void |
| assign_parms_unsplit_complex (struct assign_parm_data_all *all, tree fnargs) |
| { |
| tree parm; |
| tree orig_fnargs = all->orig_fnargs; |
| |
| for (parm = orig_fnargs; parm; parm = TREE_CHAIN (parm)) |
| { |
| if (TREE_CODE (TREE_TYPE (parm)) == COMPLEX_TYPE |
| && targetm.calls.split_complex_arg (TREE_TYPE (parm))) |
| { |
| rtx tmp, real, imag; |
| enum machine_mode inner = GET_MODE_INNER (DECL_MODE (parm)); |
| |
| real = DECL_RTL (fnargs); |
| imag = DECL_RTL (TREE_CHAIN (fnargs)); |
| if (inner != GET_MODE (real)) |
| { |
| real = gen_lowpart_SUBREG (inner, real); |
| imag = gen_lowpart_SUBREG (inner, imag); |
| } |
| |
| if (TREE_ADDRESSABLE (parm)) |
| { |
| rtx rmem, imem; |
| HOST_WIDE_INT size = int_size_in_bytes (TREE_TYPE (parm)); |
| |
| /* split_complex_arg put the real and imag parts in |
| pseudos. Move them to memory. */ |
| tmp = assign_stack_local (DECL_MODE (parm), size, |
| TYPE_ALIGN (TREE_TYPE (parm))); |
| set_mem_attributes (tmp, parm, 1); |
| rmem = adjust_address_nv (tmp, inner, 0); |
| imem = adjust_address_nv (tmp, inner, GET_MODE_SIZE (inner)); |
| push_to_sequence (all->conversion_insns); |
| emit_move_insn (rmem, real); |
| emit_move_insn (imem, imag); |
| all->conversion_insns = get_insns (); |
| end_sequence (); |
| } |
| else |
| tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag); |
| SET_DECL_RTL (parm, tmp); |
| |
| real = DECL_INCOMING_RTL (fnargs); |
| imag = DECL_INCOMING_RTL (TREE_CHAIN (fnargs)); |
| if (inner != GET_MODE (real)) |
| { |
| real = gen_lowpart_SUBREG (inner, real); |
| imag = gen_lowpart_SUBREG (inner, imag); |
| } |
| tmp = gen_rtx_CONCAT (DECL_MODE (parm), real, imag); |
| set_decl_incoming_rtl (parm, tmp); |
| fnargs = TREE_CHAIN (fnargs); |
| } |
| else |
| { |
| SET_DECL_RTL (parm, DECL_RTL (fnargs)); |
| set_decl_incoming_rtl (parm, DECL_INCOMING_RTL (fnargs)); |
| |
| /* Set MEM_EXPR to the original decl, i.e. to PARM, |
| instead of the copy of decl, i.e. FNARGS. */ |
| if (DECL_INCOMING_RTL (parm) && MEM_P (DECL_INCOMING_RTL (parm))) |
| set_mem_expr (DECL_INCOMING_RTL (parm), parm); |
| } |
| |
| fnargs = TREE_CHAIN (fnargs); |
| } |
| } |
| |
| /* Assign RTL expressions to the function's parameters. This may involve |
| copying them into registers and using those registers as the DECL_RTL. */ |
| |
| static void |
| assign_parms (tree fndecl) |
| { |
| struct assign_parm_data_all all; |
| tree fnargs, parm; |
| /* APPLE LOCAL deletion mainline 2006-02-17 4356747 stack realign */ |
| /* APPLE LOCAL AltiVec */ |
| int pass, last_pass; |
| |
| /* APPLE LOCAL begin mainline 2006-02-17 4356747 stack realign */ |
| current_function_internal_arg_pointer |
| = targetm.calls.internal_arg_pointer (); |
| /* APPLE LOCAL end mainline 2006-02-17 4356747 stack realign */ |
| |
| assign_parms_initialize_all (&all); |
| fnargs = assign_parms_augmented_arg_list (&all); |
| |
| /* APPLE LOCAL begin AltiVec */ |
| last_pass = 1; |
| |
| for (pass = 1; pass <= last_pass; pass++) |
| { |
| for (parm = fnargs; parm; parm = TREE_CHAIN (parm)) |
| { |
| struct assign_parm_data_one data; |
| |
| tree type = TREE_TYPE (parm); |
| /* In 1st iteration over actual arguments, only consider non-vectors. |
| During 2nd iteration, finish off with vector parameters. */ |
| if (!current_function_stdarg && targetm.calls.skip_vec_args (type, pass, &last_pass)) |
| continue; |
| |
| /* Extract the type of PARM; adjust it according to ABI. */ |
| assign_parm_find_data_types (&all, parm, &data); |
| |
| /* Early out for errors and void parameters. */ |
| if (data.passed_mode == VOIDmode) |
| { |
| SET_DECL_RTL (parm, const0_rtx); |
| DECL_INCOMING_RTL (parm) = DECL_RTL (parm); |
| continue; |
| } |
| |
| if (current_function_stdarg && !TREE_CHAIN (parm)) |
| assign_parms_setup_varargs (&all, &data, false); |
| |
| /* Find out where the parameter arrives in this function. */ |
| assign_parm_find_entry_rtl (&all, &data); |
| |
| /* Find out where stack space for this parameter might be. */ |
| if (assign_parm_is_stack_parm (&all, &data)) |
| { |
| assign_parm_find_stack_rtl (parm, &data); |
| assign_parm_adjust_entry_rtl (&data); |
| } |
| |
| /* Record permanently how this parm was passed. */ |
| set_decl_incoming_rtl (parm, data.entry_parm); |
| |
| /* Update info on where next arg arrives in registers. */ |
| FUNCTION_ARG_ADVANCE (all.args_so_far, data.promoted_mode, |
| data.passed_type, data.named_arg); |
| |
| assign_parm_adjust_stack_rtl (&data); |
| |
| if (assign_parm_setup_block_p (&data)) |
| assign_parm_setup_block (&all, parm, &data); |
| else if (data.passed_pointer || use_register_for_decl (parm)) |
| assign_parm_setup_reg (&all, parm, &data); |
| else |
| assign_parm_setup_stack (&all, parm, &data); |
| } |
| } |
| /* APPLE LOCAL end AltiVec */ |
| |
| if (targetm.calls.split_complex_arg && fnargs != all.orig_fnargs) |
| assign_parms_unsplit_complex (&all, fnargs); |
| |
| /* Output all parameter conversion instructions (possibly including calls) |
| now that all parameters have been copied out of hard registers. */ |
| emit_insn (all.conversion_insns); |
| |
| /* If we are receiving a struct value address as the first argument, set up |
| the RTL for the function result. As this might require code to convert |
| the transmitted address to Pmode, we do this here to ensure that possible |
| preliminary conversions of the address have been emitted already. */ |
| if (all.function_result_decl) |
| { |
| tree result = DECL_RESULT (current_function_decl); |
| rtx addr = DECL_RTL (all.function_result_decl); |
| rtx x; |
| |
| if (DECL_BY_REFERENCE (result)) |
| x = addr; |
| else |
| { |
| addr = convert_memory_address (Pmode, addr); |
| x = gen_rtx_MEM (DECL_MODE (result), addr); |
| set_mem_attributes (x, result, 1); |
| } |
| SET_DECL_RTL (result, x); |
| } |
| |
| /* We have aligned all the args, so add space for the pretend args. */ |
| current_function_pretend_args_size = all.pretend_args_size; |
| all.stack_args_size.constant += all.extra_pretend_bytes; |
| current_function_args_size = all.stack_args_size.constant; |
| /* APPLE LOCAL sibcall optimization stomped CW frames (radar 3007352) */ |
| cfun->unrounded_args_size = all.stack_args_size.constant; |
| |
| /* Adjust function incoming argument size for alignment and |
| minimum length. */ |
| |
| #ifdef REG_PARM_STACK_SPACE |
| current_function_args_size = MAX (current_function_args_size, |
| REG_PARM_STACK_SPACE (fndecl)); |
| #endif |
| |
| current_function_args_size |
| = ((current_function_args_size + STACK_BYTES - 1) |
| / STACK_BYTES) * STACK_BYTES; |
| |
| #ifdef ARGS_GROW_DOWNWARD |
| current_function_arg_offset_rtx |
| = (all.stack_args_size.var == 0 ? GEN_INT (-all.stack_args_size.constant) |
| : expand_expr (size_diffop (all.stack_args_size.var, |
| |