mirror of
https://gcc.gnu.org/git/gcc.git
synced 2024-12-12 13:23:47 +08:00
e3b5732b21
PR testsuite/35843 * cfgexpand.c (pass_expand): Turn into RTL pass. * passes.c (execute_one_pass): Do pass typechecking after execution. * tree-pass.h (pass_expand): Turn into RTL pass. * function.h (struct rtl_data): Move here fields accesses_prior_frames, calls_eh_return, saves_all_registers, has_nonlocal_goto, has_asm_statement, is_thunk, all_throwers_are_sibcalls, limit_stack, profile, uses_const_pool, uses_pic_offset_table, uses_eh_lsda, tail_call_emit, arg_pointer_save_area_init from struct function; turn into bool. (struct function): Move calls_eh_return, saves_all_registers, has_nonlocal_goto, has_asm_statement, is_thunk, all_throwers_are_sibcalls, limit_stack, profile, uses_const_pool, uses_pic_offset_table, uses_eh_lsda, tail_call_emit, arg_pointer_save_area_init into struct rtl_data. Remove recursive_call_emit and gimplified flags. (current_function_returns_struct, current_function_returns_pcc_struct, current_function_calls_setjmp, current_function_calls_alloca, current_function_accesses_prior_frames, current_function_calls_eh_return, current_function_is_thunk, current_function_stdarg, current_function_profile, current_function_limit_stack, current_function_uses_pic_offset_table, current_function_uses_const_pool, current_function_has_nonlocal_label, current_function_saves_all_registers, current_function_has_nonlocal_goto, current_function_has_asm_statement): Remove accesor macros. * ra-conflict.c (global_conflicts): Update. * tree-tailcall.c (suitable_for_tail_opt_p): Update. (suitable_for_tail_call_opt_p): Update. * builtins.c (expand_builtin_return_addr): Update. (expand_builtin_setjmp_setup): Update. (expand_builtin_nonlocal_goto): Update. * final.c (final_start_function): Update. (profile_function): Update. (leaf_function_p): Update. (only_leaf_regs_used): Update. * df-scan.c (df_get_exit_block_use_set): Update. * dojump.c (clear_pending_stack_adjust): Update. * tree-stdarg.c (gate_optimize_stdarg): Update. 
* gimple-low.c (lower_function_body): Update. * global.c (compute_regsets): Update. (global_alloc): Update. * dwarf2out.c (dwarf2out_begin_prologue): Update. * expr.c (expand_assignment): Update. * dse.c (dse_step0): Update. (dse_step1): Update. * c-decl.c (store_parm_decls): Update. * local-alloc.c (combine_regs): Update. (find_free_reg): Update. * function.c (assign_parms_augmented_arg_list): Update. (assign_parm_find_data_types): Update. (assign_parms): Update. (allocate_struct_function): Update. (expand_function_start): Update. (expand_function_end): Update. (get_arg_pointer_save_area): Update. (thread_prologue_and_epilogue_insns): Update. (rest_of_match_asm_constraints): Update. * stor-layout.c (variable_size): Update. * gcse.c (gcse_main): Update. (bypass_jumps): Update. * gimplify.c (gimplify_function_tree): Update. * calls.c (emit_call_1): Update. (expand_call): Update. * bt-load.c (compute_defs_uses_and_gen): Update. * except.c (sjlj_assign_call_site_values): Update. (sjlj_emit_function_enter): Update. (can_throw_external): Update. (set_nothrow_function_flags): Update. (expand_builtin_unwind_init): Update. (expand_eh_return): Update. (convert_to_eh_region_ranges): Update. (output_function_exception_table): Update. * emit-rtl.c (gen_tmp_stack_mem): Update. * cfgexpand.c (expand_used_vars): Update. (tree_expand_cfg): Update. * cfgcleanup.c (rest_of_handle_jump): Update. * explow.c (allocate_dynamic_stack_space): Update. * varasm.c (assemble_start_function): Update. (force_const_mem): Update. (mark_constant_pool): Update. * tree-optimize.c (tree_rest_of_compilation): Update. * stack-ptr-mod.c (notice_stack_pointer_modification): Update. * tree-cfg.c (notice_special_calls): Update. (is_ctrl_altering_stmt): Update. (tree_can_make_abnormal_goto): Update. (tree_purge_dead_abnormal_call_edges): Update. * config/alpha/predicates.md: Update. * config/alpha/alpha.c (alpha_sa_mask): Update. (alpha_sa_size): Update. (alpha_does_function_need_gp): Update. 
(alpha_expand_prologue): Update. (alpha_start_function): Update. (alpha_output_function_end_prologue): Update. (alpha_expand_epilogue): Update. * config/frv/frv.c (frv_stack_info): Update. (frv_expand_epilogue): Update. * config/s390/s390.c (s390_regs_ever_clobbered): Update. (s390_register_info): Update. (s390_frame_info): Update. (s390_init_frame_layout): Update. (s390_can_eliminate): Update. (save_gprs): Update. * config/spu/spu.c (spu_split_immediate): Update. (need_to_save_reg): Update. (spu_expand_prologue): Update. (spu_expand_epilogue): Update. * config/sparc/sparc.md: Update. * config/sparc/sparc.c (eligible_for_return_delay): Update. (sparc_tls_got): Update. (legitimize_pic_address): Update. (sparc_emit_call_insn): Update. (sparc_expand_prologue): Update. (output_return): Update. (print_operand): Update. (sparc_function_ok_for_sibcall): Update. * config/sparc/sparc.h (EXIT_IGNORE_STACK): Update. * config/m32r/m32r.md: Update. * config/m32r/m32r.c (MUST_SAVE_RETURN_ADDR): Update. (m32r_compute_frame_size): Update. (m32r_expand_prologue): Update. (m32r_expand_epilogue): Update. (m32r_legitimize_pic_address): Update. * config/m32r/m32r.h (FRAME_POINTER_REQUIRED): Update. * config/i386/linux.h (SUBTARGET_FRAME_POINTER_REQUIRED): Update. * config/i386/i386.c (ix86_frame_pointer_required): Update. (gen_push): Update. (ix86_save_reg): Update. (ix86_compute_frame_layout): Update. (ix86_expand_prologue): Update. (ix86_expand_epilogue): Update. * config/sh/sh.c (output_stack_adjust): Update. (calc_live_regs): Update. (sh5_schedule_saves): Update. (sh_expand_prologue): Update. (sh_expand_epilogue): Update. (sh_setup_incoming_varargs): Update. (sh_allocate_initial_value): Update. (sh_get_pr_initial_val): Update. * config/sh/sh.h (SHMEDIA_REGS_STACK_ADJUST): Update. * config/sh/sh.md (label:): Update. * config/avr/avr.c (out_movhi_mr_r): Update. * config/crx/crx.h (enum): Update. * config/xtensa/xtensa.h (along): Update. * config/stormy16/stormy16.c Update. 
(xstormy16_compute_stack_layout): Update. * config/fr30/fr30.c (MUST_SAVE_RETURN_POINTER): Update. (fr30_expand_prologue): Update. * config/cris/cris.c (cris_conditional_register_usage): Update. (cris_reg_saved_in_regsave_area): Update. (cris_initial_frame_pointer_offset): Update. (cris_simple_epilogue): Update. (cris_expand_prologue): Update. (cris_expand_epilogue): Update. (cris_expand_pic_call_address): Update. (cris_asm_output_symbol_ref): Update. (cris_asm_output_label_ref): Update. * config/cris/cris.md Update. * config/iq2000/iq2000.c (compute_frame_size): Update. (iq2000_expand_epilogue): Update. * config/mt/mt.h (save_direction): Update. * config/mn10300/mn10300.c (mn10300_function_value): Update. * config/ia64/ia64.c (ia64_compute_frame_size): Update. (ia64_secondary_reload_class): Update. * config/m68k/m68k.c (m68k_save_reg): Update. (m68k_expand_prologue): Update. (m68k_expand_epilogue): Update. (legitimize_pic_address): Update. * config/rs6000/rs6000.c (rs6000_got_register): Update. (first_reg_to_save): Update. (first_altivec_reg_to_save): Update. (compute_vrsave_mask): Update. (compute_save_world_info): Update. (rs6000_stack_info): Update. (spe_func_has_64bit_regs_p): Update. (rs6000_ra_ever_killed): Update. (rs6000_emit_eh_reg_restore): Update. (rs6000_emit_allocate_stack): Update. (rs6000_emit_prologue): Update. (rs6000_emit_epilogue): Update. (rs6000_output_function_epilogue): Update. (output_profile_hook): Update. (rs6000_elf_declare_function_name): Update. * config/rs6000/rs6000.h (rs6000_args): Update. * config/rs6000/rs6000.md: Update. * config/mcore/mcore.c (mcore_expand_prolog): Update. * config/arc/arc.c (arc_output_function_epilogue): Update. * config/arc/arc.h (FRAME_POINTER_REQUIRED): Update. * config/darwin.c (machopic_function_base_name): Update. * config/score/score3.c (score3_compute_frame_size): Update. (rpush): Update. (rpop): Update. (score3_epilogue): Update. * config/score/score7.c (score7_compute_frame_size): Update. 
(score7_prologue): Update. (score7_epilogue): Update. * config/score/score.h (FRAME_POINTER_REQUIRED): Update. * config/arm/linux-elf.h (SUBTARGET_FRAME_POINTER_REQUIRED): Update. * config/arm/arm.c (use_return_insn): Update. (require_pic_register): Update. (arm_load_pic_register): Update. (arm_compute_save_reg0_reg12_mask): Update. (arm_compute_save_reg_mask): Update. (thumb1_compute_save_reg_mask): Update. (output_return_instruction): Update. (arm_output_function_prologue): Update. (arm_output_epilogue): Update. (arm_get_frame_offsets): Update. (arm_expand_prologue): Update. (thumb_pushpop): Update. (thumb_exit): Update. (thumb1_expand_prologue): Update. (thumb1_expand_epilogue): Update. (arm_unwind_emit): Update. (arm_output_fn_unwind): Update. * config/arm/arm.h (FRAME_POINTER_REQUIRED): Update. * config/arm/arm.md: Update. * config/pa/pa.md: Update. * config/pa/pa.c (legitimize_pic_address): Update. (compute_frame_size): Update. (hppa_expand_prologue): Update. (hppa_expand_epilogue): Update. (borx_reg_operand): Update. * config/pa/pa.h (FRAME_POINTER_REQUIRED): Update. (HARD_REGNO_RENAME_OK): Update. * config/mips/mips.c (mips_global_pointer): Update. (mips_save_reg_p): Update. (mips_compute_frame_info): Update. (mips_frame_pointer_required): Update. (mips_expand_prologue): Update. (mips_expand_epilogue): Update. (mips_can_use_return_insn): Update. (mips_reorg_process_insns): Update. * config/v850/v850.c (compute_register_save_size): Update. * config/mmix/mmix.h (FRAME_POINTER_REQUIRED): Update. * config/mmix/mmix.c (along): Update. (mmix_expand_epilogue): Update. * config/bfin/bfin.c (legitimize_pic_address): Update. (must_save_p): Update. (stack_frame_needed_p): Update. (add_to_reg): Update. (bfin_expand_prologue): Update. * stmt.c (expand_asm_operands): Update. * reload1.c (reload): Update. (init_elim_table): Update. From-SVN: r134682
925 lines
24 KiB
C
925 lines
24 KiB
C
/* Pass computing data for optimizing stdarg functions.
   Copyright (C) 2004, 2005, 2007, 2008 Free Software Foundation, Inc.
   Contributed by Jakub Jelinek <jakub@redhat.com>

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3, or (at your option)
any later version.

GCC is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "tm.h"
|
|
#include "tree.h"
|
|
#include "function.h"
|
|
#include "langhooks.h"
|
|
#include "diagnostic.h"
|
|
#include "target.h"
|
|
#include "tree-flow.h"
|
|
#include "tree-pass.h"
|
|
#include "tree-stdarg.h"
|
|
|
|
/* A simple pass that attempts to optimize stdarg functions on architectures
   that need to save register arguments to stack on entry to stdarg functions.
   If the function doesn't use any va_start macros, no registers need to
   be saved.  If va_start macros are used but the va_list variables don't
   escape the function, it is only necessary to save registers that will be
   used in va_arg macros.  E.g. if va_arg is only used with integral types
   in the function, floating point registers don't need to be saved, etc.  */
|
|
|
|
|
|
/* Return true if basic block VA_ARG_BB is dominated by VA_START_BB and
|
|
is executed at most as many times as VA_START_BB. */
|
|
|
|
static bool
|
|
reachable_at_most_once (basic_block va_arg_bb, basic_block va_start_bb)
|
|
{
|
|
VEC (edge, heap) *stack = NULL;
|
|
edge e;
|
|
edge_iterator ei;
|
|
sbitmap visited;
|
|
bool ret;
|
|
|
|
if (va_arg_bb == va_start_bb)
|
|
return true;
|
|
|
|
if (! dominated_by_p (CDI_DOMINATORS, va_arg_bb, va_start_bb))
|
|
return false;
|
|
|
|
visited = sbitmap_alloc (last_basic_block);
|
|
sbitmap_zero (visited);
|
|
ret = true;
|
|
|
|
FOR_EACH_EDGE (e, ei, va_arg_bb->preds)
|
|
VEC_safe_push (edge, heap, stack, e);
|
|
|
|
while (! VEC_empty (edge, stack))
|
|
{
|
|
basic_block src;
|
|
|
|
e = VEC_pop (edge, stack);
|
|
src = e->src;
|
|
|
|
if (e->flags & EDGE_COMPLEX)
|
|
{
|
|
ret = false;
|
|
break;
|
|
}
|
|
|
|
if (src == va_start_bb)
|
|
continue;
|
|
|
|
/* va_arg_bb can be executed more times than va_start_bb. */
|
|
if (src == va_arg_bb)
|
|
{
|
|
ret = false;
|
|
break;
|
|
}
|
|
|
|
gcc_assert (src != ENTRY_BLOCK_PTR);
|
|
|
|
if (! TEST_BIT (visited, src->index))
|
|
{
|
|
SET_BIT (visited, src->index);
|
|
FOR_EACH_EDGE (e, ei, src->preds)
|
|
VEC_safe_push (edge, heap, stack, e);
|
|
}
|
|
}
|
|
|
|
VEC_free (edge, heap, stack);
|
|
sbitmap_free (visited);
|
|
return ret;
|
|
}
|
|
|
|
|
|
/* For statement COUNTER = RHS, if RHS is COUNTER + constant,
|
|
return constant, otherwise return (unsigned HOST_WIDE_INT) -1.
|
|
GPR_P is true if this is GPR counter. */
|
|
|
|
static unsigned HOST_WIDE_INT
|
|
va_list_counter_bump (struct stdarg_info *si, tree counter, tree rhs,
|
|
bool gpr_p)
|
|
{
|
|
tree stmt, lhs, orig_lhs;
|
|
unsigned HOST_WIDE_INT ret = 0, val, counter_val;
|
|
unsigned int max_size;
|
|
|
|
if (si->offsets == NULL)
|
|
{
|
|
unsigned int i;
|
|
|
|
si->offsets = XNEWVEC (int, num_ssa_names);
|
|
for (i = 0; i < num_ssa_names; ++i)
|
|
si->offsets[i] = -1;
|
|
}
|
|
|
|
counter_val = gpr_p ? cfun->va_list_gpr_size : cfun->va_list_fpr_size;
|
|
max_size = gpr_p ? VA_LIST_MAX_GPR_SIZE : VA_LIST_MAX_FPR_SIZE;
|
|
orig_lhs = lhs = rhs;
|
|
while (lhs)
|
|
{
|
|
if (si->offsets[SSA_NAME_VERSION (lhs)] != -1)
|
|
{
|
|
if (counter_val >= max_size)
|
|
{
|
|
ret = max_size;
|
|
break;
|
|
}
|
|
|
|
ret -= counter_val - si->offsets[SSA_NAME_VERSION (lhs)];
|
|
break;
|
|
}
|
|
|
|
stmt = SSA_NAME_DEF_STMT (lhs);
|
|
|
|
if (TREE_CODE (stmt) != GIMPLE_MODIFY_STMT
|
|
|| GIMPLE_STMT_OPERAND (stmt, 0) != lhs)
|
|
return (unsigned HOST_WIDE_INT) -1;
|
|
|
|
rhs = GIMPLE_STMT_OPERAND (stmt, 1);
|
|
if (TREE_CODE (rhs) == WITH_SIZE_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
if (TREE_CODE (rhs) == SSA_NAME)
|
|
{
|
|
lhs = rhs;
|
|
continue;
|
|
}
|
|
|
|
if ((TREE_CODE (rhs) == NOP_EXPR
|
|
|| TREE_CODE (rhs) == CONVERT_EXPR)
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 0)) == SSA_NAME)
|
|
{
|
|
lhs = TREE_OPERAND (rhs, 0);
|
|
continue;
|
|
}
|
|
|
|
if ((TREE_CODE (rhs) == POINTER_PLUS_EXPR
|
|
|| TREE_CODE (rhs) == PLUS_EXPR)
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 0)) == SSA_NAME
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 1)) == INTEGER_CST
|
|
&& host_integerp (TREE_OPERAND (rhs, 1), 1))
|
|
{
|
|
ret += tree_low_cst (TREE_OPERAND (rhs, 1), 1);
|
|
lhs = TREE_OPERAND (rhs, 0);
|
|
continue;
|
|
}
|
|
|
|
if (TREE_CODE (counter) != TREE_CODE (rhs))
|
|
return (unsigned HOST_WIDE_INT) -1;
|
|
|
|
if (TREE_CODE (counter) == COMPONENT_REF)
|
|
{
|
|
if (get_base_address (counter) != get_base_address (rhs)
|
|
|| TREE_CODE (TREE_OPERAND (rhs, 1)) != FIELD_DECL
|
|
|| TREE_OPERAND (counter, 1) != TREE_OPERAND (rhs, 1))
|
|
return (unsigned HOST_WIDE_INT) -1;
|
|
}
|
|
else if (counter != rhs)
|
|
return (unsigned HOST_WIDE_INT) -1;
|
|
|
|
lhs = NULL;
|
|
}
|
|
|
|
lhs = orig_lhs;
|
|
val = ret + counter_val;
|
|
while (lhs)
|
|
{
|
|
if (si->offsets[SSA_NAME_VERSION (lhs)] != -1)
|
|
break;
|
|
|
|
if (val >= max_size)
|
|
si->offsets[SSA_NAME_VERSION (lhs)] = max_size;
|
|
else
|
|
si->offsets[SSA_NAME_VERSION (lhs)] = val;
|
|
|
|
stmt = SSA_NAME_DEF_STMT (lhs);
|
|
|
|
rhs = GIMPLE_STMT_OPERAND (stmt, 1);
|
|
if (TREE_CODE (rhs) == WITH_SIZE_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
if (TREE_CODE (rhs) == SSA_NAME)
|
|
{
|
|
lhs = rhs;
|
|
continue;
|
|
}
|
|
|
|
if ((TREE_CODE (rhs) == NOP_EXPR
|
|
|| TREE_CODE (rhs) == CONVERT_EXPR)
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 0)) == SSA_NAME)
|
|
{
|
|
lhs = TREE_OPERAND (rhs, 0);
|
|
continue;
|
|
}
|
|
|
|
if ((TREE_CODE (rhs) == POINTER_PLUS_EXPR
|
|
|| TREE_CODE (rhs) == PLUS_EXPR)
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 0)) == SSA_NAME
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 1)) == INTEGER_CST
|
|
&& host_integerp (TREE_OPERAND (rhs, 1), 1))
|
|
{
|
|
val -= tree_low_cst (TREE_OPERAND (rhs, 1), 1);
|
|
lhs = TREE_OPERAND (rhs, 0);
|
|
continue;
|
|
}
|
|
|
|
lhs = NULL;
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
|
|
/* Called by walk_tree to look for references to va_list variables. */
|
|
|
|
static tree
|
|
find_va_list_reference (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED,
|
|
void *data)
|
|
{
|
|
bitmap va_list_vars = (bitmap) data;
|
|
tree var = *tp;
|
|
|
|
if (TREE_CODE (var) == SSA_NAME)
|
|
var = SSA_NAME_VAR (var);
|
|
|
|
if (TREE_CODE (var) == VAR_DECL
|
|
&& bitmap_bit_p (va_list_vars, DECL_UID (var)))
|
|
return var;
|
|
|
|
return NULL_TREE;
|
|
}
|
|
|
|
|
|
/* Helper function of va_list_counter_struct_op. Compute
|
|
cfun->va_list_{g,f}pr_size. AP is a va_list GPR/FPR counter,
|
|
if WRITE_P is true, seen in AP = VAR, otherwise seen in VAR = AP
|
|
statement. GPR_P is true if AP is a GPR counter, false if it is
|
|
a FPR counter. */
|
|
|
|
static void
|
|
va_list_counter_op (struct stdarg_info *si, tree ap, tree var, bool gpr_p,
|
|
bool write_p)
|
|
{
|
|
unsigned HOST_WIDE_INT increment;
|
|
|
|
if (si->compute_sizes < 0)
|
|
{
|
|
si->compute_sizes = 0;
|
|
if (si->va_start_count == 1
|
|
&& reachable_at_most_once (si->bb, si->va_start_bb))
|
|
si->compute_sizes = 1;
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file,
|
|
"bb%d will %sbe executed at most once for each va_start "
|
|
"in bb%d\n", si->bb->index, si->compute_sizes ? "" : "not ",
|
|
si->va_start_bb->index);
|
|
}
|
|
|
|
if (write_p
|
|
&& si->compute_sizes
|
|
&& (increment = va_list_counter_bump (si, ap, var, gpr_p)) + 1 > 1)
|
|
{
|
|
if (gpr_p && cfun->va_list_gpr_size + increment < VA_LIST_MAX_GPR_SIZE)
|
|
{
|
|
cfun->va_list_gpr_size += increment;
|
|
return;
|
|
}
|
|
|
|
if (!gpr_p && cfun->va_list_fpr_size + increment < VA_LIST_MAX_FPR_SIZE)
|
|
{
|
|
cfun->va_list_fpr_size += increment;
|
|
return;
|
|
}
|
|
}
|
|
|
|
if (write_p || !si->compute_sizes)
|
|
{
|
|
if (gpr_p)
|
|
cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
|
|
else
|
|
cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
|
|
}
|
|
}
|
|
|
|
|
|
/* If AP is a va_list GPR/FPR counter, compute cfun->va_list_{g,f}pr_size.
|
|
If WRITE_P is true, AP has been seen in AP = VAR assignment, if WRITE_P
|
|
is false, AP has been seen in VAR = AP assignment.
|
|
Return true if the AP = VAR (resp. VAR = AP) statement is a recognized
|
|
va_arg operation that doesn't cause the va_list variable to escape
|
|
current function. */
|
|
|
|
static bool
|
|
va_list_counter_struct_op (struct stdarg_info *si, tree ap, tree var,
|
|
bool write_p)
|
|
{
|
|
tree base;
|
|
|
|
if (TREE_CODE (ap) != COMPONENT_REF
|
|
|| TREE_CODE (TREE_OPERAND (ap, 1)) != FIELD_DECL)
|
|
return false;
|
|
|
|
if (TREE_CODE (var) != SSA_NAME
|
|
|| bitmap_bit_p (si->va_list_vars, DECL_UID (SSA_NAME_VAR (var))))
|
|
return false;
|
|
|
|
base = get_base_address (ap);
|
|
if (TREE_CODE (base) != VAR_DECL
|
|
|| !bitmap_bit_p (si->va_list_vars, DECL_UID (base)))
|
|
return false;
|
|
|
|
if (TREE_OPERAND (ap, 1) == va_list_gpr_counter_field)
|
|
va_list_counter_op (si, ap, var, true, write_p);
|
|
else if (TREE_OPERAND (ap, 1) == va_list_fpr_counter_field)
|
|
va_list_counter_op (si, ap, var, false, write_p);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* Check for TEM = AP. Return true if found and the caller shouldn't
|
|
search for va_list references in the statement. */
|
|
|
|
static bool
|
|
va_list_ptr_read (struct stdarg_info *si, tree ap, tree tem)
|
|
{
|
|
if (TREE_CODE (ap) != VAR_DECL
|
|
|| !bitmap_bit_p (si->va_list_vars, DECL_UID (ap)))
|
|
return false;
|
|
|
|
if (TREE_CODE (tem) != SSA_NAME
|
|
|| bitmap_bit_p (si->va_list_vars,
|
|
DECL_UID (SSA_NAME_VAR (tem)))
|
|
|| is_global_var (SSA_NAME_VAR (tem)))
|
|
return false;
|
|
|
|
if (si->compute_sizes < 0)
|
|
{
|
|
si->compute_sizes = 0;
|
|
if (si->va_start_count == 1
|
|
&& reachable_at_most_once (si->bb, si->va_start_bb))
|
|
si->compute_sizes = 1;
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file,
|
|
"bb%d will %sbe executed at most once for each va_start "
|
|
"in bb%d\n", si->bb->index, si->compute_sizes ? "" : "not ",
|
|
si->va_start_bb->index);
|
|
}
|
|
|
|
/* For void * or char * va_list types, there is just one counter.
|
|
If va_arg is used in a loop, we don't know how many registers need
|
|
saving. */
|
|
if (! si->compute_sizes)
|
|
return false;
|
|
|
|
if (va_list_counter_bump (si, ap, tem, true) == (unsigned HOST_WIDE_INT) -1)
|
|
return false;
|
|
|
|
/* Note the temporary, as we need to track whether it doesn't escape
|
|
the current function. */
|
|
bitmap_set_bit (si->va_list_escape_vars,
|
|
DECL_UID (SSA_NAME_VAR (tem)));
|
|
return true;
|
|
}
|
|
|
|
|
|
/* Check for:
|
|
tem1 = AP;
|
|
TEM2 = tem1 + CST;
|
|
AP = TEM2;
|
|
sequence and update cfun->va_list_gpr_size. Return true if found. */
|
|
|
|
static bool
|
|
va_list_ptr_write (struct stdarg_info *si, tree ap, tree tem2)
|
|
{
|
|
unsigned HOST_WIDE_INT increment;
|
|
|
|
if (TREE_CODE (ap) != VAR_DECL
|
|
|| !bitmap_bit_p (si->va_list_vars, DECL_UID (ap)))
|
|
return false;
|
|
|
|
if (TREE_CODE (tem2) != SSA_NAME
|
|
|| bitmap_bit_p (si->va_list_vars, DECL_UID (SSA_NAME_VAR (tem2))))
|
|
return false;
|
|
|
|
if (si->compute_sizes <= 0)
|
|
return false;
|
|
|
|
increment = va_list_counter_bump (si, ap, tem2, true);
|
|
if (increment + 1 <= 1)
|
|
return false;
|
|
|
|
if (cfun->va_list_gpr_size + increment < VA_LIST_MAX_GPR_SIZE)
|
|
cfun->va_list_gpr_size += increment;
|
|
else
|
|
cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* If RHS is X, (some type *) X or X + CST for X a temporary variable
|
|
containing value of some va_list variable plus optionally some constant,
|
|
either set si->va_list_escapes or add LHS to si->va_list_escape_vars,
|
|
depending whether LHS is a function local temporary. */
|
|
|
|
static void
|
|
check_va_list_escapes (struct stdarg_info *si, tree lhs, tree rhs)
|
|
{
|
|
if (! POINTER_TYPE_P (TREE_TYPE (rhs)))
|
|
return;
|
|
|
|
if (((TREE_CODE (rhs) == POINTER_PLUS_EXPR
|
|
|| TREE_CODE (rhs) == PLUS_EXPR)
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 1)) == INTEGER_CST)
|
|
|| TREE_CODE (rhs) == NOP_EXPR
|
|
|| TREE_CODE (rhs) == CONVERT_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
if (TREE_CODE (rhs) != SSA_NAME
|
|
|| ! bitmap_bit_p (si->va_list_escape_vars,
|
|
DECL_UID (SSA_NAME_VAR (rhs))))
|
|
return;
|
|
|
|
if (TREE_CODE (lhs) != SSA_NAME || is_global_var (SSA_NAME_VAR (lhs)))
|
|
{
|
|
si->va_list_escapes = true;
|
|
return;
|
|
}
|
|
|
|
if (si->compute_sizes < 0)
|
|
{
|
|
si->compute_sizes = 0;
|
|
if (si->va_start_count == 1
|
|
&& reachable_at_most_once (si->bb, si->va_start_bb))
|
|
si->compute_sizes = 1;
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file,
|
|
"bb%d will %sbe executed at most once for each va_start "
|
|
"in bb%d\n", si->bb->index, si->compute_sizes ? "" : "not ",
|
|
si->va_start_bb->index);
|
|
}
|
|
|
|
/* For void * or char * va_list types, there is just one counter.
|
|
If va_arg is used in a loop, we don't know how many registers need
|
|
saving. */
|
|
if (! si->compute_sizes)
|
|
{
|
|
si->va_list_escapes = true;
|
|
return;
|
|
}
|
|
|
|
if (va_list_counter_bump (si, si->va_start_ap, lhs, true)
|
|
== (unsigned HOST_WIDE_INT) -1)
|
|
{
|
|
si->va_list_escapes = true;
|
|
return;
|
|
}
|
|
|
|
bitmap_set_bit (si->va_list_escape_vars,
|
|
DECL_UID (SSA_NAME_VAR (lhs)));
|
|
}
|
|
|
|
|
|
/* Check all uses of temporaries from si->va_list_escape_vars bitmap.
|
|
Return true if va_list might be escaping. */
|
|
|
|
static bool
|
|
check_all_va_list_escapes (struct stdarg_info *si)
|
|
{
|
|
basic_block bb;
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
block_stmt_iterator i;
|
|
|
|
for (i = bsi_start (bb); !bsi_end_p (i); bsi_next (&i))
|
|
{
|
|
tree stmt = bsi_stmt (i), use;
|
|
ssa_op_iter iter;
|
|
|
|
FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_ALL_USES)
|
|
{
|
|
if (! bitmap_bit_p (si->va_list_escape_vars,
|
|
DECL_UID (SSA_NAME_VAR (use))))
|
|
continue;
|
|
|
|
if (TREE_CODE (stmt) == GIMPLE_MODIFY_STMT)
|
|
{
|
|
tree lhs = GIMPLE_STMT_OPERAND (stmt, 0);
|
|
tree rhs = GIMPLE_STMT_OPERAND (stmt, 1);
|
|
|
|
if (TREE_CODE (rhs) == WITH_SIZE_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
/* x = *ap_temp; */
|
|
if (TREE_CODE (rhs) == INDIRECT_REF
|
|
&& TREE_OPERAND (rhs, 0) == use
|
|
&& TYPE_SIZE_UNIT (TREE_TYPE (rhs))
|
|
&& host_integerp (TYPE_SIZE_UNIT (TREE_TYPE (rhs)), 1)
|
|
&& si->offsets[SSA_NAME_VERSION (use)] != -1)
|
|
{
|
|
unsigned HOST_WIDE_INT gpr_size;
|
|
tree access_size = TYPE_SIZE_UNIT (TREE_TYPE (rhs));
|
|
|
|
gpr_size = si->offsets[SSA_NAME_VERSION (use)]
|
|
+ tree_low_cst (access_size, 1);
|
|
if (gpr_size >= VA_LIST_MAX_GPR_SIZE)
|
|
cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
|
|
else if (gpr_size > cfun->va_list_gpr_size)
|
|
cfun->va_list_gpr_size = gpr_size;
|
|
continue;
|
|
}
|
|
|
|
/* va_arg sequences may contain
|
|
other_ap_temp = ap_temp;
|
|
other_ap_temp = ap_temp + constant;
|
|
other_ap_temp = (some_type *) ap_temp;
|
|
ap = ap_temp;
|
|
statements. */
|
|
if ((TREE_CODE (rhs) == POINTER_PLUS_EXPR
|
|
&& TREE_CODE (TREE_OPERAND (rhs, 1)) == INTEGER_CST)
|
|
|| TREE_CODE (rhs) == NOP_EXPR
|
|
|| TREE_CODE (rhs) == CONVERT_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
if (rhs == use)
|
|
{
|
|
if (TREE_CODE (lhs) == SSA_NAME
|
|
&& bitmap_bit_p (si->va_list_escape_vars,
|
|
DECL_UID (SSA_NAME_VAR (lhs))))
|
|
continue;
|
|
|
|
if (TREE_CODE (lhs) == VAR_DECL
|
|
&& bitmap_bit_p (si->va_list_vars,
|
|
DECL_UID (lhs)))
|
|
continue;
|
|
}
|
|
}
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fputs ("va_list escapes in ", dump_file);
|
|
print_generic_expr (dump_file, stmt, dump_flags);
|
|
fputc ('\n', dump_file);
|
|
}
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
|
|
/* Return true if this optimization pass should be done.
|
|
It makes only sense for stdarg functions. */
|
|
|
|
static bool
|
|
gate_optimize_stdarg (void)
|
|
{
|
|
/* This optimization is only for stdarg functions. */
|
|
return cfun->stdarg != 0;
|
|
}
|
|
|
|
|
|
/* Entry point to the stdarg optimization pass. */
|
|
|
|
static unsigned int
|
|
execute_optimize_stdarg (void)
|
|
{
|
|
basic_block bb;
|
|
bool va_list_escapes = false;
|
|
bool va_list_simple_ptr;
|
|
struct stdarg_info si;
|
|
const char *funcname = NULL;
|
|
|
|
cfun->va_list_gpr_size = 0;
|
|
cfun->va_list_fpr_size = 0;
|
|
memset (&si, 0, sizeof (si));
|
|
si.va_list_vars = BITMAP_ALLOC (NULL);
|
|
si.va_list_escape_vars = BITMAP_ALLOC (NULL);
|
|
|
|
if (dump_file)
|
|
funcname = lang_hooks.decl_printable_name (current_function_decl, 2);
|
|
|
|
va_list_simple_ptr = POINTER_TYPE_P (va_list_type_node)
|
|
&& (TREE_TYPE (va_list_type_node) == void_type_node
|
|
|| TREE_TYPE (va_list_type_node) == char_type_node);
|
|
gcc_assert (is_gimple_reg_type (va_list_type_node) == va_list_simple_ptr);
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
block_stmt_iterator i;
|
|
|
|
for (i = bsi_start (bb); !bsi_end_p (i); bsi_next (&i))
|
|
{
|
|
tree stmt = bsi_stmt (i);
|
|
tree call = get_call_expr_in (stmt), callee;
|
|
tree ap;
|
|
|
|
if (!call)
|
|
continue;
|
|
|
|
callee = get_callee_fndecl (call);
|
|
if (!callee
|
|
|| DECL_BUILT_IN_CLASS (callee) != BUILT_IN_NORMAL)
|
|
continue;
|
|
|
|
switch (DECL_FUNCTION_CODE (callee))
|
|
{
|
|
case BUILT_IN_VA_START:
|
|
break;
|
|
/* If old style builtins are used, don't optimize anything. */
|
|
case BUILT_IN_SAVEREGS:
|
|
case BUILT_IN_ARGS_INFO:
|
|
case BUILT_IN_NEXT_ARG:
|
|
va_list_escapes = true;
|
|
continue;
|
|
default:
|
|
continue;
|
|
}
|
|
|
|
si.va_start_count++;
|
|
ap = CALL_EXPR_ARG (call, 0);
|
|
|
|
if (TREE_CODE (ap) != ADDR_EXPR)
|
|
{
|
|
va_list_escapes = true;
|
|
break;
|
|
}
|
|
ap = TREE_OPERAND (ap, 0);
|
|
if (TREE_CODE (ap) == ARRAY_REF)
|
|
{
|
|
if (! integer_zerop (TREE_OPERAND (ap, 1)))
|
|
{
|
|
va_list_escapes = true;
|
|
break;
|
|
}
|
|
ap = TREE_OPERAND (ap, 0);
|
|
}
|
|
if (TYPE_MAIN_VARIANT (TREE_TYPE (ap))
|
|
!= TYPE_MAIN_VARIANT (va_list_type_node)
|
|
|| TREE_CODE (ap) != VAR_DECL)
|
|
{
|
|
va_list_escapes = true;
|
|
break;
|
|
}
|
|
|
|
if (is_global_var (ap))
|
|
{
|
|
va_list_escapes = true;
|
|
break;
|
|
}
|
|
|
|
bitmap_set_bit (si.va_list_vars, DECL_UID (ap));
|
|
|
|
/* VA_START_BB and VA_START_AP will be only used if there is just
|
|
one va_start in the function. */
|
|
si.va_start_bb = bb;
|
|
si.va_start_ap = ap;
|
|
}
|
|
|
|
if (va_list_escapes)
|
|
break;
|
|
}
|
|
|
|
/* If there were no va_start uses in the function, there is no need to
|
|
save anything. */
|
|
if (si.va_start_count == 0)
|
|
goto finish;
|
|
|
|
/* If some va_list arguments weren't local, we can't optimize. */
|
|
if (va_list_escapes)
|
|
goto finish;
|
|
|
|
/* For void * or char * va_list, something useful can be done only
|
|
if there is just one va_start. */
|
|
if (va_list_simple_ptr && si.va_start_count > 1)
|
|
{
|
|
va_list_escapes = true;
|
|
goto finish;
|
|
}
|
|
|
|
/* For struct * va_list, if the backend didn't tell us what the counter fields
|
|
are, there is nothing more we can do. */
|
|
if (!va_list_simple_ptr
|
|
&& va_list_gpr_counter_field == NULL_TREE
|
|
&& va_list_fpr_counter_field == NULL_TREE)
|
|
{
|
|
va_list_escapes = true;
|
|
goto finish;
|
|
}
|
|
|
|
/* For void * or char * va_list there is just one counter
|
|
(va_list itself). Use VA_LIST_GPR_SIZE for it. */
|
|
if (va_list_simple_ptr)
|
|
cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
|
|
|
|
calculate_dominance_info (CDI_DOMINATORS);
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
block_stmt_iterator i;
|
|
|
|
si.compute_sizes = -1;
|
|
si.bb = bb;
|
|
|
|
/* For va_list_simple_ptr, we have to check PHI nodes too. We treat
|
|
them as assignments for the purpose of escape analysis. This is
|
|
not needed for non-simple va_list because virtual phis don't perform
|
|
any real data movement. */
|
|
if (va_list_simple_ptr)
|
|
{
|
|
tree phi, lhs, rhs;
|
|
use_operand_p uop;
|
|
ssa_op_iter soi;
|
|
|
|
for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
|
|
{
|
|
lhs = PHI_RESULT (phi);
|
|
|
|
if (!is_gimple_reg (lhs))
|
|
continue;
|
|
|
|
FOR_EACH_PHI_ARG (uop, phi, soi, SSA_OP_USE)
|
|
{
|
|
rhs = USE_FROM_PTR (uop);
|
|
if (va_list_ptr_read (&si, rhs, lhs))
|
|
continue;
|
|
else if (va_list_ptr_write (&si, lhs, rhs))
|
|
continue;
|
|
else
|
|
check_va_list_escapes (&si, lhs, rhs);
|
|
|
|
if (si.va_list_escapes
|
|
|| walk_tree (&phi, find_va_list_reference,
|
|
si.va_list_vars, NULL))
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fputs ("va_list escapes in ", dump_file);
|
|
print_generic_expr (dump_file, phi, dump_flags);
|
|
fputc ('\n', dump_file);
|
|
}
|
|
va_list_escapes = true;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
for (i = bsi_start (bb);
|
|
!bsi_end_p (i) && !va_list_escapes;
|
|
bsi_next (&i))
|
|
{
|
|
tree stmt = bsi_stmt (i);
|
|
tree call;
|
|
|
|
/* Don't look at __builtin_va_{start,end}, they are ok. */
|
|
call = get_call_expr_in (stmt);
|
|
if (call)
|
|
{
|
|
tree callee = get_callee_fndecl (call);
|
|
|
|
if (callee
|
|
&& DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL
|
|
&& (DECL_FUNCTION_CODE (callee) == BUILT_IN_VA_START
|
|
|| DECL_FUNCTION_CODE (callee) == BUILT_IN_VA_END))
|
|
continue;
|
|
}
|
|
|
|
if (TREE_CODE (stmt) == GIMPLE_MODIFY_STMT)
|
|
{
|
|
tree lhs = GIMPLE_STMT_OPERAND (stmt, 0);
|
|
tree rhs = GIMPLE_STMT_OPERAND (stmt, 1);
|
|
|
|
if (TREE_CODE (rhs) == WITH_SIZE_EXPR)
|
|
rhs = TREE_OPERAND (rhs, 0);
|
|
|
|
if (va_list_simple_ptr)
|
|
{
|
|
/* Check for tem = ap. */
|
|
if (va_list_ptr_read (&si, rhs, lhs))
|
|
continue;
|
|
|
|
/* Check for the last insn in:
|
|
tem1 = ap;
|
|
tem2 = tem1 + CST;
|
|
ap = tem2;
|
|
sequence. */
|
|
else if (va_list_ptr_write (&si, lhs, rhs))
|
|
continue;
|
|
|
|
else
|
|
check_va_list_escapes (&si, lhs, rhs);
|
|
}
|
|
else
|
|
{
|
|
/* Check for ap[0].field = temp. */
|
|
if (va_list_counter_struct_op (&si, lhs, rhs, true))
|
|
continue;
|
|
|
|
/* Check for temp = ap[0].field. */
|
|
else if (va_list_counter_struct_op (&si, rhs, lhs, false))
|
|
continue;
|
|
|
|
/* Do any architecture specific checking. */
|
|
else if (targetm.stdarg_optimize_hook
|
|
&& targetm.stdarg_optimize_hook (&si, lhs, rhs))
|
|
continue;
|
|
}
|
|
}
|
|
|
|
/* All other uses of va_list are either va_copy (that is not handled
|
|
in this optimization), taking address of va_list variable or
|
|
passing va_list to other functions (in that case va_list might
|
|
escape the function and therefore va_start needs to set it up
|
|
fully), or some unexpected use of va_list. None of these should
|
|
happen in a gimplified VA_ARG_EXPR. */
|
|
if (si.va_list_escapes
|
|
|| walk_tree (&stmt, find_va_list_reference,
|
|
si.va_list_vars, NULL))
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
{
|
|
fputs ("va_list escapes in ", dump_file);
|
|
print_generic_expr (dump_file, stmt, dump_flags);
|
|
fputc ('\n', dump_file);
|
|
}
|
|
va_list_escapes = true;
|
|
}
|
|
}
|
|
|
|
if (va_list_escapes)
|
|
break;
|
|
}
|
|
|
|
if (! va_list_escapes
|
|
&& va_list_simple_ptr
|
|
&& ! bitmap_empty_p (si.va_list_escape_vars)
|
|
&& check_all_va_list_escapes (&si))
|
|
va_list_escapes = true;
|
|
|
|
finish:
|
|
if (va_list_escapes)
|
|
{
|
|
cfun->va_list_gpr_size = VA_LIST_MAX_GPR_SIZE;
|
|
cfun->va_list_fpr_size = VA_LIST_MAX_FPR_SIZE;
|
|
}
|
|
BITMAP_FREE (si.va_list_vars);
|
|
BITMAP_FREE (si.va_list_escape_vars);
|
|
free (si.offsets);
|
|
if (dump_file)
|
|
{
|
|
fprintf (dump_file, "%s: va_list escapes %d, needs to save ",
|
|
funcname, (int) va_list_escapes);
|
|
if (cfun->va_list_gpr_size >= VA_LIST_MAX_GPR_SIZE)
|
|
fputs ("all", dump_file);
|
|
else
|
|
fprintf (dump_file, "%d", cfun->va_list_gpr_size);
|
|
fputs (" GPR units and ", dump_file);
|
|
if (cfun->va_list_fpr_size >= VA_LIST_MAX_FPR_SIZE)
|
|
fputs ("all", dump_file);
|
|
else
|
|
fprintf (dump_file, "%d", cfun->va_list_fpr_size);
|
|
fputs (" FPR units.\n", dump_file);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
|
|
struct gimple_opt_pass pass_stdarg =
|
|
{
|
|
{
|
|
GIMPLE_PASS,
|
|
"stdarg", /* name */
|
|
gate_optimize_stdarg, /* gate */
|
|
execute_optimize_stdarg, /* execute */
|
|
NULL, /* sub */
|
|
NULL, /* next */
|
|
0, /* static_pass_number */
|
|
0, /* tv_id */
|
|
PROP_cfg | PROP_ssa | PROP_alias, /* properties_required */
|
|
0, /* properties_provided */
|
|
0, /* properties_destroyed */
|
|
0, /* todo_flags_start */
|
|
TODO_dump_func /* todo_flags_finish */
|
|
}
|
|
};
|