b5b8b0ac64
gcc/ChangeLog:
* doc/invoke.texi (-fvar-tracking-assignments): New.
(-fvar-tracking-assignments-toggle): New.
(-fdump-final-insns=file): Mark filename as optional.
(--param min-nondebug-insn-uid): New.
(-gdwarf-@{version}): Mention version 4.
* opts.c (common_handle_option): Accept it.
* tree-vrp.c (find_assert_locations_1): Skip debug stmts.
* regrename.c (regrename_optimize): Drop last. Don't count debug
insns as uses. Don't reject change because of debug insn.
(do_replace): Reject DEBUG_INSN as chain starter. Take base_regno
from the chain starter, and check for inexact matches in
DEBUG_INSNS.
(scan_rtx_reg): Accept inexact matches in DEBUG_INSNs.
(build_def_use): Simplify and fix the marking of DEBUG_INSNs.
* sched-ebb.c (schedule_ebbs): Skip boundary debug insns.
* fwprop.c (forward_propagate_and_simplify): ...into debug insns.
* doc/gimple.texi (is_gimple_debug): New.
(gimple_debug_bind_p): New.
(is_gimple_call, gimple_assign_cast_p): End sentence with period.
* doc/install.texi (bootstrap-debug): More details.
(bootstrap-debug-big, bootstrap-debug-lean): Document.
(bootstrap-debug-lib): More details.
(bootstrap-debug-ckovw): Update.
(bootstrap-time): New.
* tree-into-ssa.c (mark_def_sites): Skip debug stmts.
(insert_phi_nodes_for): Insert debug stmts.
(rewrite_stmt): Take iterator. Insert debug stmts.
(rewrite_enter_block): Adjust.
(maybe_replace_use_in_debug_stmt): New.
(rewrite_update_stmt): Use it.
(mark_use_interesting): Return early for debug stmts.
* tree-ssa-loop-im.c (rewrite_bittest): Propagate DEFs into debug
stmts before replacing stmt.
(move_computations_stmt): Likewise.
* ira-conflicts.c (add_copies): Skip debug insns.
* regstat.c (regstat_init_n_sets_and_refs): Discount debug insns.
(regstat_bb_compute_ri): Skip debug insns.
* tree-ssa-threadupdate.c (redirection_block_p): Skip debug stmts.
* tree-ssa-loop-manip.c (find_uses_to_rename_stmt,
check_loop_closed_ssa_stmt): Skip debug stmts.
* tree-tailcall.c (find_tail_calls): Likewise.
* tree-ssa-loop-ch.c (should_duplicate_loop_header_p): Likewise.
* tree.h (MAY_HAVE_DEBUG_STMTS): New.
(build_var_debug_value_stat): Declare.
(build_var_debug_value): Define.
(target_for_debug_bind): Declare.
* reload.c (find_equiv_reg): Skip debug insns.
* rtlanal.c (reg_used_between_p): Skip debug insns.
(side_effects_p): Likewise.
(canonicalize_condition): Likewise.
* ddg.c (create_ddg_dep_from_intra_loop_link): Check that non-debug
insns never depend on debug insns.
(create_ddg_dep_no_link): Likewise.
(add_cross_iteration_register_deps): Use ANTI_DEP for debug insns.
Don't add inter-loop dependencies for debug insns.
(build_intra_loop_deps): Likewise.
(create_ddg): Count debug insns.
* ddg.h (struct ddg::num_debug): New.
(num_backarcs): Pair up with previous int field.
* diagnostic.c (diagnostic_report_diagnostic): Skip notes on
-fcompare-debug-second.
* final.c (get_attr_length_1): Skip debug insns.
(rest_of_clean_state): Don't dump CFA_RESTORE_STATE.
* gcc.c (invoke_as): Call compare-debug-dump-opt.
(driver_self_specs): Map -fdump-final-insns to
-fdump-final-insns=..
(get_local_tick): New.
(compare_debug_dump_opt_spec_function): Test for . argument and
compute output name. Compute temp output spec without flag name.
Compute -frandom-seed.
(OPT): Undef after use.
* cfgloopanal.c (num_loop_insns): Skip debug insns.
(average_num_loop_insns): Likewise.
* params.h (MIN_NONDEBUG_INSN_UID): New.
* gimple.def (GIMPLE_DEBUG): New.
* ipa-reference.c (scan_stmt_for_static_refs): Skip debug stmts.
* auto-inc-dec.c (merge_in_block): Skip debug insns.
(merge_in_block): Fix whitespace.
* toplev.c (flag_var_tracking): Update comment.
(flag_var_tracking_assignments): New.
(flag_var_tracking_assignments_toggle): New.
(process_options): Don't open final insns dump file if we're not
going to write to it. Compute defaults for var_tracking.
* df-scan.c (df_insn_rescan_debug_internal): New.
(df_uses_record): Handle debug insns.
* haifa-sched.c (ready): Initialize n_debug.
(contributes_to_priority): Skip debug insns.
(dep_list_size): New.
(priority): Use it.
(rank_for_schedule): Likewise. Schedule debug insns as soon as
they're ready. Disregard previous debug insns to make decisions.
(queue_insn): Never queue debug insns.
(ready_add, ready_remove_first, ready_remove): Count debug insns.
(schedule_insn): Don't reject debug insns because of issue rate.
(get_ebb_head_tail, no_real_insns_p): Skip boundary debug insns.
(queue_to_ready): Skip and discount debug insns.
(choose_ready): Let debug insns through.
(schedule_block): Check boundary debug insns. Discount debug
insns, schedule them early. Adjust whitespace.
(set_priorities): Check for boundary debug insns.
(add_jump_dependencies): Use dep_list_size.
(prev_non_location_insn): New.
(check_cfg): Use it.
* tree-ssa-loop-ivopts.c (find_interesting_uses): Skip debug
stmts.
(remove_unused_ivs): Reset debug stmts.
* modulo-sched.c (const_iteration_count): Skip debug insns.
(res_MII): Discount debug insns.
(loop_single_full_bb_p): Skip debug insns.
(sms_schedule): Likewise.
(sms_schedule_by_order): Likewise.
(ps_has_conflicts): Likewise.
* caller-save.c (refmarker_fn): New.
(save_call_clobbered_regs): Replace regs with saved mem in
debug insns.
(mark_referenced_regs): Take pointer, mark and arg. Adjust.
Call refmarker_fn mark for hardregnos.
(mark_reg_as_referenced): New.
(replace_reg_with_saved_mem): New.
* ipa-pure-const.c (check_stmt): Skip debug stmts.
* cse.c (cse_insn): Canonicalize debug insns. Skip them when
searching back.
(cse_extended_basic_block): Skip debug insns.
(count_reg_usage): Likewise.
(is_dead_reg): New, split out of...
(set_live_p): ... here.
(insn_live_p): Use it for debug insns.
* tree-stdarg.c (check_all_va_list_escapes): Skip debug stmts.
(execute_optimize_stdarg): Likewise.
* tree-ssa-dom.c (propagate_rhs_into_lhs): Likewise.
* tree-ssa-propagate.c (substitute_and_fold): Don't regard
changes in debug stmts as changes.
* sel-sched.c (moving_insn_creates_bookkeeping_block_p): New.
(moveup_expr): Don't move across debug insns. Don't move
debug insn if it would create a bookkeeping block.
(moveup_expr_cached): Don't use cache for debug insns that
are heads of blocks.
(compute_av_set_inside_bb): Skip debug insns.
(sel_rank_for_schedule): Schedule debug insns first. Remove
dead code.
(block_valid_for_bookkeeping_p): Support lax searches.
(create_block_for_bookkeeping): Adjust block numbers when
encountering debug-only blocks.
(find_place_for_bookkeeping): Deal with debug-only blocks.
(generate_bookkeeping_insn): Accept no place to insert.
(remove_temp_moveop_nops): New argument full_tidying.
(prepare_place_to_insert): Deal with debug insns.
(advance_state_on_fence): Debug insns don't start cycles.
(update_boundaries): Take fence as argument. Deal with
debug insns.
(schedule_expr_on_boundary): No full_tidying on debug insns.
(fill_insns): Deal with debug insns.
(track_scheduled_insns_and_blocks): Don't count debug insns.
(need_nop_to_preserve_insn_bb): New, split out of...
(remove_insn_from_stream): ... this.
(fur_orig_expr_not_found): Skip debug insns.
* rtl.def (VALUE): Move up.
(DEBUG_INSN): New.
* tree-ssa-sink.c (all_immediate_uses_same_place): Skip debug
stmts.
(nearest_common_dominator_of_uses): Take debug_stmts argument.
Set it if debug stmts are found.
(statement_sink_location): Skip debug stmts. Propagate
moving defs into debug stmts.
* ifcvt.c (first_active_insn): Skip debug insns.
(last_active_insn): Likewise.
(cond_exec_process_insns): Likewise.
(noce_process_if_block): Likewise.
(check_cond_move_block): Likewise.
(cond_move_convert_if_block): Likewise.
(block_jumps_and_fallthru_p): Likewise.
(dead_or_predicable): Likewise.
* dwarf2out.c (debug_str_hash_forced): New.
(find_AT_string): Add comment.
(gen_label_for_indirect_string): New.
(get_debug_string_label): New.
(AT_string_form): Use it.
(mem_loc_descriptor): Handle non-TLS symbols. Handle MINUS, DIV,
MOD, AND, IOR, XOR, NOT, ABS, NEG, and CONST_STRING. Accept but
discard COMPARE, IF_THEN_ELSE, ROTATE, ROTATERT, TRUNCATE and
several operations that cannot be represented with DWARF opcodes.
(loc_descriptor): Ignore SIGN_EXTEND and ZERO_EXTEND. Require
dwarf_version 4 for DW_OP_implicit_value and DW_OP_stack_value.
(dwarf2out_var_location): Take during-call mark into account.
(output_indirect_string): Update comment. Output if there are
label and references.
(prune_indirect_string): New.
(prune_unused_types): Call it if debug_str_hash_forced.
More in dwarf2out.c, from Jakub Jelinek <jakub@redhat.com>:
(dw_long_long_const): Remove.
(struct dw_val_struct): Change val_long_long type to rtx.
(print_die, attr_checksum, same_dw_val_p, loc_descriptor): Adjust for
val_long_long change to CONST_DOUBLE rtx from a long hi/lo pair.
(output_die): Likewise. Use HOST_BITS_PER_WIDE_INT size of each
component instead of HOST_BITS_PER_LONG.
(output_loc_operands): Likewise. For const8* assert
HOST_BITS_PER_WIDE_INT rather than HOST_BITS_PER_LONG is >= 64.
(output_loc_operands_raw): For const8* assert HOST_BITS_PER_WIDE_INT
rather than HOST_BITS_PER_LONG is >= 64.
(add_AT_long_long): Remove val_hi and val_lo arguments, add
val_const_double.
(size_of_die): Use HOST_BITS_PER_WIDE_INT size multiplier instead of
HOST_BITS_PER_LONG for dw_val_class_long_long.
(add_const_value_attribute): Adjust add_AT_long_long caller. Don't
handle TLS SYMBOL_REFs. If CONST wraps a constant, tail recurse.
(dwarf_stack_op_name): Handle DW_OP_implicit_value and
DW_OP_stack_value.
(size_of_loc_descr, output_loc_operands, output_loc_operands_raw):
Handle DW_OP_implicit_value.
(extract_int): Move prototype earlier.
(mem_loc_descriptor): For SUBREG punt if inner
mode size is wider than DWARF2_ADDR_SIZE. Handle SIGN_EXTEND
and ZERO_EXTEND by DW_OP_shl and DW_OP_shr{a,}. Handle
EQ, NE, GT, GE, LT, LE, GTU, GEU, LTU, LEU, SMIN, SMAX, UMIN,
UMAX, SIGN_EXTRACT, ZERO_EXTRACT.
(loc_descriptor): Compare mode size with DWARF2_ADDR_SIZE
instead of Pmode size.
(loc_descriptor): Add MODE argument. Handle CONST_INT, CONST_DOUBLE,
CONST_VECTOR, CONST, LABEL_REF and SYMBOL_REF if mode != VOIDmode,
attempt to handle other expressions. Don't handle TLS SYMBOL_REFs.
(concat_loc_descriptor, concatn_loc_descriptor,
loc_descriptor_from_tree_1): Adjust loc_descriptor callers.
(add_location_or_const_value_attribute): Likewise. For single
location loc_lists attempt to use add_const_value_attribute
for constant decls. Add DW_AT_const_value even if
NOTE_VAR_LOCATION is VAR_LOCATION with CONSTANT_P or CONST_STRING
in its expression.
* cfgbuild.c (inside_basic_block_p): Handle debug insns.
(control_flow_insn_p): Likewise.
* tree-parloops.c (eliminate_local_variables_stmt): Handle debug
stmt.
(separate_decls_in_region_debug_bind): New.
(separate_decls_in_region): Process debug bind stmts afterwards.
* recog.c (verify_changes): Handle debug insns.
(extract_insn): Likewise.
(peephole2_optimize): Skip debug insns.
* dse.c (scan_insn): Skip debug insns.
* sel-sched-ir.c (return_nop_to_pool): Take full_tidying argument.
Pass it on.
(setup_id_for_insn): Handle debug insns.
(maybe_tidy_empty_bb): Adjust whitespace.
(tidy_control_flow): Skip debug insns.
(sel_remove_insn): Adjust for debug insns.
(sel_estimate_number_of_insns): Skip debug insns.
(create_insn_rtx_from_pattern): Handle debug insns.
(create_copy_of_insn_rtx): Likewise.
* sel-sched-ir.h (sel_bb_end): Declare.
(sel_bb_empty_or_nop_p): New.
(get_all_loop_exits): Use it.
(_eligible_successor_edge_p): Likewise.
(return_nop_to_pool): Adjust.
* tree-eh.c (tree_empty_eh_handler_p): Skip debug stmts.
* ira-lives.c (process_bb_node_lives): Skip debug insns.
* gimple-pretty-print.c (dump_gimple_debug): New.
(dump_gimple_stmt): Use it.
(dump_bb_header): Skip gimple debug stmts.
* regmove.c (optimize_reg_copy_1): Discount debug insns.
(fixup_match_2): Likewise.
(regmove_backward_pass): Likewise. Simplify combined
replacement. Handle debug insns.
* function.c (instantiate_virtual_regs): Handle debug insns.
* function.h (struct emit_status): Add x_cur_debug_insn_uid.
* print-rtl.h: Include cselib.h.
(print_rtx): Print VALUEs. Split out and recurse for
VAR_LOCATIONs.
* df.h (df_insn_rescan_debug_internal): Declare.
* gcse.c (alloc_hash_table): Estimate n_insns.
(cprop_insn): Don't regard debug insns as changes.
(bypass_conditional_jumps): Skip debug insns.
(one_pre_gcse_pass): Adjust.
(one_code_hoisting_pass): Likewise.
(compute_ld_motion_mems): Skip debug insns.
(one_cprop_pass): Adjust.
* tree-if-conv.c (tree_if_convert_stmt): Reset debug stmts.
(if_convertible_stmt_p): Handle debug stmts.
* init-regs.c (initialize_uninitialized_regs): Skip debug insns.
* tree-vect-loop.c (vect_is_simple_reduction): Skip debug stmts.
* ira-build.c (create_bb_allocnos): Skip debug insns.
* tree-flow-inline.h (has_zero_uses): Discount debug stmts.
(has_single_use): Likewise.
(single_imm_use): Likewise.
(num_imm_uses): Likewise.
* tree-ssa-phiopt.c (empty_block_p): Skip debug stmts.
* tree-ssa-coalesce.c (build_ssa_conflict_graph): Skip debug stmts.
(create_outofssa_var_map): Likewise.
* lower-subreg.c (adjust_decomposed_uses): New.
(resolve_debug): New.
(decompose_multiword_subregs): Use it.
* tree-dfa.c (find_referenced_vars): Skip debug stmts.
* emit-rtl.c: Include params.h.
(cur_debug_insn_uid): Define.
(set_new_first_and_last_insn): Set cur_debug_insn_uid too.
(copy_rtx_if_shared_1): Handle debug insns.
(reset_used_flags): Likewise.
(set_used_flags): Likewise.
(get_max_insn_count): New.
(next_nondebug_insn): New.
(prev_nondebug_insn): New.
(make_debug_insn_raw): New.
(emit_insn_before_noloc): Handle debug insns.
(emit_jump_insn_before_noloc): Likewise.
(emit_call_insn_before_noloc): Likewise.
(emit_debug_insn_before_noloc): New.
(emit_insn_after_noloc): Handle debug insns.
(emit_jump_insn_after_noloc): Likewise.
(emit_call_insn_after_noloc): Likewise.
(emit_debug_insn_after_noloc): Likewise.
(emit_insn_after): Take loc from earlier non-debug insn.
(emit_jump_insn_after): Likewise.
(emit_call_insn_after): Likewise.
(emit_debug_insn_after_setloc): New.
(emit_debug_insn_after): New.
(emit_insn_before): Take loc from later non-debug insn.
(emit_jump_insn_before): Likewise.
(emit_call_insn_before): Likewise.
(emit_debug_insn_before_setloc): New.
(emit_debug_insn_before): New.
(emit_insn): Handle debug insns.
(emit_debug_insn): New.
(emit_jump_insn): Handle debug insns.
(emit_call_insn): Likewise.
(emit): Likewise.
(init_emit): Take min-nondebug-insn-uid into account.
Initialize cur_debug_insn_uid.
(emit_copy_of_insn_after): Handle debug insns.
* cfgexpand.c (gimple_assign_rhs_to_tree): Do not overwrite
location of single rhs in place.
(maybe_dump_rtl_for_gimple_stmt): Dump lineno.
(floor_sdiv_adjust): New.
(ceil_sdiv_adjust): New.
(ceil_udiv_adjust): New.
(round_sdiv_adjust): New.
(round_udiv_adjust): New.
(wrap_constant): Moved from cselib.
(unwrap_constant): New.
(expand_debug_expr): New.
(expand_debug_locations): New.
(expand_gimple_basic_block): Drop hiding redeclaration. Expand
debug bind stmts.
(gimple_expand_cfg): Expand debug locations.
* cselib.c: Include tree-pass.h.
(struct expand_value_data): New.
(cselib_record_sets_hook): New.
(PRESERVED_VALUE_P, LONG_TERM_PRESERVED_VALUE_P): New.
(cselib_clear_table): Move, and implement in terms of...
(cselib_reset_table_with_next_value): ... this.
(cselib_get_next_unknown_value): New.
(discard_useless_locs): Don't discard preserved values.
(cselib_preserve_value): New.
(cselib_preserved_value_p): New.
(cselib_preserve_definitely): New.
(cselib_clear_preserve): New.
(cselib_preserve_only_values): New.
(new_cselib_val): Take rtx argument. Dump it in details.
(cselib_lookup_mem): Adjust.
(expand_loc): Take regs_active in struct. Adjust. Silence
dumps unless details are requested.
(cselib_expand_value_rtx_cb): New.
(cselib_expand_value_rtx): Rename and reimplement in terms of...
(cselib_expand_value_rtx_1): ... this. Adjust. Silence dumps
without details. Copy more subregs. Try to resolve values
using a callback. Wrap constants.
(cselib_subst_to_values): Adjust.
(cselib_log_lookup): New.
(cselib_lookup): Call it.
(cselib_invalidate_regno): Don't count preserved values as
useless.
(cselib_invalidate_mem): Likewise.
(cselib_record_set): Likewise.
(struct set): Renamed to cselib_set, moved to cselib.h.
(cselib_record_sets): Adjust. Call hook.
(cselib_process_insn): Reset table when it would be cleared.
(dump_cselib_val): New.
(dump_cselib_table): New.
* tree-cfgcleanup.c (tree_forwarded_block_p): Skip debug stmts.
(remove_forwarder_block): Support moving debug stmts.
* cselib.h (cselib_record_sets_hook): Declare.
(cselib_expand_callback): New type.
(cselib_expand_value_rtx_cb): Declare.
(cselib_reset_table_with_next_value): Declare.
(cselib_get_next_unknown_value): Declare.
(cselib_preserve_value): Declare.
(cselib_preserved_value_p): Declare.
(cselib_preserve_only_values): Declare.
(dump_cselib_table): Declare.
* cfgcleanup.c (flow_find_cross_jump): Skip debug insns.
(try_crossjump_to_edge): Likewise.
(delete_unreachable_blocks): Remove dominant GIMPLE blocks after
dominated blocks when debug stmts are present.
* simplify-rtx.c (delegitimize_mem_from_attrs): New.
* tree-ssa-live.c (remove_unused_locals): Skip debug stmts.
(set_var_live_on_entry): Likewise.
* loop-invariant.c (find_invariants_bb): Skip debug insns.
* cfglayout.c (curr_location, last_location): Make static.
(set_curr_insn_source_location): Don't avoid bouncing.
(get_curr_insn_source_location): New.
(get_curr_insn_block): New.
(duplicate_insn_chain): Handle debug insns.
* tree-ssa-forwprop.c (forward_propagate_addr_expr): Propagate
into debug stmts.
* common.opt (fcompare-debug): Move to sort order.
(fdump-unnumbered-links): Likewise.
(fvar-tracking-assignments): New.
(fvar-tracking-assignments-toggle): New.
* tree-ssa-dce.c (mark_stmt_necessary): Don't mark blocks
because of debug stmts.
(mark_stmt_if_obviously_necessary): Mark debug stmts.
(eliminate_unnecessary_stmts): Walk dominated blocks before
dominators.
* tree-ssa-ter.c (find_replaceable_in_bb): Skip debug stmts.
* ira.c (memref_used_between_p): Skip debug insns.
(update_equiv_regs): Likewise.
* sched-deps.c (sd_lists_size): Accept empty list.
(sd_init_insn): Mark debug insns.
(sd_finish_insn): Unmark them.
(sd_add_dep): Reject non-debug deps on debug insns.
(fixup_sched_groups): Give debug insns group treatment.
Skip debug insns.
(sched_analyze_reg): Don't mark debug insns for sched before call.
(sched_analyze_2): Handle debug insns.
(sched_analyze_insn): Compute next non-debug insn. Handle debug
insns.
(deps_analyze_insn): Handle debug insns.
(deps_start_bb): Skip debug insns.
(init_deps): Initialize last_debug_insn.
* tree-ssa.c (target_for_debug_bind): New.
(find_released_ssa_name): New.
(propagate_var_def_into_debug_stmts): New.
(propagate_defs_into_debug_stmts): New.
(verify_ssa): Skip debug bind stmts without values.
(warn_uninitialized_vars): Skip debug stmts.
* target-def.h (TARGET_DELEGITIMIZE_ADDRESS): Set default.
* rtl.c (rtx_equal_p_cb): Handle VALUEs.
(rtx_equal_p): Likewise.
* ira-costs.c (scan_one_insn): Skip debug insns.
(process_bb_node_for_hard_reg_moves): Likewise.
* rtl.h (DEBUG_INSN_P): New.
(NONDEBUG_INSN_P): New.
(MAY_HAVE_DEBUG_INSNS): New.
(INSN_P): Accept debug insns.
(RTX_FRAME_RELATED_P): Likewise.
(INSN_DELETED_P): Likewise.
(PAT_VAR_LOCATION_DECL): New.
(PAT_VAR_LOCATION_LOC): New.
(PAT_VAR_LOCATION_STATUS): New.
(NOTE_VAR_LOCATION_DECL): Reimplement.
(NOTE_VAR_LOCATION_LOC): Likewise.
(NOTE_VAR_LOCATION_STATUS): Likewise.
(INSN_VAR_LOCATION): New.
(INSN_VAR_LOCATION_DECL): New.
(INSN_VAR_LOCATION_LOC): New.
(INSN_VAR_LOCATION_STATUS): New.
(gen_rtx_UNKNOWN_VAR_LOC): New.
(VAR_LOC_UNKNOWN_P): New.
(NOTE_DURING_CALL_P): New.
(SCHED_GROUP_P): Accept debug insns.
(emit_debug_insn_before): Declare.
(emit_debug_insn_before_noloc): Declare.
(emit_debug_insn_before_setloc): Declare.
(emit_debug_insn_after): Declare.
(emit_debug_insn_after_noloc): Declare.
(emit_debug_insn_after_setloc): Declare.
(emit_debug_insn): Declare.
(make_debug_insn_raw): Declare.
(prev_nondebug_insn): Declare.
(next_nondebug_insn): Declare.
(delegitimize_mem_from_attrs): Declare.
(get_max_insn_count): Declare.
(wrap_constant): Declare.
(unwrap_constant): Declare.
(get_curr_insn_source_location): Declare.
(get_curr_insn_block): Declare.
* tree-inline.c (insert_debug_decl_map): New.
(processing_debug_stmt): New.
(remap_decl): Don't create new mappings in debug stmts.
(remap_gimple_op_r): Don't add references in debug stmts.
(copy_tree_body_r): Likewise.
(remap_gimple_stmt): Handle debug bind stmts.
(copy_bb): Skip debug stmts.
(copy_edges_for_bb): Likewise.
(copy_debug_stmt): New.
(copy_debug_stmts): New.
(copy_body): Copy debug stmts at the end.
(insert_init_debug_bind): New.
(insert_init_stmt): Take id. Skip and emit debug stmts.
(setup_one_parameter): Remap variable earlier, register debug
mapping.
(estimate_num_insns): Skip debug stmts.
(expand_call_inline): Preserve debug_map.
(optimize_inline_calls): Check for no debug_stmts left-overs.
(unsave_expr_now): Preserve debug_map.
(copy_gimple_seq_and_replace_locals): Likewise.
(tree_function_versioning): Check for no debug_stmts left-overs.
Init and destroy debug_map as needed. Split edges unconditionally.
(build_duplicate_type): Init and destroy debug_map as needed.
* tree-inline.h: Include gimple.h instead of pointer-set.h.
(struct copy_body_data): Add debug_stmts and debug_map.
* sched-int.h (struct ready_list): Add n_debug.
(struct deps): Add last_debug_insn.
(DEBUG_INSN_SCHED_P): New.
(BOUNDARY_DEBUG_INSN_P): New.
(SCHEDULE_DEBUG_INSN_P): New.
(sd_iterator_cond): Accept empty list.
* combine.c (create_log_links): Skip debug insns.
(combine_instructions): Likewise.
(cleanup_auto_inc_dec): New. From Jakub Jelinek: Make sure the
return value is always unshared.
(struct rtx_subst_pair): New.
(auto_adjust_pair): New.
(propagate_for_debug_subst): New.
(propagate_for_debug): New.
(try_combine): Skip debug insns. Propagate removed defs into
debug insns.
(next_nonnote_nondebug_insn): New.
(distribute_notes): Use it. Skip debug insns.
(distribute_links): Skip debug insns.
* tree-outof-ssa.c (set_location_for_edge): Likewise.
* resource.c (mark_target_live_regs): Likewise.
* var-tracking.c: Include cselib.h and target.h.
(enum micro_operation_type): Add MO_VAL_USE, MO_VAL_LOC, and
MO_VAL_SET.
(micro_operation_type_name): New.
(enum emit_note_where): Add EMIT_NOTE_AFTER_CALL_INSN.
(struct micro_operation_def): Update comments.
(decl_or_value): New type. Use instead of decls.
(struct emit_note_data_def): Add vars.
(struct attrs_def): Use decl_or_value.
(struct variable_tracking_info_def): Add permp, flooded.
(struct location_chain_def): Update comment.
(struct variable_part_def): Use decl_or_value.
(struct variable_def): Make var_part a variable length array.
(valvar_pool): New.
(scratch_regs): New.
(cselib_hook_called): New.
(dv_is_decl_p): New.
(dv_is_value_p): New.
(dv_as_decl): New.
(dv_as_value): New.
(dv_as_opaque): New.
(dv_onepart_p): New.
(dv_pool): New.
(IS_DECL_CODE): New.
(check_value_is_not_decl): New.
(dv_from_decl): New.
(dv_from_value): New.
(dv_htab_hash): New.
(variable_htab_hash): Use it.
(variable_htab_eq): Support values.
(variable_htab_free): Free from the right pool.
(attrs_list_member, attrs_list_insert): Use decl_or_value.
(attrs_list_union): Adjust.
(attrs_list_mpdv_union): New.
(tie_break_pointers): New.
(canon_value_cmp): New.
(unshare_variable): Return possibly-modified slot.
(vars_copy_1): Adjust.
(var_reg_decl_set): Adjust. Split out of...
(var_reg_set): ... this.
(get_init_value): Adjust.
(var_reg_delete_and_set): Adjust.
(var_reg_delete): Adjust.
(var_regno_delete): Adjust.
(var_mem_decl_set): Split out of...
(var_mem_set): ... this.
(var_mem_delete_and_set): Adjust.
(var_mem_delete): Adjust.
(val_store): New.
(val_reset): New.
(val_resolve): New.
(variable_union): Adjust. Speed up merge of 1-part vars.
(variable_canonicalize): Use unshared slot.
(VALUE_RECURSED_INTO): New.
(find_loc_in_1pdv): New.
(struct dfset_merge): New.
(insert_into_intersection): New.
(intersect_loc_chains): New.
(loc_cmp): New.
(canonicalize_loc_order_check): New.
(canonicalize_values_mark): New.
(canonicalize_values_star): New.
(variable_merge_over_cur): New.
(variable_merge_over_src): New.
(dataflow_set_merge): New.
(dataflow_set_equiv_regs): New.
(remove_duplicate_values): New.
(struct dfset_post_merge): New.
(variable_post_merge_new_vals): New.
(variable_post_merge_perm_vals): New.
(dataflow_post_merge_adjust): New.
(find_mem_expr_in_1pdv): New.
(dataflow_set_preserve_mem_locs): New.
(dataflow_set_remove_mem_locs): New.
(dataflow_set_clear_at_call): New.
(onepart_variable_different_p): New.
(variable_different_p): Use it.
(dataflow_set_different_1): Adjust. Make detailed dump
more verbose.
(track_expr_p): Add need_rtl parameter. Don't generate rtl
if not needed.
(track_loc_p): Pass it true.
(struct count_use_info): New.
(find_use_val): New.
(replace_expr_with_values): New.
(log_op_type): New.
(use_type): New, partially split out of...
(count_uses): ... this. Count new micro-ops.
(count_uses_1): Adjust.
(count_stores): Adjust.
(count_with_sets): New.
(VAL_NEEDS_RESOLUTION): New.
(VAL_HOLDS_TRACK_EXPR): New.
(VAL_EXPR_IS_COPIED): New.
(VAL_EXPR_IS_CLOBBERED): New.
(add_uses): Adjust. Generate new micro-ops.
(add_uses_1): Adjust.
(add_stores): Generate new micro-ops.
(add_with_sets): New.
(find_src_status): Adjust.
(find_src_set_src): Adjust.
(compute_bb_dataflow): Use dataflow_set_clear_at_call.
Handle new micro-ops. Canonicalize value equivalences.
(vt_find_locations): Compute total size of hash tables for
dumping. Perform merge for var-tracking-assignments. Don't
disregard single-block loops.
(dump_attrs_list): Handle decl_or_value.
(dump_variable): Take variable. Deal with decl_or_value.
(dump_variable_slot): New.
(dump_vars): Use it.
(dump_dataflow_sets): Adjust.
(set_slot_part): New, extended to support one-part variables
after splitting out of...
(set_variable_part): ... this.
(clobber_slot_part): New, split out of...
(clobber_variable_part): ... this.
(delete_slot_part): New, split out of...
(delete_variable_part): ... this.
(check_wrap_constant): New.
(vt_expand_loc_callback): New.
(vt_expand_loc): New.
(emit_note_insn_var_location): Adjust. Handle values. Handle
EMIT_NOTE_AFTER_CALL_INSN.
(emit_notes_for_differences_1): Adjust. Handle values.
(emit_notes_for_differences_2): Likewise.
(emit_notes_for_differences): Adjust.
(emit_notes_in_bb): Take pointer to set. Emit AFTER_CALL_INSN
notes. Adjust. Handle new micro-ops.
(vt_add_function_parameters): Adjust. Create and bind values.
(vt_initialize): Adjust. Initialize scratch_regs and
valvar_pool, flooded and permp. Initialize and use cselib. Log
operations. Move some code to count_with_sets and add_with_sets.
(delete_debug_insns): New.
(vt_debug_insns_local): New.
(vt_finalize): Release permp, valvar_pool, scratch_regs. Finish
cselib.
(variable_tracking_main): If var-tracking-assignments is enabled
but var-tracking isn't, delete debug insns and leave. Likewise
if we exceed limits or fail the stack adjustments tests, and
after all var-tracking processing.
More in var-tracking, from Jakub Jelinek <jakub@redhat.com>:
(dataflow_set): Add traversed_vars.
(value_chain, const_value_chain): New typedefs.
(value_chain_pool, value_chains): New variables.
(value_chain_htab_hash, value_chain_htab_eq, add_value_chain,
add_value_chains, add_cselib_value_chains, remove_value_chain,
remove_value_chains, remove_cselib_value_chains): New functions.
(shared_hash_find_slot_unshare_1, shared_hash_find_slot_1,
shared_hash_find_slot_noinsert_1, shared_hash_find_1): New
static inlines.
(shared_hash_find_slot_unshare, shared_hash_find_slot,
shared_hash_find_slot_noinsert, shared_hash_find): Update.
(dst_can_be_shared): New variable.
(unshare_variable): Unshare set->vars if shared, use shared_hash_*.
Clear dst_can_be_shared. If set->traversed_vars is non-NULL and
different from set->vars, look up slot again instead of using the
passed in slot.
(dataflow_set_init): Initialize traversed_vars.
(variable_union): Use shared_hash_*. Use initially NO_INSERT
lookup if set->vars is shared. Don't keep slot cleared before
calling unshare_variable. Unshare set->vars if needed. Adjust
unshare_variable callers. Clear dst_can_be_shared if needed.
Even ->refcount == 1 vars must be unshared if set->vars is shared
and var needs to be modified.
(dataflow_set_union): Set traversed_vars during canonicalization.
(VALUE_CHANGED, DECL_CHANGED): Define.
(set_dv_changed, dv_changed_p): New static inlines.
(track_expr_p): Clear DECL_CHANGED.
(dump_dataflow_sets): Set it.
(variable_was_changed): Call set_dv_changed.
(emit_note_insn_var_location): Likewise.
(changed_variables_stack): New variable.
(check_changed_vars_1, check_changed_vars_2): New functions.
(emit_notes_for_changes): Do nothing if changed_variables is
empty. Traverse changed_variables with check_changed_vars_1,
call check_changed_vars_2 on each changed_variables_stack entry.
(emit_notes_in_bb): Add SET argument. Just clear it at the
beginning, use it instead of local &set, don't destroy it at the
end.
(vt_emit_notes): Call dataflow_set_clear early on all
VTI(bb)->out sets, never use them, instead use emit_notes_in_bb
computed set, dataflow_set_clear also VTI(bb)->in when we are
done with the basic block. Initialize changed_variables_stack,
free it afterwards. If ENABLE_CHECKING verify that after noting
differences to an empty set value_chains hash table is empty.
(vt_initialize): Initialize value_chains and value_chain_pool.
(vt_finalize): Delete value_chains htab, free value_chain_pool.
(variable_tracking_main): Call dump_dataflow_sets before calling
vt_emit_notes, not after it.
* tree-flow.h (propagate_defs_into_debug_stmts): Declare.
(propagate_var_def_into_debug_stmts): Declare.
* df-problems.c (df_lr_bb_local_compute): Skip debug insns.
(df_set_note): Reject debug insns.
(df_whole_mw_reg_dead_p): Take added_notes_p argument. Don't
add notes to debug insns.
(df_note_bb_compute): Adjust. Likewise.
(df_simulate_uses): Skip debug insns.
(df_simulate_initialize_backwards): Likewise.
* reg-stack.c (subst_stack_regs_in_debug_insn): New.
(subst_stack_regs_pat): Reject debug insns.
(convert_regs_1): Handle debug insns.
* Makefile.in (TREE_INLINE_H): Take pointer-set.h from GIMPLE_H.
(print-rtl.o): Depend on cselib.h.
(cselib.o): Depend on TREE_PASS_H.
(var-tracking.o): Depend on cselib.h and TARGET_H.
* sched-rgn.c (rgn_estimate_number_of_insns): Discount
debug insns.
(init_ready_list): Skip boundary debug insns.
(add_branch_dependences): Skip debug insns.
(free_block_dependencies): Check for blocks with only debug
insns.
(compute_priorities): Likewise.
* gimple.c (gss_for_code): Handle GIMPLE_DEBUG.
(gimple_build_with_ops_stat): Take subcode as unsigned. Adjust
all callers.
(gimple_build_debug_bind_stat): New.
(empty_body_p): Skip debug stmts.
(gimple_has_side_effects): Likewise.
(gimple_rhs_has_side_effects): Likewise.
* gimple.h (enum gimple_debug_subcode, GIMPLE_DEBUG_BIND): New.
(gimple_build_debug_bind_stat): Declare.
(gimple_build_debug_bind): Define.
(is_gimple_debug): New.
(gimple_debug_bind_p): New.
(gimple_debug_bind_get_var): New.
(gimple_debug_bind_get_value): New.
(gimple_debug_bind_get_value_ptr): New.
(gimple_debug_bind_set_var): New.
(gimple_debug_bind_set_value): New.
(GIMPLE_DEBUG_BIND_NOVALUE): New internal temporary macro.
(gimple_debug_bind_reset_value): New.
(gimple_debug_bind_has_value_p): New.
(gsi_next_nondebug): New.
(gsi_prev_nondebug): New.
(gsi_start_nondebug_bb): New.
(gsi_last_nondebug_bb): New.
* sched-vis.c (print_pattern): Handle VAR_LOCATION.
(print_insn): Handle DEBUG_INSN.
* tree-cfg.c (remove_bb): Walk stmts backwards. Let loc
of first insn prevail.
(first_stmt): Skip debug stmts.
(first_non_label_stmt): Likewise.
(last_stmt): Likewise.
(has_zero_uses_1): New.
(single_imm_use_1): New.
(verify_gimple_debug): New.
(verify_types_in_gimple_stmt): Handle debug stmts.
(verify_stmt): Likewise.
(debug_loop_num): Skip debug stmts.
(remove_edge_and_dominated_blocks): Remove dominators last.
* tree-ssa-reassoc.c (rewrite_expr_tree): Propagate into
debug stmts.
(linearize_expr): Likewise.
* config/i386/i386.c (ix86_delegitimize_address): Call
default implementation.
* config/ia64/ia64.c (ia64_safe_itanium_class): Handle debug
insns.
(group_barrier_needed): Skip debug insns.
(emit_insn_group_barriers): Likewise.
(emit_all_insn_group_barriers): Likewise.
(ia64_variable_issue): Handle debug insns.
(ia64_dfa_new_cycle): Likewise.
(final_emit_insn_group_barriers): Skip debug insns.
(ia64_dwarf2out_def_steady_cfa): Take frame argument. Don't
def cfa without frame.
(process_set): Likewise.
(process_for_unwind_directive): Pass frame on.
* config/rs6000/rs6000.c (TARGET_DELEGITIMIZE_ADDRESS): Define.
(rs6000_delegitimize_address): New.
(rs6000_debug_adjust_cost): Handle debug insns.
(is_microcoded_insn): Likewise.
(is_cracked_insn): Likewise.
(is_nonpipeline_insn): Likewise.
(insn_must_be_first_in_group): Likewise.
(insn_must_be_last_in_group): Likewise.
(force_new_group): Likewise.
* cfgrtl.c (rtl_split_block): Emit INSN_DELETED note if block
contains only debug insns.
(rtl_merge_blocks): Skip debug insns.
(purge_dead_edges): Likewise.
(rtl_block_ends_with_call_p): Skip debug insns.
* dce.c (deletable_insn_p): Handle VAR_LOCATION.
(mark_reg_dependencies): Skip debug insns.
* params.def (PARAM_MIN_NONDEBUG_INSN_UID): New.
* tree-ssanames.c (release_ssa_name): Propagate def into
debug stmts.
* tree-ssa-threadedge.c
(record_temporary_equivalences_from_stmts): Skip debug stmts.
* regcprop.c (replace_oldest_value_addr): Skip debug insns.
(replace_oldest_value_mem): Use ALL_REGS for debug insns.
(copyprop_hardreg_forward_1): Handle debug insns.
* reload1.c (reload): Skip debug insns. Replace unassigned
pseudos in debug insns with their equivalences.
(eliminate_regs_in_insn): Skip debug insns.
(emit_input_reload_insns): Skip debug insns at first, adjust
them later.
* tree-ssa-operands.c (add_virtual_operand): Reject debug stmts.
(get_indirect_ref_operands): Pass opf_no_vops on.
(get_expr_operands): Likewise. Skip debug stmts.
(parse_ssa_operands): Scan debug insns with opf_no_vops.
gcc/testsuite/ChangeLog:
* gcc.dg/guality/guality.c: New.
* gcc.dg/guality/guality.h: New.
* gcc.dg/guality/guality.exp: New.
* gcc.dg/guality/example.c: New.
* lib/gcc-dg.exp (cleanup-dump): Remove .gk files.
(cleanup-saved-temps): Likewise, .gkd files too.
gcc/cp/ChangeLog:
* cp-tree.h (TFF_NO_OMIT_DEFAULT_TEMPLATE_ARGUMENTS): New.
* cp-lang.c (cxx_dwarf_name): Pass it.
* error.c (count_non_default_template_args): Take flags as
argument. Adjust all callers. Skip counting of default
arguments if the new flag is given.
ChangeLog:
* Makefile.tpl (BUILD_CONFIG): Default to bootstrap-debug.
* Makefile.in: Rebuilt.
contrib/ChangeLog:
* compare-debug: Look for .gkd files and compare them.
config/ChangeLog:
* bootstrap-debug.mk: Add comments.
* bootstrap-debug-big.mk: New.
* bootstrap-debug-lean.mk: New.
* bootstrap-debug-ckovw.mk: Add comments.
* bootstrap-debug-lib.mk: Drop CFLAGS for stages. Use -g0
for TFLAGS in stage1. Drop -fvar-tracking-assignments-toggle.
From-SVN: r151312
1369 lines
39 KiB
C
1369 lines
39 KiB
C
/* Move registers around to reduce number of move instructions needed.
|
|
Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997,
|
|
1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009
|
|
Free Software Foundation, Inc.
|
|
|
|
This file is part of GCC.
|
|
|
|
GCC is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free
|
|
Software Foundation; either version 3, or (at your option) any later
|
|
version.
|
|
|
|
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GCC; see the file COPYING3. If not see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
|
|
/* This module makes some simple RTL code transformations which
|
|
improve the subsequent register allocation. */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "tm.h"
|
|
#include "rtl.h" /* stdio.h must precede rtl.h for FFS. */
|
|
#include "tm_p.h"
|
|
#include "insn-config.h"
|
|
#include "recog.h"
|
|
#include "output.h"
|
|
#include "regs.h"
|
|
#include "hard-reg-set.h"
|
|
#include "flags.h"
|
|
#include "function.h"
|
|
#include "expr.h"
|
|
#include "basic-block.h"
|
|
#include "except.h"
|
|
#include "toplev.h"
|
|
#include "reload.h"
|
|
#include "timevar.h"
|
|
#include "tree-pass.h"
|
|
#include "df.h"
|
|
|
|
static int optimize_reg_copy_1 (rtx, rtx, rtx);
|
|
static void optimize_reg_copy_2 (rtx, rtx, rtx);
|
|
static void optimize_reg_copy_3 (rtx, rtx, rtx);
|
|
static void copy_src_to_dest (rtx, rtx, rtx);
|
|
|
|
/* How an insn operand is accessed; stored per operand in the USE array
   of struct match.  */
enum match_use
{
  /* The backward pass requires this for the source operand, which it
     describes as "read-only".  */
  READ,
  /* The backward pass requires this for the destination operand, which
     it describes as "write-only".  */
  WRITE,
  /* Presumably an operand that is both read and written.  */
  READWRITE
};
|
|
|
|
struct match {
|
|
int with[MAX_RECOG_OPERANDS];
|
|
enum match_use use[MAX_RECOG_OPERANDS];
|
|
int commutative[MAX_RECOG_OPERANDS];
|
|
int early_clobber[MAX_RECOG_OPERANDS];
|
|
};
|
|
|
|
static int find_matches (rtx, struct match *);
|
|
static int fixup_match_2 (rtx, rtx, rtx, rtx);
|
|
|
|
/* Return nonzero if registers with CLASS1 and CLASS2 can be merged without
|
|
causing too much register allocation problems. */
|
|
static int
|
|
regclass_compatible_p (enum reg_class class0, enum reg_class class1)
|
|
{
|
|
return (class0 == class1
|
|
|| (reg_class_subset_p (class0, class1)
|
|
&& ! CLASS_LIKELY_SPILLED_P (class0))
|
|
|| (reg_class_subset_p (class1, class0)
|
|
&& ! CLASS_LIKELY_SPILLED_P (class1)));
|
|
}
|
|
|
|
|
|
#ifdef AUTO_INC_DEC
|
|
|
|
/* Find the place in the rtx X where REG is used as a memory address.
|
|
Return the MEM rtx that so uses it.
|
|
If PLUSCONST is nonzero, search instead for a memory address equivalent to
|
|
(plus REG (const_int PLUSCONST)).
|
|
|
|
If such an address does not appear, return 0.
|
|
If REG appears more than once, or is used other than in such an address,
|
|
return (rtx) 1. */
|
|
|
|
static rtx
|
|
find_use_as_address (rtx x, rtx reg, HOST_WIDE_INT plusconst)
|
|
{
|
|
enum rtx_code code = GET_CODE (x);
|
|
const char * const fmt = GET_RTX_FORMAT (code);
|
|
int i;
|
|
rtx value = 0;
|
|
rtx tem;
|
|
|
|
if (code == MEM && XEXP (x, 0) == reg && plusconst == 0)
|
|
return x;
|
|
|
|
if (code == MEM && GET_CODE (XEXP (x, 0)) == PLUS
|
|
&& XEXP (XEXP (x, 0), 0) == reg
|
|
&& CONST_INT_P (XEXP (XEXP (x, 0), 1))
|
|
&& INTVAL (XEXP (XEXP (x, 0), 1)) == plusconst)
|
|
return x;
|
|
|
|
if (code == SIGN_EXTRACT || code == ZERO_EXTRACT)
|
|
{
|
|
/* If REG occurs inside a MEM used in a bit-field reference,
|
|
that is unacceptable. */
|
|
if (find_use_as_address (XEXP (x, 0), reg, 0) != 0)
|
|
return (rtx) (size_t) 1;
|
|
}
|
|
|
|
if (x == reg)
|
|
return (rtx) (size_t) 1;
|
|
|
|
for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
|
|
{
|
|
if (fmt[i] == 'e')
|
|
{
|
|
tem = find_use_as_address (XEXP (x, i), reg, plusconst);
|
|
if (value == 0)
|
|
value = tem;
|
|
else if (tem != 0)
|
|
return (rtx) (size_t) 1;
|
|
}
|
|
else if (fmt[i] == 'E')
|
|
{
|
|
int j;
|
|
for (j = XVECLEN (x, i) - 1; j >= 0; j--)
|
|
{
|
|
tem = find_use_as_address (XVECEXP (x, i, j), reg, plusconst);
|
|
if (value == 0)
|
|
value = tem;
|
|
else if (tem != 0)
|
|
return (rtx) (size_t) 1;
|
|
}
|
|
}
|
|
}
|
|
|
|
return value;
|
|
}
|
|
|
|
|
|
/* INC_INSN is an instruction that adds INCREMENT to REG.
|
|
Try to fold INC_INSN as a post/pre in/decrement into INSN.
|
|
Iff INC_INSN_SET is nonzero, inc_insn has a destination different from src.
|
|
Return nonzero for success. */
|
|
static int
|
|
try_auto_increment (rtx insn, rtx inc_insn, rtx inc_insn_set, rtx reg,
|
|
HOST_WIDE_INT increment, int pre)
|
|
{
|
|
enum rtx_code inc_code;
|
|
|
|
rtx pset = single_set (insn);
|
|
if (pset)
|
|
{
|
|
/* Can't use the size of SET_SRC, we might have something like
|
|
(sign_extend:SI (mem:QI ... */
|
|
rtx use = find_use_as_address (pset, reg, 0);
|
|
if (use != 0 && use != (rtx) (size_t) 1)
|
|
{
|
|
int size = GET_MODE_SIZE (GET_MODE (use));
|
|
if (0
|
|
|| (HAVE_POST_INCREMENT
|
|
&& pre == 0 && (inc_code = POST_INC, increment == size))
|
|
|| (HAVE_PRE_INCREMENT
|
|
&& pre == 1 && (inc_code = PRE_INC, increment == size))
|
|
|| (HAVE_POST_DECREMENT
|
|
&& pre == 0 && (inc_code = POST_DEC, increment == -size))
|
|
|| (HAVE_PRE_DECREMENT
|
|
&& pre == 1 && (inc_code = PRE_DEC, increment == -size))
|
|
)
|
|
{
|
|
if (inc_insn_set)
|
|
validate_change
|
|
(inc_insn,
|
|
&SET_SRC (inc_insn_set),
|
|
XEXP (SET_SRC (inc_insn_set), 0), 1);
|
|
validate_change (insn, &XEXP (use, 0),
|
|
gen_rtx_fmt_e (inc_code, Pmode, reg), 1);
|
|
if (apply_change_group ())
|
|
{
|
|
/* If there is a REG_DEAD note on this insn, we must
|
|
change this not to REG_UNUSED meaning that the register
|
|
is set, but the value is dead. Failure to do so will
|
|
result in sched1 dying -- when it recomputes lifetime
|
|
information, the number of REG_DEAD notes will have
|
|
changed. */
|
|
rtx note = find_reg_note (insn, REG_DEAD, reg);
|
|
if (note)
|
|
PUT_REG_NOTE_KIND (note, REG_UNUSED);
|
|
|
|
add_reg_note (insn, REG_INC, reg);
|
|
|
|
if (! inc_insn_set)
|
|
delete_insn (inc_insn);
|
|
return 1;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
#endif
|
|
|
|
|
|
/* Indexed by register number.  The forward pass stores here, for the
   destination of a register-register copy, the register number of the
   copy's source (or of that source's own recorded source, if it has one).
   A negative entry means that no source has been recorded.  */
static int *regno_src_regno;
|
|
|
|
/* INSN is a copy from SRC to DEST, both registers, and SRC does not die
|
|
in INSN.
|
|
|
|
Search forward to see if SRC dies before either it or DEST is modified,
|
|
but don't scan past the end of a basic block. If so, we can replace SRC
|
|
with DEST and let SRC die in INSN.
|
|
|
|
This will reduce the number of registers live in that range and may enable
|
|
DEST to be tied to SRC, thus often saving one register in addition to a
|
|
register-register copy. */
|
|
|
|
static int
|
|
optimize_reg_copy_1 (rtx insn, rtx dest, rtx src)
|
|
{
|
|
rtx p, q;
|
|
rtx note;
|
|
rtx dest_death = 0;
|
|
int sregno = REGNO (src);
|
|
int dregno = REGNO (dest);
|
|
basic_block bb = BLOCK_FOR_INSN (insn);
|
|
|
|
/* We don't want to mess with hard regs if register classes are small. */
|
|
if (sregno == dregno
|
|
|| (SMALL_REGISTER_CLASSES
|
|
&& (sregno < FIRST_PSEUDO_REGISTER
|
|
|| dregno < FIRST_PSEUDO_REGISTER))
|
|
/* We don't see all updates to SP if they are in an auto-inc memory
|
|
reference, so we must disallow this optimization on them. */
|
|
|| sregno == STACK_POINTER_REGNUM || dregno == STACK_POINTER_REGNUM)
|
|
return 0;
|
|
|
|
for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
|
|
{
|
|
if (! INSN_P (p))
|
|
continue;
|
|
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
|
|
if (reg_set_p (src, p) || reg_set_p (dest, p)
|
|
/* If SRC is an asm-declared register, it must not be replaced
|
|
in any asm. Unfortunately, the REG_EXPR tree for the asm
|
|
variable may be absent in the SRC rtx, so we can't check the
|
|
actual register declaration easily (the asm operand will have
|
|
it, though). To avoid complicating the test for a rare case,
|
|
we just don't perform register replacement for a hard reg
|
|
mentioned in an asm. */
|
|
|| (sregno < FIRST_PSEUDO_REGISTER
|
|
&& asm_noperands (PATTERN (p)) >= 0
|
|
&& reg_overlap_mentioned_p (src, PATTERN (p)))
|
|
/* Don't change hard registers used by a call. */
|
|
|| (CALL_P (p) && sregno < FIRST_PSEUDO_REGISTER
|
|
&& find_reg_fusage (p, USE, src))
|
|
/* Don't change a USE of a register. */
|
|
|| (GET_CODE (PATTERN (p)) == USE
|
|
&& reg_overlap_mentioned_p (src, XEXP (PATTERN (p), 0))))
|
|
break;
|
|
|
|
/* See if all of SRC dies in P. This test is slightly more
|
|
conservative than it needs to be. */
|
|
if ((note = find_regno_note (p, REG_DEAD, sregno)) != 0
|
|
&& GET_MODE (XEXP (note, 0)) == GET_MODE (src))
|
|
{
|
|
int failed = 0;
|
|
int d_length = 0;
|
|
int s_length = 0;
|
|
int d_n_calls = 0;
|
|
int s_n_calls = 0;
|
|
int s_freq_calls = 0;
|
|
int d_freq_calls = 0;
|
|
|
|
/* We can do the optimization. Scan forward from INSN again,
|
|
replacing regs as we go. Set FAILED if a replacement can't
|
|
be done. In that case, we can't move the death note for SRC.
|
|
This should be rare. */
|
|
|
|
/* Set to stop at next insn. */
|
|
for (q = next_real_insn (insn);
|
|
q != next_real_insn (p);
|
|
q = next_real_insn (q))
|
|
{
|
|
if (reg_overlap_mentioned_p (src, PATTERN (q)))
|
|
{
|
|
/* If SRC is a hard register, we might miss some
|
|
overlapping registers with validate_replace_rtx,
|
|
so we would have to undo it. We can't if DEST is
|
|
present in the insn, so fail in that combination
|
|
of cases. */
|
|
if (sregno < FIRST_PSEUDO_REGISTER
|
|
&& reg_mentioned_p (dest, PATTERN (q)))
|
|
failed = 1;
|
|
|
|
/* Attempt to replace all uses. */
|
|
else if (!validate_replace_rtx (src, dest, q))
|
|
failed = 1;
|
|
|
|
/* If this succeeded, but some part of the register
|
|
is still present, undo the replacement. */
|
|
else if (sregno < FIRST_PSEUDO_REGISTER
|
|
&& reg_overlap_mentioned_p (src, PATTERN (q)))
|
|
{
|
|
validate_replace_rtx (dest, src, q);
|
|
failed = 1;
|
|
}
|
|
}
|
|
|
|
/* For SREGNO, count the total number of insns scanned.
|
|
For DREGNO, count the total number of insns scanned after
|
|
passing the death note for DREGNO. */
|
|
if (!DEBUG_INSN_P (p))
|
|
{
|
|
s_length++;
|
|
if (dest_death)
|
|
d_length++;
|
|
}
|
|
|
|
/* If the insn in which SRC dies is a CALL_INSN, don't count it
|
|
as a call that has been crossed. Otherwise, count it. */
|
|
if (q != p && CALL_P (q))
|
|
{
|
|
/* Similarly, total calls for SREGNO, total calls beyond
|
|
the death note for DREGNO. */
|
|
s_n_calls++;
|
|
s_freq_calls += REG_FREQ_FROM_BB (BLOCK_FOR_INSN (q));
|
|
if (dest_death)
|
|
{
|
|
d_n_calls++;
|
|
d_freq_calls += REG_FREQ_FROM_BB (BLOCK_FOR_INSN (q));
|
|
}
|
|
}
|
|
|
|
/* If DEST dies here, remove the death note and save it for
|
|
later. Make sure ALL of DEST dies here; again, this is
|
|
overly conservative. */
|
|
if (dest_death == 0
|
|
&& (dest_death = find_regno_note (q, REG_DEAD, dregno)) != 0)
|
|
{
|
|
if (GET_MODE (XEXP (dest_death, 0)) != GET_MODE (dest))
|
|
failed = 1, dest_death = 0;
|
|
else
|
|
remove_note (q, dest_death);
|
|
}
|
|
}
|
|
|
|
if (! failed)
|
|
{
|
|
/* These counters need to be updated if and only if we are
|
|
going to move the REG_DEAD note. */
|
|
if (sregno >= FIRST_PSEUDO_REGISTER)
|
|
{
|
|
if (REG_LIVE_LENGTH (sregno) >= 0)
|
|
{
|
|
REG_LIVE_LENGTH (sregno) -= s_length;
|
|
/* REG_LIVE_LENGTH is only an approximation after
|
|
combine if sched is not run, so make sure that we
|
|
still have a reasonable value. */
|
|
if (REG_LIVE_LENGTH (sregno) < 2)
|
|
REG_LIVE_LENGTH (sregno) = 2;
|
|
}
|
|
|
|
REG_N_CALLS_CROSSED (sregno) -= s_n_calls;
|
|
REG_FREQ_CALLS_CROSSED (sregno) -= s_freq_calls;
|
|
}
|
|
|
|
/* Move death note of SRC from P to INSN. */
|
|
remove_note (p, note);
|
|
XEXP (note, 1) = REG_NOTES (insn);
|
|
REG_NOTES (insn) = note;
|
|
}
|
|
|
|
/* DEST is also dead if INSN has a REG_UNUSED note for DEST. */
|
|
if (! dest_death
|
|
&& (dest_death = find_regno_note (insn, REG_UNUSED, dregno)))
|
|
{
|
|
PUT_REG_NOTE_KIND (dest_death, REG_DEAD);
|
|
remove_note (insn, dest_death);
|
|
}
|
|
|
|
/* Put death note of DEST on P if we saw it die. */
|
|
if (dest_death)
|
|
{
|
|
XEXP (dest_death, 1) = REG_NOTES (p);
|
|
REG_NOTES (p) = dest_death;
|
|
|
|
if (dregno >= FIRST_PSEUDO_REGISTER)
|
|
{
|
|
/* If and only if we are moving the death note for DREGNO,
|
|
then we need to update its counters. */
|
|
if (REG_LIVE_LENGTH (dregno) >= 0)
|
|
REG_LIVE_LENGTH (dregno) += d_length;
|
|
REG_N_CALLS_CROSSED (dregno) += d_n_calls;
|
|
REG_FREQ_CALLS_CROSSED (dregno) += d_freq_calls;
|
|
}
|
|
}
|
|
|
|
return ! failed;
|
|
}
|
|
|
|
/* If SRC is a hard register which is set or killed in some other
|
|
way, we can't do this optimization. */
|
|
else if (sregno < FIRST_PSEUDO_REGISTER
|
|
&& dead_or_set_p (p, src))
|
|
break;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* INSN is a copy of SRC to DEST, in which SRC dies. See if we now have
|
|
a sequence of insns that modify DEST followed by an insn that sets
|
|
SRC to DEST in which DEST dies, with no prior modification of DEST.
|
|
(There is no need to check if the insns in between actually modify
|
|
DEST. We should not have cases where DEST is not modified, but
|
|
the optimization is safe if no such modification is detected.)
|
|
In that case, we can replace all uses of DEST, starting with INSN and
|
|
ending with the set of SRC to DEST, with SRC. We do not do this
|
|
optimization if a CALL_INSN is crossed unless SRC already crosses a
|
|
call or if DEST dies before the copy back to SRC.
|
|
|
|
It is assumed that DEST and SRC are pseudos; it is too complicated to do
|
|
this for hard registers since the substitutions we may make might fail. */
|
|
|
|
static void
|
|
optimize_reg_copy_2 (rtx insn, rtx dest, rtx src)
|
|
{
|
|
rtx p, q;
|
|
rtx set;
|
|
int sregno = REGNO (src);
|
|
int dregno = REGNO (dest);
|
|
basic_block bb = BLOCK_FOR_INSN (insn);
|
|
|
|
for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
|
|
{
|
|
if (! INSN_P (p))
|
|
continue;
|
|
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
|
|
set = single_set (p);
|
|
if (set && SET_SRC (set) == dest && SET_DEST (set) == src
|
|
&& find_reg_note (p, REG_DEAD, dest))
|
|
{
|
|
/* We can do the optimization. Scan forward from INSN again,
|
|
replacing regs as we go. */
|
|
|
|
/* Set to stop at next insn. */
|
|
for (q = insn; q != NEXT_INSN (p); q = NEXT_INSN (q))
|
|
if (INSN_P (q))
|
|
{
|
|
if (reg_mentioned_p (dest, PATTERN (q)))
|
|
{
|
|
rtx note;
|
|
|
|
PATTERN (q) = replace_rtx (PATTERN (q), dest, src);
|
|
note = FIND_REG_INC_NOTE (q, dest);
|
|
if (note)
|
|
{
|
|
remove_note (q, note);
|
|
add_reg_note (q, REG_INC, src);
|
|
}
|
|
df_insn_rescan (q);
|
|
}
|
|
|
|
if (CALL_P (q))
|
|
{
|
|
int freq = REG_FREQ_FROM_BB (BLOCK_FOR_INSN (q));
|
|
REG_N_CALLS_CROSSED (dregno)--;
|
|
REG_N_CALLS_CROSSED (sregno)++;
|
|
REG_FREQ_CALLS_CROSSED (dregno) -= freq;
|
|
REG_FREQ_CALLS_CROSSED (sregno) += freq;
|
|
}
|
|
}
|
|
|
|
remove_note (p, find_reg_note (p, REG_DEAD, dest));
|
|
REG_N_DEATHS (dregno)--;
|
|
remove_note (insn, find_reg_note (insn, REG_DEAD, src));
|
|
REG_N_DEATHS (sregno)--;
|
|
return;
|
|
}
|
|
|
|
if (reg_set_p (src, p)
|
|
|| find_reg_note (p, REG_DEAD, dest)
|
|
|| (CALL_P (p) && REG_N_CALLS_CROSSED (sregno) == 0))
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* INSN is a ZERO_EXTEND or SIGN_EXTEND of SRC to DEST.
|
|
Look if SRC dies there, and if it is only set once, by loading
|
|
it from memory. If so, try to incorporate the zero/sign extension
|
|
into the memory read, change SRC to the mode of DEST, and alter
|
|
the remaining accesses to use the appropriate SUBREG. This allows
|
|
SRC and DEST to be tied later. */
|
|
static void
|
|
optimize_reg_copy_3 (rtx insn, rtx dest, rtx src)
|
|
{
|
|
rtx src_reg = XEXP (src, 0);
|
|
int src_no = REGNO (src_reg);
|
|
int dst_no = REGNO (dest);
|
|
rtx p, set;
|
|
enum machine_mode old_mode;
|
|
basic_block bb = BLOCK_FOR_INSN (insn);
|
|
|
|
if (src_no < FIRST_PSEUDO_REGISTER
|
|
|| dst_no < FIRST_PSEUDO_REGISTER
|
|
|| ! find_reg_note (insn, REG_DEAD, src_reg)
|
|
|| REG_N_DEATHS (src_no) != 1
|
|
|| REG_N_SETS (src_no) != 1)
|
|
return;
|
|
|
|
for (p = PREV_INSN (insn); p && ! reg_set_p (src_reg, p); p = PREV_INSN (p))
|
|
if (INSN_P (p) && BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
|
|
if (! p || BLOCK_FOR_INSN (p) != bb)
|
|
return;
|
|
|
|
if (! (set = single_set (p))
|
|
|| !MEM_P (SET_SRC (set))
|
|
/* If there's a REG_EQUIV note, this must be an insn that loads an
|
|
argument. Prefer keeping the note over doing this optimization. */
|
|
|| find_reg_note (p, REG_EQUIV, NULL_RTX)
|
|
|| SET_DEST (set) != src_reg)
|
|
return;
|
|
|
|
/* Be conservative: although this optimization is also valid for
|
|
volatile memory references, that could cause trouble in later passes. */
|
|
if (MEM_VOLATILE_P (SET_SRC (set)))
|
|
return;
|
|
|
|
/* Do not use a SUBREG to truncate from one mode to another if truncation
|
|
is not a nop. */
|
|
if (GET_MODE_BITSIZE (GET_MODE (src_reg)) <= GET_MODE_BITSIZE (GET_MODE (src))
|
|
&& !TRULY_NOOP_TRUNCATION (GET_MODE_BITSIZE (GET_MODE (src)),
|
|
GET_MODE_BITSIZE (GET_MODE (src_reg))))
|
|
return;
|
|
|
|
old_mode = GET_MODE (src_reg);
|
|
PUT_MODE (src_reg, GET_MODE (src));
|
|
XEXP (src, 0) = SET_SRC (set);
|
|
|
|
/* Include this change in the group so that it's easily undone if
|
|
one of the changes in the group is invalid. */
|
|
validate_change (p, &SET_SRC (set), src, 1);
|
|
|
|
/* Now walk forward making additional replacements. We want to be able
|
|
to undo all the changes if a later substitution fails. */
|
|
while (p = NEXT_INSN (p), p != insn)
|
|
{
|
|
if (! INSN_P (p))
|
|
continue;
|
|
|
|
/* Make a tentative change. */
|
|
validate_replace_rtx_group (src_reg,
|
|
gen_lowpart_SUBREG (old_mode, src_reg),
|
|
p);
|
|
}
|
|
|
|
validate_replace_rtx_group (src, src_reg, insn);
|
|
|
|
/* Now see if all the changes are valid. */
|
|
if (! apply_change_group ())
|
|
{
|
|
/* One or more changes were no good. Back out everything. */
|
|
PUT_MODE (src_reg, old_mode);
|
|
XEXP (src, 0) = src_reg;
|
|
}
|
|
else
|
|
{
|
|
rtx note = find_reg_note (p, REG_EQUAL, NULL_RTX);
|
|
if (note)
|
|
remove_note (p, note);
|
|
}
|
|
}
|
|
|
|
|
|
/* If we were not able to update the users of src to use dest directly, try
|
|
instead moving the value to dest directly before the operation. */
|
|
|
|
static void
|
|
copy_src_to_dest (rtx insn, rtx src, rtx dest)
|
|
{
|
|
rtx seq;
|
|
rtx link;
|
|
rtx next;
|
|
rtx set;
|
|
rtx move_insn;
|
|
rtx *p_insn_notes;
|
|
rtx *p_move_notes;
|
|
int src_regno;
|
|
int dest_regno;
|
|
int insn_uid;
|
|
int move_uid;
|
|
|
|
/* A REG_LIVE_LENGTH of -1 indicates the register is equivalent to a constant
|
|
or memory location and is used infrequently; a REG_LIVE_LENGTH of -2 is
|
|
parameter when there is no frame pointer that is not allocated a register.
|
|
For now, we just reject them, rather than incrementing the live length. */
|
|
|
|
if (REG_P (src)
|
|
&& REG_LIVE_LENGTH (REGNO (src)) > 0
|
|
&& REG_P (dest)
|
|
&& REG_LIVE_LENGTH (REGNO (dest)) > 0
|
|
&& (set = single_set (insn)) != NULL_RTX
|
|
&& !reg_mentioned_p (dest, SET_SRC (set))
|
|
&& GET_MODE (src) == GET_MODE (dest))
|
|
{
|
|
int old_num_regs = reg_rtx_no;
|
|
|
|
/* Generate the src->dest move. */
|
|
start_sequence ();
|
|
emit_move_insn (dest, src);
|
|
seq = get_insns ();
|
|
end_sequence ();
|
|
/* If this sequence uses new registers, we may not use it. */
|
|
if (old_num_regs != reg_rtx_no
|
|
|| ! validate_replace_rtx (src, dest, insn))
|
|
{
|
|
/* We have to restore reg_rtx_no to its old value, lest
|
|
recompute_reg_usage will try to compute the usage of the
|
|
new regs, yet reg_n_info is not valid for them. */
|
|
reg_rtx_no = old_num_regs;
|
|
return;
|
|
}
|
|
emit_insn_before (seq, insn);
|
|
move_insn = PREV_INSN (insn);
|
|
p_move_notes = ®_NOTES (move_insn);
|
|
p_insn_notes = ®_NOTES (insn);
|
|
|
|
/* Move any notes mentioning src to the move instruction. */
|
|
for (link = REG_NOTES (insn); link != NULL_RTX; link = next)
|
|
{
|
|
next = XEXP (link, 1);
|
|
if (XEXP (link, 0) == src)
|
|
{
|
|
*p_move_notes = link;
|
|
p_move_notes = &XEXP (link, 1);
|
|
}
|
|
else
|
|
{
|
|
*p_insn_notes = link;
|
|
p_insn_notes = &XEXP (link, 1);
|
|
}
|
|
}
|
|
|
|
*p_move_notes = NULL_RTX;
|
|
*p_insn_notes = NULL_RTX;
|
|
|
|
insn_uid = INSN_UID (insn);
|
|
move_uid = INSN_UID (move_insn);
|
|
|
|
/* Update the various register tables. */
|
|
dest_regno = REGNO (dest);
|
|
INC_REG_N_SETS (dest_regno, 1);
|
|
REG_LIVE_LENGTH (dest_regno)++;
|
|
src_regno = REGNO (src);
|
|
if (! find_reg_note (move_insn, REG_DEAD, src))
|
|
REG_LIVE_LENGTH (src_regno)++;
|
|
}
|
|
}
|
|
|
|
/* reg_set_in_bb[REGNO] points to basic block iff the register is set
|
|
only once in the given block and has REG_EQUAL note. */
|
|
|
|
static basic_block *reg_set_in_bb;
|
|
|
|
/* Size of reg_set_in_bb array. */
|
|
static unsigned int max_reg_computed;
|
|
|
|
|
|
/* Return whether REG is set in only one location, and is set to a
|
|
constant, but is set in a different basic block from INSN (an
|
|
instructions which uses REG). In this case REG is equivalent to a
|
|
constant, and we don't want to break that equivalence, because that
|
|
may increase register pressure and make reload harder. If REG is
|
|
set in the same basic block as INSN, we don't worry about it,
|
|
because we'll probably need a register anyhow (??? but what if REG
|
|
is used in a different basic block as well as this one?). */
|
|
|
|
static bool
|
|
reg_is_remote_constant_p (rtx reg, rtx insn)
|
|
{
|
|
basic_block bb;
|
|
rtx p;
|
|
int max;
|
|
|
|
if (!reg_set_in_bb)
|
|
{
|
|
max_reg_computed = max = max_reg_num ();
|
|
reg_set_in_bb = XCNEWVEC (basic_block, max);
|
|
|
|
FOR_EACH_BB (bb)
|
|
FOR_BB_INSNS (bb, p)
|
|
{
|
|
rtx s;
|
|
|
|
if (!INSN_P (p))
|
|
continue;
|
|
s = single_set (p);
|
|
/* This is the instruction which sets REG. If there is a
|
|
REG_EQUAL note, then REG is equivalent to a constant. */
|
|
if (s != 0
|
|
&& REG_P (SET_DEST (s))
|
|
&& REG_N_SETS (REGNO (SET_DEST (s))) == 1
|
|
&& find_reg_note (p, REG_EQUAL, NULL_RTX))
|
|
reg_set_in_bb[REGNO (SET_DEST (s))] = bb;
|
|
}
|
|
}
|
|
|
|
gcc_assert (REGNO (reg) < max_reg_computed);
|
|
if (reg_set_in_bb[REGNO (reg)] == NULL)
|
|
return false;
|
|
return (reg_set_in_bb[REGNO (reg)] != BLOCK_FOR_INSN (insn));
|
|
}
|
|
|
|
/* INSN is adding a CONST_INT to a REG. We search backwards looking for
|
|
another add immediate instruction with the same source and dest registers,
|
|
and if we find one, we change INSN to an increment, and return 1. If
|
|
no changes are made, we return 0.
|
|
|
|
This changes
|
|
(set (reg100) (plus reg1 offset1))
|
|
...
|
|
(set (reg100) (plus reg1 offset2))
|
|
to
|
|
(set (reg100) (plus reg1 offset1))
|
|
...
|
|
(set (reg100) (plus reg100 offset2-offset1)) */
|
|
|
|
/* ??? What does this comment mean? */
|
|
/* cse disrupts preincrement / postdecrement sequences when it finds a
|
|
hard register as ultimate source, like the frame pointer. */
|
|
|
|
static int
|
|
fixup_match_2 (rtx insn, rtx dst, rtx src, rtx offset)
|
|
{
|
|
rtx p, dst_death = 0;
|
|
int length, num_calls = 0, freq_calls = 0;
|
|
basic_block bb = BLOCK_FOR_INSN (insn);
|
|
|
|
/* If SRC dies in INSN, we'd have to move the death note. This is
|
|
considered to be very unlikely, so we just skip the optimization
|
|
in this case. */
|
|
if (find_regno_note (insn, REG_DEAD, REGNO (src)))
|
|
return 0;
|
|
|
|
/* Scan backward to find the first instruction that sets DST. */
|
|
|
|
for (length = 0, p = PREV_INSN (insn); p; p = PREV_INSN (p))
|
|
{
|
|
rtx pset;
|
|
|
|
if (! INSN_P (p))
|
|
continue;
|
|
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
|
|
if (find_regno_note (p, REG_DEAD, REGNO (dst)))
|
|
dst_death = p;
|
|
if (! dst_death && !DEBUG_INSN_P (p))
|
|
length++;
|
|
|
|
pset = single_set (p);
|
|
if (pset && SET_DEST (pset) == dst
|
|
&& GET_CODE (SET_SRC (pset)) == PLUS
|
|
&& XEXP (SET_SRC (pset), 0) == src
|
|
&& CONST_INT_P (XEXP (SET_SRC (pset), 1)))
|
|
{
|
|
HOST_WIDE_INT newconst
|
|
= INTVAL (offset) - INTVAL (XEXP (SET_SRC (pset), 1));
|
|
rtx add = gen_add3_insn (dst, dst, GEN_INT (newconst));
|
|
|
|
if (add && validate_change (insn, &PATTERN (insn), add, 0))
|
|
{
|
|
/* Remove the death note for DST from DST_DEATH. */
|
|
if (dst_death)
|
|
{
|
|
remove_death (REGNO (dst), dst_death);
|
|
REG_LIVE_LENGTH (REGNO (dst)) += length;
|
|
REG_N_CALLS_CROSSED (REGNO (dst)) += num_calls;
|
|
REG_FREQ_CALLS_CROSSED (REGNO (dst)) += freq_calls;
|
|
}
|
|
|
|
if (dump_file)
|
|
fprintf (dump_file,
|
|
"Fixed operand of insn %d.\n",
|
|
INSN_UID (insn));
|
|
|
|
#ifdef AUTO_INC_DEC
|
|
for (p = PREV_INSN (insn); p; p = PREV_INSN (p))
|
|
{
|
|
if (! INSN_P (p))
|
|
continue;
|
|
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
if (reg_overlap_mentioned_p (dst, PATTERN (p)))
|
|
{
|
|
if (try_auto_increment (p, insn, 0, dst, newconst, 0))
|
|
return 1;
|
|
break;
|
|
}
|
|
}
|
|
for (p = NEXT_INSN (insn); p; p = NEXT_INSN (p))
|
|
{
|
|
if (! INSN_P (p))
|
|
continue;
|
|
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
if (reg_overlap_mentioned_p (dst, PATTERN (p)))
|
|
{
|
|
try_auto_increment (p, insn, 0, dst, newconst, 1);
|
|
break;
|
|
}
|
|
}
|
|
#endif
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
if (reg_set_p (dst, PATTERN (p)))
|
|
break;
|
|
|
|
/* If we have passed a call instruction, and the
|
|
pseudo-reg SRC is not already live across a call,
|
|
then don't perform the optimization. */
|
|
/* reg_set_p is overly conservative for CALL_INSNS, thinks that all
|
|
hard regs are clobbered. Thus, we only use it for src for
|
|
non-call insns. */
|
|
if (CALL_P (p))
|
|
{
|
|
if (! dst_death)
|
|
{
|
|
num_calls++;
|
|
freq_calls += REG_FREQ_FROM_BB (BLOCK_FOR_INSN (p));
|
|
}
|
|
|
|
if (REG_N_CALLS_CROSSED (REGNO (src)) == 0)
|
|
break;
|
|
|
|
if (call_used_regs [REGNO (dst)]
|
|
|| find_reg_fusage (p, CLOBBER, dst))
|
|
break;
|
|
}
|
|
else if (reg_set_p (src, PATTERN (p)))
|
|
break;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* A forward pass. Replace output operands with input operands. */
|
|
|
|
static void
|
|
regmove_forward_pass (void)
|
|
{
|
|
basic_block bb;
|
|
rtx insn;
|
|
|
|
if (! flag_expensive_optimizations)
|
|
return;
|
|
|
|
if (dump_file)
|
|
fprintf (dump_file, "Starting forward pass...\n");
|
|
|
|
FOR_EACH_BB (bb)
|
|
{
|
|
FOR_BB_INSNS (bb, insn)
|
|
{
|
|
rtx set = single_set (insn);
|
|
if (! set)
|
|
continue;
|
|
|
|
if ((GET_CODE (SET_SRC (set)) == SIGN_EXTEND
|
|
|| GET_CODE (SET_SRC (set)) == ZERO_EXTEND)
|
|
&& REG_P (XEXP (SET_SRC (set), 0))
|
|
&& REG_P (SET_DEST (set)))
|
|
optimize_reg_copy_3 (insn, SET_DEST (set), SET_SRC (set));
|
|
|
|
if (REG_P (SET_SRC (set))
|
|
&& REG_P (SET_DEST (set)))
|
|
{
|
|
/* If this is a register-register copy where SRC is not dead,
|
|
see if we can optimize it. If this optimization succeeds,
|
|
it will become a copy where SRC is dead. */
|
|
if ((find_reg_note (insn, REG_DEAD, SET_SRC (set))
|
|
|| optimize_reg_copy_1 (insn, SET_DEST (set), SET_SRC (set)))
|
|
&& REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
|
|
{
|
|
/* Similarly for a pseudo-pseudo copy when SRC is dead. */
|
|
if (REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER)
|
|
optimize_reg_copy_2 (insn, SET_DEST (set), SET_SRC (set));
|
|
if (regno_src_regno[REGNO (SET_DEST (set))] < 0
|
|
&& SET_SRC (set) != SET_DEST (set))
|
|
{
|
|
int srcregno = REGNO (SET_SRC (set));
|
|
if (regno_src_regno[srcregno] >= 0)
|
|
srcregno = regno_src_regno[srcregno];
|
|
regno_src_regno[REGNO (SET_DEST (set))] = srcregno;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* A backward pass. Replace input operands with output operands.

   Visits every basic block in reverse order and, inside each block,
   every insn in reverse order. For each insn for which find_matches
   reports matching constraints, the operands are searched for a source
   operand SRC that is required to match a destination operand DST.
   The insns preceding INSN in the same block are then scanned backward
   for the insn P that sets SRC. When P is found and both changes
   validate, P is changed to set DST and SRC is replaced by DST in INSN;
   the REG_DEAD notes and the register statistics (REG_N_SETS,
   REG_N_CALLS_CROSSED, REG_FREQ_CALLS_CROSSED, REG_LIVE_LENGTH) are
   then updated to match.

   If no operand of INSN could be fixed this way but a candidate pair was
   recorded in copy_src/copy_dst, copy_src_to_dest is called instead.

   Takes no arguments and returns nothing; progress messages are written
   to dump_file when it is set. */
|
|
|
|
static void
|
|
regmove_backward_pass (void)
|
|
{
|
|
basic_block bb;
|
|
rtx insn, prev;
|
|
|
|
if (dump_file)
|
|
fprintf (dump_file, "Starting backward pass...\n");
|
|
|
|
FOR_EACH_BB_REVERSE (bb)
|
|
{
|
|
/* ??? Use the safe iterator because fixup_match_2 can remove
   insns via try_auto_increment. */
|
|
FOR_BB_INSNS_REVERSE_SAFE (bb, insn, prev)
|
|
{
|
|
struct match match;
|
|
rtx copy_src, copy_dst;
|
|
int op_no, match_no;
|
|
int success = 0;
|
|
|
|
if (! INSN_P (insn))
|
|
continue;
|
|
|
|
if (! find_matches (insn, &match))
|
|
continue;
|
|
|
|
/* Now scan through the operands looking for a destination operand
   which is supposed to match a source operand.
   Then scan backward for an instruction which sets the source
   operand. If safe, then replace the source operand with the
   dest operand in both instructions. */
|
|
|
|
/* copy_src/copy_dst remember the first candidate pair that was
   rejected below; they feed the copy_src_to_dest fallback at the end
   of this insn's processing. */
copy_src = NULL_RTX;
|
|
copy_dst = NULL_RTX;
|
|
for (op_no = 0; op_no < recog_data.n_operands; op_no++)
|
|
{
|
|
rtx set, p, src, dst;
|
|
rtx src_note, dst_note;
|
|
int num_calls = 0, freq_calls = 0;
|
|
enum reg_class src_class, dst_class;
|
|
int length;
|
|
|
|
match_no = match.with[op_no];
|
|
|
|
/* Nothing to do if the two operands aren't supposed to match. */
|
|
if (match_no < 0)
|
|
continue;
|
|
|
|
dst = recog_data.operand[match_no];
|
|
src = recog_data.operand[op_no];
|
|
|
|
if (!REG_P (src))
|
|
continue;
|
|
|
|
/* DST must be a pseudo register with a non-negative REG_LIVE_LENGTH
   and the same mode as SRC. */
if (!REG_P (dst)
|
|
|| REGNO (dst) < FIRST_PSEUDO_REGISTER
|
|
|| REG_LIVE_LENGTH (REGNO (dst)) < 0
|
|
|| GET_MODE (src) != GET_MODE (dst))
|
|
continue;
|
|
|
|
/* If the operands already match, then there is nothing to do. */
|
|
if (operands_match_p (src, dst))
|
|
continue;
|
|
|
|
/* Likewise if the operand paired with SRC by a commutative
   constraint already matches DST. */
if (match.commutative[op_no] >= 0)
|
|
{
|
|
rtx comm = recog_data.operand[match.commutative[op_no]];
|
|
if (operands_match_p (comm, dst))
|
|
continue;
|
|
}
|
|
|
|
set = single_set (insn);
|
|
if (! set)
|
|
continue;
|
|
|
|
/* Note that single_set ignores parts of a parallel set for
   which one of the destinations is REG_UNUSED. We can't
   handle that here, since we can wind up rewriting things
   such that a single register is set twice within a single
   parallel. */
|
|
if (reg_set_p (src, insn))
|
|
continue;
|
|
|
|
/* match_no/dst must be a write-only operand, and
   op_no/src must be a read-only operand. */
|
|
if (match.use[op_no] != READ
|
|
|| match.use[match_no] != WRITE)
|
|
continue;
|
|
|
|
/* An early-clobber DST cannot be used when SRC occurs more than
   once in the pattern of INSN. */
if (match.early_clobber[match_no]
|
|
&& count_occurrences (PATTERN (insn), src, 0) > 1)
|
|
continue;
|
|
|
|
/* Make sure match_no is the destination. */
|
|
if (recog_data.operand[match_no] != SET_DEST (set))
|
|
continue;
|
|
|
|
/* SRC is not a pseudo register: the only case attempted is
   DST = SRC + constant, which is handed to fixup_match_2. When that
   succeeds, processing of this insn's operands stops. */
if (REGNO (src) < FIRST_PSEUDO_REGISTER)
|
|
{
|
|
if (GET_CODE (SET_SRC (set)) == PLUS
|
|
&& CONST_INT_P (XEXP (SET_SRC (set), 1))
|
|
&& XEXP (SET_SRC (set), 0) == src
|
|
&& fixup_match_2 (insn, dst, src,
|
|
XEXP (SET_SRC (set), 1)))
|
|
break;
|
|
continue;
|
|
}
|
|
src_class = reg_preferred_class (REGNO (src));
|
|
dst_class = reg_preferred_class (REGNO (dst));
|
|
|
|
if (! (src_note = find_reg_note (insn, REG_DEAD, src)))
|
|
{
|
|
/* We used to force the copy here like in other cases, but
   it produces worse code, as it eliminates no copy
   instructions and the copy emitted will be produced by
   reload anyway. On patterns with multiple alternatives,
   there may be better solution available.

   In particular this change produced slower code for numeric
   i387 programs. */
|
|
|
|
continue;
|
|
}
|
|
|
|
if (! regclass_compatible_p (src_class, dst_class))
|
|
{
|
|
if (!copy_src)
|
|
{
|
|
copy_src = src;
|
|
copy_dst = dst;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
/* Can not modify an earlier insn to set dst if this insn
   uses an old value in the source. */
|
|
if (reg_overlap_mentioned_p (dst, SET_SRC (set)))
|
|
{
|
|
if (!copy_src)
|
|
{
|
|
copy_src = src;
|
|
copy_dst = dst;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
/* If src is set once in a different basic block,
   and is set equal to a constant, then do not use
   it for this optimization, as this would make it
   no longer equivalent to a constant. */
|
|
|
|
if (reg_is_remote_constant_p (src, insn))
|
|
{
|
|
if (!copy_src)
|
|
{
|
|
copy_src = src;
|
|
copy_dst = dst;
|
|
}
|
|
continue;
|
|
}
|
|
|
|
|
|
if (dump_file)
|
|
fprintf (dump_file,
|
|
"Could fix operand %d of insn %d matching operand %d.\n",
|
|
op_no, INSN_UID (insn), match_no);
|
|
|
|
/* Scan backward to find the first instruction that uses
   the input operand. If the operand is set here, then
   replace it in both instructions with match_no. */
|
|
|
|
for (length = 0, p = PREV_INSN (insn); p; p = PREV_INSN (p))
|
|
{
|
|
rtx pset;
|
|
|
|
if (! INSN_P (p))
|
|
continue;
|
|
/* Never scan past the start of the current basic block. */
if (BLOCK_FOR_INSN (p) != bb)
|
|
break;
|
|
|
|
/* LENGTH counts the non-debug insns scanned; it is used below to
   adjust REG_LIVE_LENGTH for DST and SRC. */
if (!DEBUG_INSN_P (p))
|
|
length++;
|
|
|
|
/* ??? See if all of SRC is set in P. This test is much
   more conservative than it needs to be. */
|
|
pset = single_set (p);
|
|
if (pset && SET_DEST (pset) == src)
|
|
{
|
|
/* We use validate_replace_rtx, in case there
   are multiple identical source operands. All
   of them have to be changed at the same time:
   when validate_replace_rtx() calls
   apply_change_group(). */
|
|
validate_change (p, &SET_DEST (pset), dst, 1);
|
|
if (validate_replace_rtx (src, dst, insn))
|
|
success = 1;
|
|
break;
|
|
}
|
|
|
|
/* We can't make this change if SRC is read or
   partially written in P, since we are going to
   eliminate SRC. We can't make this change
   if DST is mentioned at all in P,
   since we are going to change its value.

   Debug insns do not stop the scan: they are adjusted as part of
   the pending change group instead.

   NOTE(review): for a debug insn P that mentions SRC, the call
   below passes (dst, src, insn), i.e. presumably replaces DST
   with SRC in INSN rather than touching P. That looks inverted
   relative to validate_replace_rtx (src, dst, insn) above, where
   one would expect SRC to be replaced by DST in P -- confirm the
   intent before relying on it. */
|
|
if (reg_overlap_mentioned_p (src, PATTERN (p)))
|
|
{
|
|
if (DEBUG_INSN_P (p))
|
|
validate_replace_rtx_group (dst, src, insn);
|
|
else
|
|
break;
|
|
}
|
|
/* A debug insn that mentions DST gets its variable location
   replaced by gen_rtx_UNKNOWN_VAR_LOC (), queued in the group. */
if (reg_mentioned_p (dst, PATTERN (p)))
|
|
{
|
|
if (DEBUG_INSN_P (p))
|
|
validate_change (p, &INSN_VAR_LOCATION_LOC (p),
|
|
gen_rtx_UNKNOWN_VAR_LOC (), 1);
|
|
else
|
|
break;
|
|
}
|
|
|
|
/* If we have passed a call instruction, and the
   pseudo-reg DST is not already live across a call,
   then don't perform the optimization. */
|
|
if (CALL_P (p))
|
|
{
|
|
num_calls++;
|
|
freq_calls += REG_FREQ_FROM_BB (BLOCK_FOR_INSN (p));
|
|
|
|
if (REG_N_CALLS_CROSSED (REGNO (dst)) == 0)
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* SUCCESS is only set inside the scan loop, immediately before a
   break, so P still designates the insn that set SRC here. */
if (success)
|
|
{
|
|
int dstno, srcno;
|
|
|
|
/* Remove the death note for SRC from INSN. */
|
|
remove_note (insn, src_note);
|
|
/* Move the death note for SRC to P if it is used
   there. */
|
|
if (reg_overlap_mentioned_p (src, PATTERN (p)))
|
|
{
|
|
XEXP (src_note, 1) = REG_NOTES (p);
|
|
REG_NOTES (p) = src_note;
|
|
}
|
|
/* If there is a REG_DEAD note for DST on P, then remove
   it, because DST is now set there. */
|
|
if ((dst_note = find_reg_note (p, REG_DEAD, dst)))
|
|
remove_note (p, dst_note);
|
|
|
|
dstno = REGNO (dst);
|
|
srcno = REGNO (src);
|
|
|
|
/* One set moved from SRC to DST. */
INC_REG_N_SETS (dstno, 1);
|
|
INC_REG_N_SETS (srcno, -1);
|
|
|
|
/* Transfer the calls counted during the scan from SRC to DST. */
REG_N_CALLS_CROSSED (dstno) += num_calls;
|
|
REG_N_CALLS_CROSSED (srcno) -= num_calls;
|
|
REG_FREQ_CALLS_CROSSED (dstno) += freq_calls;
|
|
REG_FREQ_CALLS_CROSSED (srcno) -= freq_calls;
|
|
|
|
REG_LIVE_LENGTH (dstno) += length;
|
|
if (REG_LIVE_LENGTH (srcno) >= 0)
|
|
{
|
|
REG_LIVE_LENGTH (srcno) -= length;
|
|
/* REG_LIVE_LENGTH is only an approximation after
   combine if sched is not run, so make sure that we
   still have a reasonable value. */
|
|
if (REG_LIVE_LENGTH (srcno) < 2)
|
|
REG_LIVE_LENGTH (srcno) = 2;
|
|
}
|
|
|
|
if (dump_file)
|
|
fprintf (dump_file,
|
|
"Fixed operand %d of insn %d matching operand %d.\n",
|
|
op_no, INSN_UID (insn), match_no);
|
|
|
|
break;
|
|
}
|
|
/* The scan failed: discard any changes that were queued in the
   group (the validate_change calls above pass 1 as in_group). */
else if (num_changes_pending () > 0)
|
|
cancel_changes (0);
|
|
}
|
|
|
|
/* If we weren't able to replace any of the alternatives, try an
   alternative approach of copying the source to the destination. */
|
|
if (!success && copy_src != NULL_RTX)
|
|
copy_src_to_dest (insn, copy_src, copy_dst);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Main entry for the register move optimization. */
|
|
|
|
static unsigned int
|
|
regmove_optimize (void)
|
|
{
|
|
int i;
|
|
int nregs = max_reg_num ();
|
|
|
|
df_note_add_problem ();
|
|
df_analyze ();
|
|
|
|
regstat_init_n_sets_and_refs ();
|
|
regstat_compute_ri ();
|
|
|
|
regno_src_regno = XNEWVEC (int, nregs);
|
|
for (i = nregs; --i >= 0; )
|
|
regno_src_regno[i] = -1;
|
|
|
|
/* A forward pass. Replace output operands with input operands. */
|
|
regmove_forward_pass ();
|
|
|
|
/* A backward pass. Replace input operands with output operands. */
|
|
regmove_backward_pass ();
|
|
|
|
/* Clean up. */
|
|
free (regno_src_regno);
|
|
if (reg_set_in_bb)
|
|
{
|
|
free (reg_set_in_bb);
|
|
reg_set_in_bb = NULL;
|
|
}
|
|
regstat_free_n_sets_and_refs ();
|
|
regstat_free_ri ();
|
|
return 0;
|
|
}
|
|
|
|
/* Returns nonzero if INSN's pattern has matching constraints for any operand.
|
|
Returns 0 if INSN can't be recognized, or if the alternative can't be
|
|
determined.
|
|
|
|
Initialize the info in MATCHP based on the constraints. */
|
|
|
|
static int
|
|
find_matches (rtx insn, struct match *matchp)
|
|
{
|
|
int likely_spilled[MAX_RECOG_OPERANDS];
|
|
int op_no;
|
|
int any_matches = 0;
|
|
|
|
extract_insn (insn);
|
|
if (! constrain_operands (0))
|
|
return 0;
|
|
|
|
/* Must initialize this before main loop, because the code for
|
|
the commutative case may set matches for operands other than
|
|
the current one. */
|
|
for (op_no = recog_data.n_operands; --op_no >= 0; )
|
|
matchp->with[op_no] = matchp->commutative[op_no] = -1;
|
|
|
|
for (op_no = 0; op_no < recog_data.n_operands; op_no++)
|
|
{
|
|
const char *p;
|
|
char c;
|
|
int i = 0;
|
|
|
|
p = recog_data.constraints[op_no];
|
|
|
|
likely_spilled[op_no] = 0;
|
|
matchp->use[op_no] = READ;
|
|
matchp->early_clobber[op_no] = 0;
|
|
if (*p == '=')
|
|
matchp->use[op_no] = WRITE;
|
|
else if (*p == '+')
|
|
matchp->use[op_no] = READWRITE;
|
|
|
|
for (;*p && i < which_alternative; p++)
|
|
if (*p == ',')
|
|
i++;
|
|
|
|
while ((c = *p) != '\0' && c != ',')
|
|
{
|
|
switch (c)
|
|
{
|
|
case '=':
|
|
break;
|
|
case '+':
|
|
break;
|
|
case '&':
|
|
matchp->early_clobber[op_no] = 1;
|
|
break;
|
|
case '%':
|
|
matchp->commutative[op_no] = op_no + 1;
|
|
matchp->commutative[op_no + 1] = op_no;
|
|
break;
|
|
|
|
case '0': case '1': case '2': case '3': case '4':
|
|
case '5': case '6': case '7': case '8': case '9':
|
|
{
|
|
char *end;
|
|
unsigned long match_ul = strtoul (p, &end, 10);
|
|
int match = match_ul;
|
|
|
|
p = end;
|
|
|
|
if (match < op_no && likely_spilled[match])
|
|
continue;
|
|
matchp->with[op_no] = match;
|
|
any_matches = 1;
|
|
if (matchp->commutative[op_no] >= 0)
|
|
matchp->with[matchp->commutative[op_no]] = match;
|
|
}
|
|
continue;
|
|
|
|
case 'a': case 'b': case 'c': case 'd': case 'e': case 'f': case 'h':
|
|
case 'j': case 'k': case 'l': case 'p': case 'q': case 't': case 'u':
|
|
case 'v': case 'w': case 'x': case 'y': case 'z': case 'A': case 'B':
|
|
case 'C': case 'D': case 'W': case 'Y': case 'Z':
|
|
if (CLASS_LIKELY_SPILLED_P (REG_CLASS_FROM_CONSTRAINT ((unsigned char) c, p) ))
|
|
likely_spilled[op_no] = 1;
|
|
break;
|
|
}
|
|
p += CONSTRAINT_LEN (c, p);
|
|
}
|
|
}
|
|
return any_matches;
|
|
}
|
|
|
|
|
|
|
|
static bool
|
|
gate_handle_regmove (void)
|
|
{
|
|
return (optimize > 0 && flag_regmove);
|
|
}
|
|
|
|
|
|
struct rtl_opt_pass pass_regmove =
|
|
{
|
|
{
|
|
RTL_PASS,
|
|
"regmove", /* name */
|
|
gate_handle_regmove, /* gate */
|
|
regmove_optimize, /* execute */
|
|
NULL, /* sub */
|
|
NULL, /* next */
|
|
0, /* static_pass_number */
|
|
TV_REGMOVE, /* tv_id */
|
|
0, /* properties_required */
|
|
0, /* properties_provided */
|
|
0, /* properties_destroyed */
|
|
0, /* todo_flags_start */
|
|
TODO_df_finish | TODO_verify_rtl_sharing |
|
|
TODO_dump_func |
|
|
TODO_ggc_collect /* todo_flags_finish */
|
|
}
|
|
};
|