2014-10-27 Andrew MacLeod <amacleod@redhat.com> * testsuite/gcc.dg/plugin/ggcplug.c: Shuffle includes to include gcc-plugin.h earlier. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * c/c-typeck.c: Adjust include files. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * c-family/c-gimplify.c: Adjust include files. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * cp/cp-gimplify.c: Adjust include files. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * go/go-gcc.cc: Adjust include files. * go/go-lang.c: Ditto. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * java/java-gimplify.c: Adjust include files. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * lto/lto-lang.c: Adjust include files. * lto/lto-object.c: Ditto. * lto/lto-partition.c: Ditto. * lto/lto-symtab.c: Ditto. * lto/lto.c: Ditto. 2014-10-27 Andrew MacLeod <amacleod@redhat.com> * basic-block.h: Remove all includes. (enum profile_status_d, struct control_flow_graph): Move to cfg.h * cfg.h (profile_status_d, struct control_flow_graph): Relocate here. * Makefile.in (GTFILES): Add cfg.h to list. * cgraph.h (symbol_table::create_empty): Move to cgraph.c. * cgraph.c (symbol_table::create_empty): Relocate from cgraph.h. * genconditions.c (write_header): Add predict.h and basic-block.h to lits of includes. * genemit.c (main): Ditto. * genpreds.c (write_insn_preds_c): Ditto. * genrecog.c (write_header): Ditto. * gengtype.c (open_base_files): Add predict.h, basic-block.h, and cfg.h to list of includes. * alias.c: Adjust include files. * asan.c: Ditto. * auto-inc-dec.c: Ditto. * auto-profile.c: Ditto. * bb-reorder.c: Ditto. * bt-load.c: Ditto. * builtins.c: Ditto. * caller-save.c: Ditto. * calls.c: Ditto. * cfg.c: Ditto. * cfganal.c: Ditto. * cfgbuild.c: Ditto. * cfgcleanup.c: Ditto. * cfgexpand.c: Ditto. * cfghooks.c: Ditto. * cfgloop.c: Ditto. * cfgloopanal.c: Ditto. * cfgloopmanip.c: Ditto. * cfgrtl.c: Ditto. * cgraphbuild.c: Ditto. * cgraphclones.c: Ditto. * cgraphunit.c: Ditto. * combine-stack-adj.c: Ditto. 
* combine.c: Ditto. * compare-elim.c: Ditto. * coverage.c: Ditto. * cprop.c: Ditto. * cse.c: Ditto. * cselib.c: Ditto. * data-streamer-in.c: Ditto. * data-streamer-out.c: Ditto. * data-streamer.c: Ditto. * dce.c: Ditto. * ddg.c: Ditto. * ddg.h: Ditto. * df-core.c: Ditto. * df-problems.c: Ditto. * df-scan.c: Ditto. * df.h: Ditto. * dojump.c: Ditto. * dominance.c: Ditto. * domwalk.c: Ditto. * dse.c: Ditto. * dwarf2cfi.c: Ditto. * emit-rtl.c: Ditto. * et-forest.c: Ditto. * except.c: Ditto. * expmed.c: Ditto. * expr.c: Ditto. * final.c: Ditto. * fold-const.c: Ditto. * function.c: Ditto. * fwprop.c: Ditto. * gcc-plugin.h: Ditto. * gcse.c: Ditto. * generic-match-head.c: Ditto. * ggc-page.c: Ditto. * gimple-builder.c: Ditto. * gimple-expr.c: Ditto. * gimple-fold.c: Ditto. * gimple-iterator.c: Ditto. * gimple-low.c: Ditto. * gimple-match-head.c: Ditto. * gimple-pretty-print.c: Ditto. * gimple-ssa-isolate-paths.c: Ditto. * gimple-ssa-strength-reduction.c: Ditto. * gimple-streamer-in.c: Ditto. * gimple-streamer-out.c: Ditto. * gimple-streamer.h: Ditto. * gimple-walk.c: Ditto. * gimple.c: Ditto. * gimplify-me.c: Ditto. * gimplify.c: Ditto. * graph.c: Ditto. * graphite-blocking.c: Ditto. * graphite-clast-to-gimple.c: Ditto. * graphite-dependences.c: Ditto. * graphite-interchange.c: Ditto. * graphite-isl-ast-to-gimple.c: Ditto. * graphite-optimize-isl.c: Ditto. * graphite-poly.c: Ditto. * graphite-scop-detection.c: Ditto. * graphite-sese-to-poly.c: Ditto. * graphite.c: Ditto. * haifa-sched.c: Ditto. * hw-doloop.c: Ditto. * ifcvt.c: Ditto. * init-regs.c: Ditto. * internal-fn.c: Ditto. * ipa-cp.c: Ditto. * ipa-devirt.c: Ditto. * ipa-icf-gimple.c: Ditto. * ipa-icf.c: Ditto. * ipa-inline-analysis.c: Ditto. * ipa-inline.c: Ditto. * ipa-polymorphic-call.c: Ditto. * ipa-profile.c: Ditto. * ipa-prop.c: Ditto. * ipa-pure-const.c: Ditto. * ipa-reference.c: Ditto. * ipa-split.c: Ditto. * ipa-utils.c: Ditto. * ipa.c: Ditto. * ira-build.c: Ditto. * ira-color.c: Ditto. 
* ira-conflicts.c: Ditto. * ira-costs.c: Ditto. * ira-emit.c: Ditto. * ira-lives.c: Ditto. * ira.c: Ditto. * jump.c: Ditto. * lcm.c: Ditto. * loop-doloop.c: Ditto. * loop-init.c: Ditto. * loop-invariant.c: Ditto. * loop-iv.c: Ditto. * loop-unroll.c: Ditto. * lower-subreg.c: Ditto. * lra-assigns.c: Ditto. * lra-coalesce.c: Ditto. * lra-constraints.c: Ditto. * lra-eliminations.c: Ditto. * lra-lives.c: Ditto. * lra-spills.c: Ditto. * lra.c: Ditto. * lto-cgraph.c: Ditto. * lto-compress.c: Ditto. * lto-opts.c: Ditto. * lto-section-in.c: Ditto. * lto-section-out.c: Ditto. * lto-streamer-in.c: Ditto. * lto-streamer-out.c: Ditto. * lto-streamer.c: Ditto. * mcf.c: Ditto. * mode-switching.c: Ditto. * modulo-sched.c: Ditto. * omp-low.c: Ditto. * optabs.c: Ditto. * opts-global.c: Ditto. * passes.c: Ditto. * postreload-gcse.c: Ditto. * postreload.c: Ditto. * predict.c: Ditto. * print-rtl.c: Ditto. * profile.c: Ditto. * recog.c: Ditto. * ree.c: Ditto. * reg-stack.c: Ditto. * regcprop.c: Ditto. * regcprop.h: Ditto. * reginfo.c: Ditto. * regrename.c: Ditto. * regstat.c: Ditto. * reload.c: Ditto. * reload1.c: Ditto. * reorg.c: Ditto. * resource.c: Ditto. * rtlanal.c: Ditto. * sched-deps.c: Ditto. * sched-ebb.c: Ditto. * sched-int.h: Ditto. * sched-rgn.c: Ditto. * sched-vis.c: Ditto. * sel-sched-dump.c: Ditto. * sel-sched-ir.c: Ditto. * sel-sched-ir.h: Ditto. * sel-sched.c: Ditto. * sese.c: Ditto. * shrink-wrap.c: Ditto. * stack-ptr-mod.c: Ditto. * stmt.c: Ditto. * store-motion.c: Ditto. * symtab.c: Ditto. * toplev.c: Ditto. * tracer.c: Ditto. * trans-mem.c: Ditto. * tree-affine.c: Ditto. * tree-call-cdce.c: Ditto. * tree-cfg.c: Ditto. * tree-cfgcleanup.c: Ditto. * tree-chrec.c: Ditto. * tree-complex.c: Ditto. * tree-data-ref.c: Ditto. * tree-dfa.c: Ditto. * tree-eh.c: Ditto. * tree-emutls.c: Ditto. * tree-if-conv.c: Ditto. * tree-inline.c: Ditto. * tree-into-ssa.c: Ditto. * tree-loop-distribution.c: Ditto. * tree-nested.c: Ditto. * tree-nrv.c: Ditto. * tree-object-size.c: Ditto. 
* tree-outof-ssa.c: Ditto. * tree-parloops.c: Ditto. * tree-phinodes.c: Ditto. * tree-predcom.c: Ditto. * tree-pretty-print.c: Ditto. * tree-profile.c: Ditto. * tree-scalar-evolution.c: Ditto. * tree-sra.c: Ditto. * tree-ssa-address.c: Ditto. * tree-ssa-alias.c: Ditto. * tree-ssa-ccp.c: Ditto. * tree-ssa-coalesce.c: Ditto. * tree-ssa-copy.c: Ditto. * tree-ssa-copyrename.c: Ditto. * tree-ssa-dce.c: Ditto. * tree-ssa-dom.c: Ditto. * tree-ssa-dse.c: Ditto. * tree-ssa-forwprop.c: Ditto. * tree-ssa-ifcombine.c: Ditto. * tree-ssa-live.c: Ditto. * tree-ssa-loop-ch.c: Ditto. * tree-ssa-loop-im.c: Ditto. * tree-ssa-loop-ivcanon.c: Ditto. * tree-ssa-loop-ivopts.c: Ditto. * tree-ssa-loop-manip.c: Ditto. * tree-ssa-loop-niter.c: Ditto. * tree-ssa-loop-prefetch.c: Ditto. * tree-ssa-loop-unswitch.c: Ditto. * tree-ssa-loop.c: Ditto. * tree-ssa-math-opts.c: Ditto. * tree-ssa-operands.c: Ditto. * tree-ssa-phiopt.c: Ditto. * tree-ssa-phiprop.c: Ditto. * tree-ssa-pre.c: Ditto. * tree-ssa-propagate.c: Ditto. * tree-ssa-reassoc.c: Ditto. * tree-ssa-sccvn.c: Ditto. * tree-ssa-sink.c: Ditto. * tree-ssa-strlen.c: Ditto. * tree-ssa-structalias.c: Ditto. * tree-ssa-tail-merge.c: Ditto. * tree-ssa-ter.c: Ditto. * tree-ssa-threadedge.c: Ditto. * tree-ssa-threadupdate.c: Ditto. * tree-ssa-uncprop.c: Ditto. * tree-ssa-uninit.c: Ditto. * tree-ssa.c: Ditto. * tree-ssanames.c: Ditto. * tree-stdarg.c: Ditto. * tree-streamer-in.c: Ditto. * tree-streamer-out.c: Ditto. * tree-streamer.c: Ditto. * tree-switch-conversion.c: Ditto. * tree-tailcall.c: Ditto. * tree-vect-data-refs.c: Ditto. * tree-vect-generic.c: Ditto. * tree-vect-loop-manip.c: Ditto. * tree-vect-loop.c: Ditto. * tree-vect-patterns.c: Ditto. * tree-vect-slp.c: Ditto. * tree-vect-stmts.c: Ditto. * tree-vectorizer.c: Ditto. * tree-vrp.c: Ditto. * tree.c: Ditto. * tsan.c: Ditto. * ubsan.c: Ditto. * valtrack.c: Ditto. * valtrack.h: Ditto. * value-prof.c: Ditto. * var-tracking.c: Ditto. * varasm.c: Ditto. * varpool.c: Ditto. 
* vtable-verify.c: Ditto. * web.c: Ditto. * config/aarch64/aarch64-builtins.c: Ditto. * config/aarch64/aarch64.c: Ditto. * config/alpha/alpha.c: Ditto. * config/arc/arc.c: Ditto. * config/arm/arm.c: Ditto. * config/avr/avr.c: Ditto. * config/bfin/bfin.c: Ditto. * config/c6x/c6x.c: Ditto. * config/cr16/cr16.c: Ditto. * config/cris/cris.c: Ditto. * config/darwin-c.c: Ditto. * config/darwin.c: Ditto. * config/epiphany/epiphany.c: Ditto. * config/epiphany/mode-switch-use.c: Ditto. * config/epiphany/resolve-sw-modes.c: Ditto. * config/fr30/fr30.c: Ditto. * config/frv/frv.c: Ditto. * config/h8300/h8300.c: Ditto. * config/i386/i386.c: Ditto. * config/i386/winnt.c: Ditto. * config/ia64/ia64.c: Ditto. * config/iq2000/iq2000.c: Ditto. * config/lm32/lm32.c: Ditto. * config/m32c/m32c.c: Ditto. * config/m32r/m32r.c: Ditto. * config/m68k/m68k.c: Ditto. * config/mcore/mcore.c: Ditto. * config/mep/mep.c: Ditto. * config/microblaze/microblaze.c: Ditto. * config/mips/mips.c: Ditto. * config/mmix/mmix.c: Ditto. * config/mn10300/mn10300.c: Ditto. * config/moxie/moxie.c: Ditto. * config/msp430/msp430.c: Ditto. * config/nds32/nds32-cost.c: Ditto. * config/nds32/nds32-fp-as-gp.c: Ditto. * config/nds32/nds32-intrinsic.c: Ditto. * config/nds32/nds32-isr.c: Ditto. * config/nds32/nds32-md-auxiliary.c: Ditto. * config/nds32/nds32-memory-manipulation.c: Ditto. * config/nds32/nds32-pipelines-auxiliary.c: Ditto. * config/nds32/nds32-predicates.c: Ditto. * config/nds32/nds32.c: Ditto. * config/nios2/nios2.c: Ditto. * config/pa/pa.c: Ditto. * config/pdp11/pdp11.c: Ditto. * config/rl78/rl78.c: Ditto. * config/rs6000/rs6000.c: Ditto. * config/rx/rx.c: Ditto. * config/s390/s390.c: Ditto. * config/sh/sh-mem.cc: Ditto. * config/sh/sh.c: Ditto. * config/sh/sh_optimize_sett_clrt.cc: Ditto. * config/sh/sh_treg_combine.cc: Ditto. * config/sparc/sparc.c: Ditto. * config/spu/spu.c: Ditto. * config/stormy16/stormy16.c: Ditto. * config/tilegx/tilegx.c: Ditto. * config/tilepro/tilepro.c: Ditto. 
* config/v850/v850.c: Ditto. * config/vax/vax.c: Ditto. * config/xtensa/xtensa.c: Ditto. From-SVN: r216735
461 lines
11 KiB
C
461 lines
11 KiB
C
/* Loop unswitching.
|
|
Copyright (C) 2004-2014 Free Software Foundation, Inc.
|
|
|
|
This file is part of GCC.
|
|
|
|
GCC is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by the
|
|
Free Software Foundation; either version 3, or (at your option) any
|
|
later version.
|
|
|
|
GCC is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GCC; see the file COPYING3. If not see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include "config.h"
|
|
#include "system.h"
|
|
#include "coretypes.h"
|
|
#include "tm.h"
|
|
#include "tree.h"
|
|
#include "tm_p.h"
|
|
#include "predict.h"
|
|
#include "vec.h"
|
|
#include "hashtab.h"
|
|
#include "hash-set.h"
|
|
#include "machmode.h"
|
|
#include "hard-reg-set.h"
|
|
#include "input.h"
|
|
#include "function.h"
|
|
#include "dominance.h"
|
|
#include "cfg.h"
|
|
#include "basic-block.h"
|
|
#include "tree-ssa-alias.h"
|
|
#include "internal-fn.h"
|
|
#include "gimple-expr.h"
|
|
#include "is-a.h"
|
|
#include "gimple.h"
|
|
#include "gimplify.h"
|
|
#include "gimple-ssa.h"
|
|
#include "tree-cfg.h"
|
|
#include "tree-phinodes.h"
|
|
#include "ssa-iterators.h"
|
|
#include "tree-ssa-loop-niter.h"
|
|
#include "tree-ssa-loop.h"
|
|
#include "tree-into-ssa.h"
|
|
#include "cfgloop.h"
|
|
#include "params.h"
|
|
#include "tree-pass.h"
|
|
#include "tree-inline.h"
|
|
|
|
/* This file implements the loop unswitching, i.e. transformation of loops like

   while (A)
     {
       if (inv)
         B;

       X;

       if (!inv)
         C;
     }

   where inv is the loop invariant, into

   if (inv)
     {
       while (A)
         {
           B;
           X;
         }
     }
   else
     {
       while (A)
         {
           X;
           C;
         }
     }

   Inv is considered invariant iff the values it compares are both invariant;
   tree-ssa-loop-im.c ensures that all the suitable conditions are in this
   shape.  */
|
|
|
|
static struct loop *tree_unswitch_loop (struct loop *, basic_block, tree);
|
|
static bool tree_unswitch_single_loop (struct loop *, int);
|
|
static tree tree_may_unswitch_on (basic_block, struct loop *);
|
|
|
|
/* Main entry point. Perform loop unswitching on all suitable loops. */
|
|
|
|
unsigned int
|
|
tree_ssa_unswitch_loops (void)
|
|
{
|
|
struct loop *loop;
|
|
bool changed = false;
|
|
HOST_WIDE_INT iterations;
|
|
|
|
/* Go through inner loops (only original ones). */
|
|
FOR_EACH_LOOP (loop, LI_ONLY_INNERMOST)
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Considering loop %d\n", loop->num);
|
|
|
|
/* Do not unswitch in cold regions. */
|
|
if (optimize_loop_for_size_p (loop))
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Not unswitching cold loops\n");
|
|
continue;
|
|
}
|
|
|
|
/* The loop should not be too large, to limit code growth. */
|
|
if (tree_num_loop_insns (loop, &eni_size_weights)
|
|
> (unsigned) PARAM_VALUE (PARAM_MAX_UNSWITCH_INSNS))
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Not unswitching, loop too big\n");
|
|
continue;
|
|
}
|
|
|
|
/* If the loop is not expected to iterate, there is no need
|
|
for unswitching. */
|
|
iterations = estimated_loop_iterations_int (loop);
|
|
if (iterations >= 0 && iterations <= 1)
|
|
{
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Not unswitching, loop is not expected to iterate\n");
|
|
continue;
|
|
}
|
|
|
|
changed |= tree_unswitch_single_loop (loop, 0);
|
|
}
|
|
|
|
if (changed)
|
|
return TODO_cleanup_cfg;
|
|
return 0;
|
|
}
|
|
|
|
/* Checks whether we can unswitch LOOP on condition at end of BB -- one of its
|
|
basic blocks (for what it means see comments below). */
|
|
|
|
static tree
|
|
tree_may_unswitch_on (basic_block bb, struct loop *loop)
|
|
{
|
|
gimple stmt, def;
|
|
tree cond, use;
|
|
basic_block def_bb;
|
|
ssa_op_iter iter;
|
|
|
|
/* BB must end in a simple conditional jump. */
|
|
stmt = last_stmt (bb);
|
|
if (!stmt || gimple_code (stmt) != GIMPLE_COND)
|
|
return NULL_TREE;
|
|
|
|
/* To keep the things simple, we do not directly remove the conditions,
|
|
but just replace tests with 0 != 0 resp. 1 != 0. Prevent the infinite
|
|
loop where we would unswitch again on such a condition. */
|
|
if (gimple_cond_true_p (stmt) || gimple_cond_false_p (stmt))
|
|
return NULL_TREE;
|
|
|
|
/* Condition must be invariant. */
|
|
FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
|
|
{
|
|
def = SSA_NAME_DEF_STMT (use);
|
|
def_bb = gimple_bb (def);
|
|
if (def_bb
|
|
&& flow_bb_inside_loop_p (loop, def_bb))
|
|
return NULL_TREE;
|
|
}
|
|
|
|
cond = build2 (gimple_cond_code (stmt), boolean_type_node,
|
|
gimple_cond_lhs (stmt), gimple_cond_rhs (stmt));
|
|
|
|
return cond;
|
|
}
|
|
|
|
/* Simplifies COND using checks in front of the entry of the LOOP. Just very
|
|
simplish (sufficient to prevent us from duplicating loop in unswitching
|
|
unnecessarily). */
|
|
|
|
static tree
|
|
simplify_using_entry_checks (struct loop *loop, tree cond)
|
|
{
|
|
edge e = loop_preheader_edge (loop);
|
|
gimple stmt;
|
|
|
|
while (1)
|
|
{
|
|
stmt = last_stmt (e->src);
|
|
if (stmt
|
|
&& gimple_code (stmt) == GIMPLE_COND
|
|
&& gimple_cond_code (stmt) == TREE_CODE (cond)
|
|
&& operand_equal_p (gimple_cond_lhs (stmt),
|
|
TREE_OPERAND (cond, 0), 0)
|
|
&& operand_equal_p (gimple_cond_rhs (stmt),
|
|
TREE_OPERAND (cond, 1), 0))
|
|
return (e->flags & EDGE_TRUE_VALUE
|
|
? boolean_true_node
|
|
: boolean_false_node);
|
|
|
|
if (!single_pred_p (e->src))
|
|
return cond;
|
|
|
|
e = single_pred_edge (e->src);
|
|
if (e->src == ENTRY_BLOCK_PTR_FOR_FN (cfun))
|
|
return cond;
|
|
}
|
|
}
|
|
|
|
/* Unswitch single LOOP. NUM is number of unswitchings done; we do not allow
|
|
it to grow too much, it is too easy to create example on that the code would
|
|
grow exponentially. */
|
|
|
|
static bool
|
|
tree_unswitch_single_loop (struct loop *loop, int num)
|
|
{
|
|
basic_block *bbs;
|
|
struct loop *nloop;
|
|
unsigned i, found;
|
|
tree cond = NULL_TREE;
|
|
gimple stmt;
|
|
bool changed = false;
|
|
|
|
i = 0;
|
|
bbs = get_loop_body (loop);
|
|
found = loop->num_nodes;
|
|
|
|
while (1)
|
|
{
|
|
/* Find a bb to unswitch on. */
|
|
for (; i < loop->num_nodes; i++)
|
|
if ((cond = tree_may_unswitch_on (bbs[i], loop)))
|
|
break;
|
|
|
|
if (i == loop->num_nodes)
|
|
{
|
|
if (dump_file
|
|
&& num > PARAM_VALUE (PARAM_MAX_UNSWITCH_LEVEL)
|
|
&& (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Not unswitching anymore, hit max level\n");
|
|
|
|
if (found == loop->num_nodes)
|
|
{
|
|
free (bbs);
|
|
return changed;
|
|
}
|
|
break;
|
|
}
|
|
|
|
cond = simplify_using_entry_checks (loop, cond);
|
|
stmt = last_stmt (bbs[i]);
|
|
if (integer_nonzerop (cond))
|
|
{
|
|
/* Remove false path. */
|
|
gimple_cond_set_condition_from_tree (stmt, boolean_true_node);
|
|
changed = true;
|
|
}
|
|
else if (integer_zerop (cond))
|
|
{
|
|
/* Remove true path. */
|
|
gimple_cond_set_condition_from_tree (stmt, boolean_false_node);
|
|
changed = true;
|
|
}
|
|
/* Do not unswitch too much. */
|
|
else if (num > PARAM_VALUE (PARAM_MAX_UNSWITCH_LEVEL))
|
|
{
|
|
i++;
|
|
continue;
|
|
}
|
|
/* In nested tree_unswitch_single_loop first optimize all conditions
|
|
using entry checks, then discover still reachable blocks in the
|
|
loop and find the condition only among those still reachable bbs. */
|
|
else if (num != 0)
|
|
{
|
|
if (found == loop->num_nodes)
|
|
found = i;
|
|
i++;
|
|
continue;
|
|
}
|
|
else
|
|
{
|
|
found = i;
|
|
break;
|
|
}
|
|
|
|
update_stmt (stmt);
|
|
i++;
|
|
}
|
|
|
|
if (num != 0)
|
|
{
|
|
basic_block *tos, *worklist;
|
|
|
|
/* When called recursively, first do a quick discovery
|
|
of reachable bbs after the above changes and only
|
|
consider conditions in still reachable bbs. */
|
|
tos = worklist = XNEWVEC (basic_block, loop->num_nodes);
|
|
|
|
for (i = 0; i < loop->num_nodes; i++)
|
|
bbs[i]->flags &= ~BB_REACHABLE;
|
|
|
|
/* Start with marking header. */
|
|
*tos++ = bbs[0];
|
|
bbs[0]->flags |= BB_REACHABLE;
|
|
|
|
/* Iterate: find everything reachable from what we've already seen
|
|
within the same innermost loop. Don't look through false edges
|
|
if condition is always true or true edges if condition is
|
|
always false. */
|
|
while (tos != worklist)
|
|
{
|
|
basic_block b = *--tos;
|
|
edge e;
|
|
edge_iterator ei;
|
|
int flags = 0;
|
|
|
|
if (EDGE_COUNT (b->succs) == 2)
|
|
{
|
|
gimple stmt = last_stmt (b);
|
|
if (stmt
|
|
&& gimple_code (stmt) == GIMPLE_COND)
|
|
{
|
|
if (gimple_cond_true_p (stmt))
|
|
flags = EDGE_FALSE_VALUE;
|
|
else if (gimple_cond_false_p (stmt))
|
|
flags = EDGE_TRUE_VALUE;
|
|
}
|
|
}
|
|
|
|
FOR_EACH_EDGE (e, ei, b->succs)
|
|
{
|
|
basic_block dest = e->dest;
|
|
|
|
if (dest->loop_father == loop
|
|
&& !(dest->flags & BB_REACHABLE)
|
|
&& !(e->flags & flags))
|
|
{
|
|
*tos++ = dest;
|
|
dest->flags |= BB_REACHABLE;
|
|
}
|
|
}
|
|
}
|
|
|
|
free (worklist);
|
|
|
|
/* Find a bb to unswitch on. */
|
|
for (; found < loop->num_nodes; found++)
|
|
if ((bbs[found]->flags & BB_REACHABLE)
|
|
&& (cond = tree_may_unswitch_on (bbs[found], loop)))
|
|
break;
|
|
|
|
if (found == loop->num_nodes)
|
|
{
|
|
free (bbs);
|
|
return changed;
|
|
}
|
|
}
|
|
|
|
if (dump_file && (dump_flags & TDF_DETAILS))
|
|
fprintf (dump_file, ";; Unswitching loop\n");
|
|
|
|
initialize_original_copy_tables ();
|
|
/* Unswitch the loop on this condition. */
|
|
nloop = tree_unswitch_loop (loop, bbs[found], cond);
|
|
if (!nloop)
|
|
{
|
|
free_original_copy_tables ();
|
|
free (bbs);
|
|
return changed;
|
|
}
|
|
|
|
/* Update the SSA form after unswitching. */
|
|
update_ssa (TODO_update_ssa);
|
|
free_original_copy_tables ();
|
|
|
|
/* Invoke itself on modified loops. */
|
|
tree_unswitch_single_loop (nloop, num + 1);
|
|
tree_unswitch_single_loop (loop, num + 1);
|
|
free (bbs);
|
|
return true;
|
|
}
|
|
|
|
/* Unswitch a LOOP w.r. to given basic block UNSWITCH_ON. We only support
|
|
unswitching of innermost loops. COND is the condition determining which
|
|
loop is entered -- the new loop is entered if COND is true. Returns NULL
|
|
if impossible, new loop otherwise. */
|
|
|
|
static struct loop *
|
|
tree_unswitch_loop (struct loop *loop,
|
|
basic_block unswitch_on, tree cond)
|
|
{
|
|
unsigned prob_true;
|
|
edge edge_true, edge_false;
|
|
|
|
/* Some sanity checking. */
|
|
gcc_assert (flow_bb_inside_loop_p (loop, unswitch_on));
|
|
gcc_assert (EDGE_COUNT (unswitch_on->succs) == 2);
|
|
gcc_assert (loop->inner == NULL);
|
|
|
|
extract_true_false_edges_from_block (unswitch_on, &edge_true, &edge_false);
|
|
prob_true = edge_true->probability;
|
|
return loop_version (loop, unshare_expr (cond),
|
|
NULL, prob_true, prob_true,
|
|
REG_BR_PROB_BASE - prob_true, false);
|
|
}
|
|
|
|
/* Loop unswitching pass. */
|
|
|
|
namespace {
|
|
|
|
const pass_data pass_data_tree_unswitch =
|
|
{
|
|
GIMPLE_PASS, /* type */
|
|
"unswitch", /* name */
|
|
OPTGROUP_LOOP, /* optinfo_flags */
|
|
TV_TREE_LOOP_UNSWITCH, /* tv_id */
|
|
PROP_cfg, /* properties_required */
|
|
0, /* properties_provided */
|
|
0, /* properties_destroyed */
|
|
0, /* todo_flags_start */
|
|
0, /* todo_flags_finish */
|
|
};
|
|
|
|
class pass_tree_unswitch : public gimple_opt_pass
|
|
{
|
|
public:
|
|
pass_tree_unswitch (gcc::context *ctxt)
|
|
: gimple_opt_pass (pass_data_tree_unswitch, ctxt)
|
|
{}
|
|
|
|
/* opt_pass methods: */
|
|
virtual bool gate (function *) { return flag_unswitch_loops != 0; }
|
|
virtual unsigned int execute (function *);
|
|
|
|
}; // class pass_tree_unswitch
|
|
|
|
unsigned int
|
|
pass_tree_unswitch::execute (function *fun)
|
|
{
|
|
if (number_of_loops (fun) <= 1)
|
|
return 0;
|
|
|
|
return tree_ssa_unswitch_loops ();
|
|
}
|
|
|
|
} // anon namespace
|
|
|
|
/* Create a new instance of the loop unswitching pass for context CTXT.
   The object is allocated with new and returned to the caller.  */

gimple_opt_pass *
make_pass_tree_unswitch (gcc::context *ctxt)
{
  gimple_opt_pass *pass = new pass_tree_unswitch (ctxt);
  return pass;
}
|
|
|
|
|