2004-09-23 Dorit Naishlos <dorit@il.ibm.com> * tree.def (ALIGN_INDIRECT_REF, MISALIGNED_INDIRECT_REF): New tree-codes. * tree.h (REF_ORIGINAL): Consider ALIGN_INDIRECT_REF and MISALIGNED_INDIRECT_REF. * alias.c (get_alias_set, nonoverlapping_memrefs_p): Likewise. * emit-rtl.c (mem_expr_equal_p, set_mem_attributes_minus_bitpos): Likewise. * expr.c (safe_from_p, expand_expr_real_1, rewrite_address_base) (find_interesting_uses_address): Likewise. * fold-const.c (non_lvalue, operand_equal_p): Likewise. (build_fold_addr_expr_with_type): Likewise. * gimplify.c (gimplify_addr_expr, gimplify_expr): Likewise. * print-rtl.c (print_mem_expr): Likewise. * tree-dump.c (dequeue_and_dump): Likewise. * tree-eh.c (tree_could_trap_p): Likewise. * tree-gimple.c (is_gimple_addressable, get_base_address): Likewise. * tree-pretty-print.c (op_prio, op_symbol, dump_generic_node): Likewise. * tree-ssa-alias.c (find_ptr_dereference, ptr_is_dereferenced_by): Likewise. * tree-ssa-dce.c (mark_stmt_if_obviously_necessary): Likewise. * tree-ssa-dom.c (record_equivalences_from_stmt): Likewise. * tree-ssa-loop-im.c (for_each_index, is_call_clobbered_ref): Likewise. * tree-ssa-loop-ivopts.c (find_interesting_uses_address): Likewise. (add_address_candidates, rewrite_address_base): Likewise. * tree-ssa-operands.c (get_expr_operands, get_indirect_ref_operands): Likewise. * tree.c (staticp, build1_stat): Likewise. * tree.def (REALIGN_LOAD_EXPR, REALIGN_STORE_EXPR): New tree-codes. * tree-pretty-print.c (dump_generic_node): Consider REALIGN_LOAD_EXPR. * tree-ssa-operands.c (get_expr_operands): Likewise. * expr.c (expand_expr_real_1): Likewise. * optabs.h (vec_realign_store_optab, vec_realign_load_optab): New optabs. (OTI_vec_realign_store, OTI_vec_realign_load): New optab_index values for the new optabs. (expand_ternary_op): New function. * genopinit.c (optabs): Handle the new optabs. * optabs.c (optab_for_tree_code): Add cases for the new tree-codes. (init_optabs): Initialize vec_realign_load_optab. 
(expand_ternary_op): New functions. * target-def.h (TARGET_VECTORIZE): New member for struct gcc_target. (TARGET_VECTORIZE_MISALIGNED_MEM_OK): New member for targetm.vectorize. (TARGET_VECTORIZE_BUILTIN_MASK_FOR_LOAD): Likewise. (TARGET_VECTORIZE_BUILTIN_MASK_FOR_STORE): Likewise. * target.h (struct vectorize): New member for struct gcc_target. (misaligned_mem_ok): New member for targetm.vectorize. (builtin_mask_for_load): Likewise. (builtin_mask_for_store): Likewise. * targethooks.c (default_vect_misaligned_mem_ok): New function. * targethooks.h (default_vect_misaligned_mem_ok): New function. * config/rs6000/altivec.md (build_vector_mask_for_load): New define_expand. (vec_realign_load_v4si, vec_realign_load_v4sf, vec_realign_load_v8hi) (vec_realign_load_v16qi): New define_insn. * config/rs6000/rs6000.h (ALTIVEC_BUILTIN_MASK_FOR_LOAD): (ALTIVEC_BUILTIN_MASK_FOR_STORE): New target builtins. * config/rs6000/rs6000.c (altivec_builtin_mask_for_load): (altivec_builtin_mask_for_store): New variables. (rs6000_builtin_mask_for_load): New function. Implements TARGET_VECTORIZE_BUILTIN_MASK_FOR_LOAD. (rs6000_builtin_mask_for_store): New function. Implements TARGET_VECTORIZE_BUILTIN_MASK_FOR_STORE. (rs6000_expand_builtin): Expand the target builtins builtin_mask_for_load and builtin_mask_for_store. (altivec_init_builtins): Initialize the new target builtins. * config/i386/i386.c (ix86_misaligned_mem_ok): New function. Implements the target hook TARGET_VECTORIZE_MISALIGNED_MEM_OK. * tree-vectorizer.c (vect_create_data_ref): Renamed to vect_create_data_ref_ptr. Returns a pointer instead of an array-ref. (vect_create_addr_base_for_vector_ref): Additional argument (offset). (vectorizable_store): Call vect_create_data_ref_ptr with additional arguments, and create an indirect_ref with its return value data_ref. Check aligned_access_p. 
(vectorizable_load): Handle misaligned loads, using software-pipelined scheme with REALIGN_LOAD_EXPR and ALIGN_INDIRECT_REF if vec_realign_load_optab is supported, or using a scheme without software-pipelining with MISALIGNED_INDIRECT_REF if the target hook misaligned_mem_ok is supported. (vect_finish_stmt_generation): Typo. (vect_enhance_data_refs_alignment): Rename loop_vinfo to loop_info. (vect_analyze_data_refs_alignment): Don't fail vectorization in the presence of misaligned loads. (vect_analyze_data_ref_access): Add check for constant init. (vect_get_symbl_and_dr): Remove duplicate line. * tree-vectorizer.h (DR_MISALIGNMENT): Add comment. From-SVN: r87948
196 lines
6.1 KiB
C
196 lines
6.1 KiB
C
/* Loop Vectorization
   Copyright (C) 2003, 2004 Free Software Foundation, Inc.
   Contributed by Dorit Naishlos <dorit@il.ibm.com>

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 2, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING.  If not, write to the Free
Software Foundation, 59 Temple Place - Suite 330, Boston, MA
02111-1307, USA.  */
|
|
|
|
#ifndef GCC_TREE_VECTORIZER_H
|
|
#define GCC_TREE_VECTORIZER_H
|
|
|
|
/* Used for naming of new temporaries.  The enumerators carry the
   default values 0 (vect_simple_var) and 1 (vect_pointer_var).  */
enum vect_var_kind {
  vect_simple_var,
  vect_pointer_var
};
|
|
|
|
/* Defines type of operation: unary or binary.  Numbering starts at 1,
   so unary_op == 1 and binary_op == 2.  */
enum operation_type {
  unary_op = 1,
  binary_op
};
|
|
|
|
/*-----------------------------------------------------------------*/
/* Info on vectorized defs.                                        */
/*-----------------------------------------------------------------*/

/* Tag stored in the `type' field of struct _stmt_vec_info.
   undef_vec_info_type is explicitly 0; the remaining enumerators
   follow consecutively (1 through 4).  */
enum stmt_vec_info_type {
  undef_vec_info_type = 0,
  load_vec_info_type,
  store_vec_info_type,
  op_vec_info_type,
  assignment_vec_info_type
};
|
|
|
|
typedef struct _stmt_vec_info {
|
|
|
|
enum stmt_vec_info_type type;
|
|
|
|
/* The stmt to which this info struct refers to. */
|
|
tree stmt;
|
|
|
|
/* The loop with respect to which STMT is vectorized. */
|
|
struct loop *loop;
|
|
|
|
/* Not all stmts in the loop need to be vectorized. e.g, the incrementation
|
|
of the loop induction variable and computation of array indexes. relevant
|
|
indicates whether the stmt needs to be vectorized. */
|
|
bool relevant;
|
|
|
|
/* The vector type to be used. */
|
|
tree vectype;
|
|
|
|
/* The vectorized version of the stmt. */
|
|
tree vectorized_stmt;
|
|
|
|
|
|
/** The following is relevant only for stmts that contain a non-scalar
|
|
data-ref (array/pointer/struct access). A GIMPLE stmt is expected to have
|
|
at most one such data-ref. **/
|
|
|
|
/* Information about the data-ref (access function, etc). */
|
|
struct data_reference *data_ref_info;
|
|
|
|
/* Aliasing information. */
|
|
tree memtag;
|
|
|
|
/* Data reference base. This field holds the entire invariant part of the
|
|
data-reference (with respect to the relevant loop), as opposed to the
|
|
field DR_BASE of the STMT_VINFO_DATA_REF struct, which holds only the
|
|
initial base; e.g:
|
|
REF BR_BASE VECT_DR_BASE
|
|
a[i] a a
|
|
a[i][j] a a[i] */
|
|
tree vect_dr_base;
|
|
} *stmt_vec_info;
|
|
|
|
/* Access Functions.  Each macro expands to a field of the struct that
   S points to (a stmt_vec_info); the expansion is a parenthesized
   lvalue, so it can be read or assigned.  S is evaluated once.  */
#define STMT_VINFO_TYPE(S)          ((S)->type)
#define STMT_VINFO_STMT(S)          ((S)->stmt)
#define STMT_VINFO_LOOP(S)          ((S)->loop)
#define STMT_VINFO_RELEVANT_P(S)    ((S)->relevant)
#define STMT_VINFO_VECTYPE(S)       ((S)->vectype)
#define STMT_VINFO_VEC_STMT(S)      ((S)->vectorized_stmt)
#define STMT_VINFO_DATA_REF(S)      ((S)->data_ref_info)
#define STMT_VINFO_MEMTAG(S)        ((S)->memtag)
#define STMT_VINFO_VECT_DR_BASE(S)  ((S)->vect_dr_base)
|
|
|
|
static inline void set_stmt_info (stmt_ann_t ann, stmt_vec_info stmt_info);
|
|
static inline stmt_vec_info vinfo_for_stmt (tree stmt);
|
|
|
|
static inline void
|
|
set_stmt_info (stmt_ann_t ann, stmt_vec_info stmt_info)
|
|
{
|
|
if (ann)
|
|
ann->common.aux = (char *) stmt_info;
|
|
}
|
|
|
|
static inline stmt_vec_info
|
|
vinfo_for_stmt (tree stmt)
|
|
{
|
|
stmt_ann_t ann = stmt_ann (stmt);
|
|
return ann ? (stmt_vec_info) ann->common.aux : NULL;
|
|
}
|
|
|
|
/*-----------------------------------------------------------------*/
/* Info on data references alignment.                              */
/*-----------------------------------------------------------------*/

/* The misalignment of the memory access in bytes.  Stored in the aux
   field of the data reference DR.  aligned_access_p tests it against 0
   and unknown_alignment_for_access_p tests it against -1.  The
   expansion is a parenthesized lvalue.  */
#define DR_MISALIGNMENT(DR)   ((DR)->aux)
|
|
|
|
/* Return true if the misalignment recorded for DATA_REF_INFO
   (DR_MISALIGNMENT) is 0.  */
static inline bool
aligned_access_p (struct data_reference *data_ref_info)
{
  return (DR_MISALIGNMENT (data_ref_info) == 0);
}
|
|
|
|
/* Return true if the misalignment recorded for DATA_REF_INFO
   (DR_MISALIGNMENT) is -1, the value checked here as the marker for
   an unknown alignment.  */
static inline bool
unknown_alignment_for_access_p (struct data_reference *data_ref_info)
{
  return (DR_MISALIGNMENT (data_ref_info) == -1);
}
|
|
|
|
/* Perform signed modulo.  For Y > 0 the result is always non-negative
   (in the range [0, Y)); a negative remainder of X % Y is shifted up
   by Y.  The non-negative guarantee does NOT hold for negative Y.
   X and Y are evaluated more than once, so the arguments must be free
   of side effects.  */
#define VECT_SMODULO(x,y) ((x) % (y) < 0 ? ((x) % (y) + (y)) : (x) % (y))
|
|
|
|
|
|
/*-----------------------------------------------------------------*/
|
|
/* Info on vectorized loops. */
|
|
/*-----------------------------------------------------------------*/
|
|
typedef struct _loop_vec_info {
|
|
|
|
/* The loop to which this info struct refers to. */
|
|
struct loop *loop;
|
|
|
|
/* The loop basic blocks. */
|
|
basic_block *bbs;
|
|
|
|
/* The loop exit_condition. */
|
|
tree exit_cond;
|
|
|
|
/* Number of iterations. -1 if unknown. */
|
|
HOST_WIDE_INT num_iters;
|
|
|
|
/* Is the loop vectorizable? */
|
|
bool vectorizable;
|
|
|
|
/* Unrolling factor */
|
|
int vectorization_factor;
|
|
|
|
/* All data references in the loop that are being written to. */
|
|
varray_type data_ref_writes;
|
|
|
|
/* All data references in the loop that are being read from. */
|
|
varray_type data_ref_reads;
|
|
} *loop_vec_info;
|
|
|
|
/* Access Functions.  Each macro expands to a field of the struct that
   L points to (a loop_vec_info); the expansion is a parenthesized
   lvalue, so it can be read or assigned.  L is evaluated once.  */
#define LOOP_VINFO_LOOP(L)            ((L)->loop)
#define LOOP_VINFO_BBS(L)             ((L)->bbs)
#define LOOP_VINFO_EXIT_COND(L)       ((L)->exit_cond)
#define LOOP_VINFO_NITERS(L)          ((L)->num_iters)
#define LOOP_VINFO_VECTORIZABLE_P(L)  ((L)->vectorizable)
#define LOOP_VINFO_VECT_FACTOR(L)     ((L)->vectorization_factor)
#define LOOP_VINFO_DATAREF_WRITES(L)  ((L)->data_ref_writes)
#define LOOP_VINFO_DATAREF_READS(L)   ((L)->data_ref_reads)
|
|
|
|
/* Nonzero when the iteration count recorded for L is strictly
   positive.  Both the "unknown" marker -1 and a count of 0 yield
   zero here.  */
#define LOOP_VINFO_NITERS_KNOWN_P(L) (0 < (L)->num_iters)
|
|
|
|
/*-----------------------------------------------------------------*/
|
|
/* Function prototypes. */
|
|
/*-----------------------------------------------------------------*/
|
|
|
|
/* Main driver. */
|
|
extern void vectorize_loops (struct loops *);
|
|
|
|
/* creation and deletion of loop and stmt info structs. */
|
|
extern loop_vec_info new_loop_vec_info (struct loop *loop);
|
|
extern void destroy_loop_vec_info (loop_vec_info);
|
|
extern stmt_vec_info new_stmt_vec_info (tree stmt, struct loop *loop);
|
|
|
|
#endif /* GCC_TREE_VECTORIZER_H */
|