tree-vect-patterns.c (vect_recog_divmod_pattern): Optimize sequence based on get_range_info returned range.

* tree-vect-patterns.c (vect_recog_divmod_pattern): Optimize
	sequence based on get_range_info returned range.

	* gcc.target/i386/vect-div-1.c: New test.

From-SVN: r203969
This commit is contained in:
Jakub Jelinek 2013-10-23 14:45:21 +02:00 committed by Jakub Jelinek
parent 2d67d16929
commit 7abed77964
4 changed files with 94 additions and 15 deletions

View File

@ -1,3 +1,8 @@
2013-10-23 Jakub Jelinek <jakub@redhat.com>
* tree-vect-patterns.c (vect_recog_divmod_pattern): Optimize
sequence based on get_range_info returned range.
2013-10-23 Andrew MacLeod <amacleod@redhat.com> 2013-10-23 Andrew MacLeod <amacleod@redhat.com>
* tree-ssa.h: Remove all #include's * tree-ssa.h: Remove all #include's

View File

@ -1,5 +1,7 @@
2013-10-23 Jakub Jelinek <jakub@redhat.com> 2013-10-23 Jakub Jelinek <jakub@redhat.com>
* gcc.target/i386/vect-div-1.c: New test.
* gcc.dg/vect/pr58508.c: Remove dg-options. * gcc.dg/vect/pr58508.c: Remove dg-options.
2013-10-23 Richard Biener <rguenther@suse.de> 2013-10-23 Richard Biener <rguenther@suse.de>

View File

@ -0,0 +1,43 @@
/* { dg-do compile { target sse2 } } */
/* { dg-options "-O2 -ftree-vectorize -fno-common -msse2" } */
/* Input operands read by f1..f4.  The elements are unsigned short, so
   each b[i] is non-negative once promoted to int.  */
unsigned short b[1024] = { 0 };
/* Destination array; f1..f4 each overwrite all 1024 elements.  */
int a[1024] = { 0 };
/* Store (b[i] + 7) / 15 into a[i] for every i in [0, 1024).
   b[i] is promoted from unsigned short, so the dividend is never
   negative.  X is unused.  Always returns 0.  */
int
f1 (int x)
{
  int i;
  for (i = 0; i < 1024; i++)
    a[i] = (b[i] + 7) / 15;
  /* The function is declared int; do not fall off the end.  */
  return 0;
}
/* Store (b[i] + 7) % 15 into a[i] for every i in [0, 1024).
   b[i] is promoted from unsigned short, so the dividend is never
   negative.  X is unused.  Always returns 0.  */
int
f2 (int x)
{
  int i;
  for (i = 0; i < 1024; i++)
    a[i] = (b[i] + 7) % 15;
  /* The function is declared int; do not fall off the end.  */
  return 0;
}
/* Store (b[i] - 66000) / 15 into a[i] for every i in [0, 1024).
   With a 16-bit unsigned short, b[i] - 66000 is always negative.
   X is unused.  Always returns 0.  */
int
f3 (int x)
{
  int i;
  for (i = 0; i < 1024; i++)
    a[i] = (b[i] - 66000) / 15;
  /* The function is declared int; do not fall off the end.  */
  return 0;
}
/* Store (b[i] - 66000) % 15 into a[i] for every i in [0, 1024).
   With a 16-bit unsigned short, b[i] - 66000 is always negative.
   X is unused.  Always returns 0.  */
int
f4 (int x)
{
  int i;
  for (i = 0; i < 1024; i++)
    a[i] = (b[i] - 66000) % 15;
  /* The function is declared int; do not fall off the end.  */
  return 0;
}
/* In f1 and f2, VRP can prove that the first operand of the division or
   modulo is always non-negative, so there is no need for the >> 31
   shift etc. that tests whether it is negative.  In f3 and f4, VRP can
   prove it is always negative, so the shift is not needed there
   either.  */
/* { dg-final { scan-assembler-not "psrad\[^\n\r\]*\\\$31" } } */

View File

@ -2230,20 +2230,19 @@ vect_recog_divmod_pattern (vec<gimple> *stmts,
if (post_shift >= prec) if (post_shift >= prec)
return NULL; return NULL;
/* t1 = oprnd1 h* ml; */ /* t1 = oprnd0 h* ml; */
t1 = vect_recog_temp_ssa_var (itype, NULL); t1 = vect_recog_temp_ssa_var (itype, NULL);
def_stmt def_stmt
= gimple_build_assign_with_ops (MULT_HIGHPART_EXPR, t1, oprnd0, = gimple_build_assign_with_ops (MULT_HIGHPART_EXPR, t1, oprnd0,
build_int_cst (itype, ml)); build_int_cst (itype, ml));
append_pattern_def_seq (stmt_vinfo, def_stmt);
if (add) if (add)
{ {
/* t2 = t1 + oprnd0; */ /* t2 = t1 + oprnd0; */
append_pattern_def_seq (stmt_vinfo, def_stmt);
t2 = vect_recog_temp_ssa_var (itype, NULL); t2 = vect_recog_temp_ssa_var (itype, NULL);
def_stmt def_stmt
= gimple_build_assign_with_ops (PLUS_EXPR, t2, t1, oprnd0); = gimple_build_assign_with_ops (PLUS_EXPR, t2, t1, oprnd0);
append_pattern_def_seq (stmt_vinfo, def_stmt);
} }
else else
t2 = t1; t2 = t1;
@ -2251,27 +2250,57 @@ vect_recog_divmod_pattern (vec<gimple> *stmts,
if (post_shift) if (post_shift)
{ {
/* t3 = t2 >> post_shift; */ /* t3 = t2 >> post_shift; */
append_pattern_def_seq (stmt_vinfo, def_stmt);
t3 = vect_recog_temp_ssa_var (itype, NULL); t3 = vect_recog_temp_ssa_var (itype, NULL);
def_stmt def_stmt
= gimple_build_assign_with_ops (RSHIFT_EXPR, t3, t2, = gimple_build_assign_with_ops (RSHIFT_EXPR, t3, t2,
build_int_cst (itype, post_shift)); build_int_cst (itype, post_shift));
append_pattern_def_seq (stmt_vinfo, def_stmt);
} }
else else
t3 = t2; t3 = t2;
/* t4 = oprnd0 >> (prec - 1); */ double_int oprnd0_min, oprnd0_max;
t4 = vect_recog_temp_ssa_var (itype, NULL); int msb = 1;
def_stmt if (get_range_info (oprnd0, &oprnd0_min, &oprnd0_max) == VR_RANGE)
= gimple_build_assign_with_ops (RSHIFT_EXPR, t4, oprnd0, {
build_int_cst (itype, prec - 1)); if (!oprnd0_min.is_negative ())
append_pattern_def_seq (stmt_vinfo, def_stmt); msb = 0;
else if (oprnd0_max.is_negative ())
msb = -1;
}
/* q = t3 - t4; or q = t4 - t3; */ if (msb == 0 && d >= 0)
q = vect_recog_temp_ssa_var (itype, NULL); {
pattern_stmt /* q = t3; */
= gimple_build_assign_with_ops (MINUS_EXPR, q, d < 0 ? t4 : t3, q = t3;
d < 0 ? t3 : t4); pattern_stmt = def_stmt;
}
else
{
/* t4 = oprnd0 >> (prec - 1);
or if we know from VRP that oprnd0 >= 0
t4 = 0;
or if we know from VRP that oprnd0 < 0
t4 = -1; */
append_pattern_def_seq (stmt_vinfo, def_stmt);
t4 = vect_recog_temp_ssa_var (itype, NULL);
if (msb != 1)
def_stmt
= gimple_build_assign_with_ops (INTEGER_CST,
t4, build_int_cst (itype, msb),
NULL_TREE);
else
def_stmt
= gimple_build_assign_with_ops (RSHIFT_EXPR, t4, oprnd0,
build_int_cst (itype, prec - 1));
append_pattern_def_seq (stmt_vinfo, def_stmt);
/* q = t3 - t4; or q = t4 - t3; */
q = vect_recog_temp_ssa_var (itype, NULL);
pattern_stmt
= gimple_build_assign_with_ops (MINUS_EXPR, q, d < 0 ? t4 : t3,
d < 0 ? t3 : t4);
}
} }
if (rhs_code == TRUNC_MOD_EXPR) if (rhs_code == TRUNC_MOD_EXPR)