https://gcc.gnu.org/bugzilla/show_bug.cgi?id=99414
Jan Hubicka <hubicka at gcc dot gnu.org> changed:
What |Removed |Added
----------------------------------------------------------------------------
Summary|s235, s2233, s275 and s233 |s235, s2233, s275, s2275
|benchmarks of TSVC is |and s233 benchmarks of TSVC
|vectorized better by icc |is vectorized better by icc
|than gcc (loop interchange) |than gcc (loop interchange)
--- Comment #5 from Jan Hubicka <hubicka at gcc dot gnu.org> ---
s2275:
// Element type used by every array in this testcase.
typedef float real_t;

// Sizing constants. LEN_1D is defined but not referenced in this snippet.
#define iterations 100000
#define LEN_1D 32000
#define LEN_2D 256

// One-dimensional arrays, LEN_2D elements each.
real_t a[LEN_2D];
real_t b[LEN_2D];
real_t c[LEN_2D];
real_t d[LEN_2D];

// Square LEN_2D x LEN_2D matrices.
real_t aa[LEN_2D][LEN_2D];
real_t bb[LEN_2D][LEN_2D];
real_t cc[LEN_2D][LEN_2D];
real_t tt[LEN_2D][LEN_2D];
// Reduced s2275 kernel: repeatedly updates the matrix aa and the vector a.
//
// func_args is never read in this body, and struct args_t is not declared
// anywhere in this snippet.
// Returns aa[0][0] converted from real_t (float) to int.
int main(struct args_t * func_args)
{
// loop distribution is needed to be able to interchange
// (the i loop body contains both the inner j loop and the a[i] statement,
// so the i/j nest is not perfectly nested as written)
// Repetition loop: 100*(100000/256) = 39000 passes with integer division.
for (int nl = 0; nl < 100*(iterations/LEN_2D); nl++) {
for (int i = 0; i < LEN_2D; i++) {
// The inner loop varies the FIRST subscript, so consecutive iterations
// touch elements one full row (LEN_2D elements) apart in aa, bb and cc.
for (int j = 0; j < LEN_2D; j++) {
aa[j][i] = aa[j][i] + bb[j][i] * cc[j][i];
}
// Executed once per i, after the whole j loop for that i has finished.
a[i] = b[i] + c[i] * d[i];
}
// dummy() has no declaration in this snippet.
// NOTE(review): presumably an opaque external call that stops the
// compiler from collapsing the nl repetitions - confirm against the
// full TSVC sources.
dummy();
}
return aa[0][0];
}