gcc/testsuite/gcc.dg/tree-ssa/ssa-dom-cse-2.c - gcc - Git at Google

 /* { dg-do compile } */
 /* { dg-options "-O3 -fno-tree-fre -fno-tree-pre -fdump-tree-optimized --param sra-max-scalarization-size-Ospeed=32" } */
 /* System Z needs hardware vector support for this to work (the optimization
    gets too complex without it.
    { dg-additional-options "-march=z13" { target s390x-*-* } } */
 /* Use generic tuning on x86 for the same reasons as why alpha, powerpc etc. are
    xfailed below.
    { dg-additional-options "-mtune=generic" { target i?86-*-* x86_64-*-* } } */

 int
 foo ()
 {
   const int a[8] = { 0, 1, 2, 3, 4, 5, 6, 7 };
   int i, sum;

   sum = 0;
   for (i = 0; i < sizeof (a) / sizeof (*a); i++)
     sum += a[i];

   return sum;
 }

 /* After late unrolling the above loop completely DOM should be
    able to optimize this to return 28.  */

 /* On alpha, the vectorizer generates writes of two vector elements at once,
    but the loop reads only one element at a time, and DOM cannot resolve these.
    The same happens on powerpc depending on the SIMD support available.  */

 /* { dg-final { scan-tree-dump "return 28;" "optimized" { xfail { { alpha*-*-* hppa*64*-*-* nvptx*-*-* mmix-knuth-mmixware } || { { { lp64 && { powerpc*-*-* sparc*-*-* riscv*-*-* } } || aarch64_sve } || { arm*-*-* && { ! arm_neon } } } } } } } */
	/* { dg-do compile } */
	/* { dg-options "-O3 -fno-tree-fre -fno-tree-pre -fdump-tree-optimized --param sra-max-scalarization-size-Ospeed=32" } */
	/* System Z needs hardware vector support for this to work (the optimization
	gets too complex without it.
	{ dg-additional-options "-march=z13" { target s390x-- } } */
	/* Use generic tuning on x86 for the same reasons as why alpha, powerpc etc. are
	xfailed below.
	{ dg-additional-options "-mtune=generic" { target i?86-- x86_64-- } } */

	int
	foo ()
	{
	const int a[8] = { 0, 1, 2, 3, 4, 5, 6, 7 };
	int i, sum;

	sum = 0;
	for (i = 0; i < sizeof (a) / sizeof (*a); i++)
	sum += a[i];

	return sum;
	}

	/* After late unrolling the above loop completely DOM should be
	able to optimize this to return 28. */

	/* On alpha, the vectorizer generates writes of two vector elements at once,
	but the loop reads only one element at a time, and DOM cannot resolve these.
	The same happens on powerpc depending on the SIMD support available. */

	/* { dg-final { scan-tree-dump "return 28;" "optimized" { xfail { { alpha--* hppa64-- nvptx--* mmix-knuth-mmixware } \|\| { { { lp64 && { powerpc--* sparc--* riscv--* } } \|\| aarch64_sve } \|\| { arm--* && { ! arm_neon } } } } } } } */