[Upload patch] Upload patches to add new features

and fix bugs

- add-fp-model-options.patch: New file
- enable-simd-math.patch: Enable simd math library in C and Fortran
- fix-CTOR-vectorization.patch: New file
- fix-range-set-by-vectorization-on-niter-IVs.patch: New file
- medium-code-mode.patch: Fix bugs when used with fpic
- optabs-Dont-use-scalar-conversions-for-vectors.patch: New file
- PR92429-do-not-fold-when-updating.patch: New file
- redundant-loop-elimination.patch: Fix some programming specifications
- fix-ICE-in-vect.patch: New file
- Fix-type-mismatch-in-SLPed-constructors.patch: New file
- add-check-for-pressure-in-sche1.patch: New file
- revert-moutline-atomics.patch: New file
- fix-ICE-in-eliminate-stmt.patch: New file
- revise-type-before-build-MULT.patch: New file
- Simplify-X-C1-C2.patch: New file
- gcc.spec: Add new patches
This commit is contained in:
xiezhiheng 2021-04-28 17:07:13 +08:00
parent 4d36586e0c
commit ae8eb7c877
16 changed files with 3069 additions and 182 deletions

View File

@ -0,0 +1,118 @@
This backport contains 2 patches from the GCC mainstream tree.
The commit ids of these patches are listed below in chronological order.
0001-Fix-type-mismatch-in-SLPed-constructors.patch
86c3a7d891f9f175d09d61f5ce163c6dc5ce681f
0001-re-PR-fortran-91003-ICE-when-compiling-LAPACK-CGEGV-.patch
d005f61e7a0dbb2c991f13b4b61b1a27ca2d8b73
diff -urpN a/gcc/testsuite/gfortran.dg/pr91003.f90 b/gcc/testsuite/gfortran.dg/pr91003.f90
--- a/gcc/testsuite/gfortran.dg/pr91003.f90 1969-12-31 19:00:00.000000000 -0500
+++ b/gcc/testsuite/gfortran.dg/pr91003.f90 2021-02-22 03:02:39.484000000 -0500
@@ -0,0 +1,33 @@
+! { dg-do compile }
+! { dg-options "-Ofast" }
+ SUBROUTINE FOO(N, A, B, C, D, E, F, G)
+ COMPLEX A(*)
+ LOGICAL H
+ INTEGER G
+ REAL I, C, J, F, F1, F2, K, E, L, M, B, D
+ DO JC = 1, N
+ K = F*REAL(A(JC))
+ Z = F*AIMAG(A(JC))
+ H = .FALSE.
+ L = G
+ IF(ABS(Z).LT.D .AND. I.GE. MAX(D, B*C, B*J)) THEN
+ H = .TRUE.
+ L = (D / F1) / MAX(D, F2*I)
+ END IF
+ IF(ABS(K).LT.D .AND. C.GE. MAX(D, B*I, B*J)) THEN
+ L = MAX(L, (D / F1) / MAX(D, F2*C))
+ END IF
+ IF(ABS(E).LT.D .AND. J.GE. MAX(D, B*C, B*I)) THEN
+ H = .TRUE.
+ L = MAX(L, (D / BNRM1) / MAX(D, BNRM2*J))
+ END IF
+ IF(H) THEN
+ M = (L*D)*MAX(ABS(K), ABS(Z), ABS(E))
+ END IF
+ IF(H) THEN
+ K = (L*REAL(A(JC)))*F
+ Z = (L*AIMAG(A(JC)))*F
+ END IF
+ A(JC) = CMPLX(K, Z)
+ END DO
+ END
diff -urpN a/gcc/tree-vect-slp.c b/gcc/tree-vect-slp.c
--- a/gcc/tree-vect-slp.c 2021-02-22 02:56:51.328000000 -0500
+++ b/gcc/tree-vect-slp.c 2021-02-22 03:03:22.676000000 -0500
@@ -3442,7 +3442,7 @@ vect_slp_bb (basic_block bb)
/* Return 1 if vector type STMT_VINFO is a boolean vector. */
static bool
-vect_mask_constant_operand_p (stmt_vec_info stmt_vinfo)
+vect_mask_constant_operand_p (stmt_vec_info stmt_vinfo, unsigned op_num)
{
enum tree_code code = gimple_expr_code (stmt_vinfo->stmt);
tree op, vectype;
@@ -3467,9 +3467,17 @@ vect_mask_constant_operand_p (stmt_vec_i
tree cond = gimple_assign_rhs1 (stmt);
if (TREE_CODE (cond) == SSA_NAME)
- op = cond;
+ {
+ if (op_num > 0)
+ return VECTOR_BOOLEAN_TYPE_P (STMT_VINFO_VECTYPE (stmt_vinfo));
+ op = cond;
+ }
else
- op = TREE_OPERAND (cond, 0);
+ {
+ if (op_num > 1)
+ return VECTOR_BOOLEAN_TYPE_P (STMT_VINFO_VECTYPE (stmt_vinfo));
+ op = TREE_OPERAND (cond, 0);
+ }
if (!vect_is_simple_use (op, stmt_vinfo->vinfo, &dt, &vectype))
gcc_unreachable ();
@@ -3600,9 +3608,10 @@ duplicate_and_interleave (vec_info *vinf
operands. */
static void
-vect_get_constant_vectors (slp_tree op_node, slp_tree slp_node,
+vect_get_constant_vectors (slp_tree slp_node, unsigned op_num,
vec<tree> *vec_oprnds)
{
+ slp_tree op_node = SLP_TREE_CHILDREN (slp_node)[op_num];
stmt_vec_info stmt_vinfo = SLP_TREE_SCALAR_STMTS (slp_node)[0];
vec_info *vinfo = stmt_vinfo->vinfo;
unsigned HOST_WIDE_INT nunits;
@@ -3624,7 +3633,7 @@ vect_get_constant_vectors (slp_tree op_n
/* Check if vector type is a boolean vector. */
tree stmt_vectype = STMT_VINFO_VECTYPE (stmt_vinfo);
if (VECT_SCALAR_BOOLEAN_TYPE_P (TREE_TYPE (op))
- && vect_mask_constant_operand_p (stmt_vinfo))
+ && vect_mask_constant_operand_p (stmt_vinfo, op_num))
vector_type = truth_type_for (stmt_vectype);
else
vector_type = get_vectype_for_scalar_type (vinfo, TREE_TYPE (op), op_node);
@@ -3848,7 +3857,7 @@ vect_get_slp_defs (slp_tree slp_node, ve
vect_get_slp_vect_defs (child, &vec_defs);
}
else
- vect_get_constant_vectors (child, slp_node, &vec_defs);
+ vect_get_constant_vectors (slp_node, i, &vec_defs);
vec_oprnds->quick_push (vec_defs);
}
@@ -4269,6 +4278,10 @@ vectorize_slp_instance_root_stmt (slp_tr
{
tree vect_lhs = gimple_get_lhs (child_stmt_info->stmt);
tree root_lhs = gimple_get_lhs (instance->root_stmt->stmt);
+ if (!useless_type_conversion_p (TREE_TYPE (root_lhs),
+ TREE_TYPE (vect_lhs)))
+ vect_lhs = build1 (VIEW_CONVERT_EXPR, TREE_TYPE (root_lhs),
+ vect_lhs);
rstmt = gimple_build_assign (root_lhs, vect_lhs);
break;
}

View File

@ -0,0 +1,70 @@
This backport contains 1 patch from the GCC mainstream tree.
The commit id of the patch is listed below.
0001-PR-tree-optimization-92429-do-not-fold-when-updating.patch
f7dff7699fd70d3b8c3e637818e18c86f93ccfec
diff --git a/gcc/tree-ssa-loop-niter.c b/gcc/tree-ssa-loop-niter.c
index 4d5e0494511..6e6df0bfdb8 100644
--- a/gcc/tree-ssa-loop-niter.c
+++ b/gcc/tree-ssa-loop-niter.c
@@ -1934,7 +1934,8 @@ number_of_iterations_cond (class loop *loop,
tree
simplify_replace_tree (tree expr, tree old, tree new_tree,
- tree (*valueize) (tree, void*), void *context)
+ tree (*valueize) (tree, void*), void *context,
+ bool do_fold)
{
unsigned i, n;
tree ret = NULL_TREE, e, se;
@@ -1966,7 +1967,7 @@ simplify_replace_tree (tree expr, tree old, tree new_tree,
for (i = 0; i < n; i++)
{
e = TREE_OPERAND (expr, i);
- se = simplify_replace_tree (e, old, new_tree, valueize, context);
+ se = simplify_replace_tree (e, old, new_tree, valueize, context, do_fold);
if (e == se)
continue;
@@ -1976,7 +1977,7 @@ simplify_replace_tree (tree expr, tree old, tree new_tree,
TREE_OPERAND (ret, i) = se;
}
- return (ret ? fold (ret) : expr);
+ return (ret ? (do_fold ? fold (ret) : ret) : expr);
}
/* Expand definitions of ssa names in EXPR as long as they are simple
diff --git a/gcc/tree-ssa-loop-niter.h b/gcc/tree-ssa-loop-niter.h
index 621e2c2e28d..eb8d1579479 100644
--- a/gcc/tree-ssa-loop-niter.h
+++ b/gcc/tree-ssa-loop-niter.h
@@ -58,7 +58,7 @@ extern void free_numbers_of_iterations_estimates (class loop *);
extern void free_numbers_of_iterations_estimates (function *);
extern tree simplify_replace_tree (tree, tree,
tree, tree (*)(tree, void *) = NULL,
- void * = NULL);
+ void * = NULL, bool do_fold = true);
extern void substitute_in_loop_info (struct loop *, tree, tree);
#endif /* GCC_TREE_SSA_LOOP_NITER_H */
diff --git a/gcc/tree-vect-loop.c b/gcc/tree-vect-loop.c
index 8e318a037a7..e5fb434bd4e 100644
--- a/gcc/tree-vect-loop.c
+++ b/gcc/tree-vect-loop.c
@@ -8434,8 +8434,13 @@ update_epilogue_loop_vinfo (class loop *epilogue, tree advance)
gimple_set_op (stmt, j, *new_op);
else
{
+ /* PR92429: The last argument of simplify_replace_tree disables
+ folding when replacing arguments. This is required as
+ otherwise you might end up with different statements than the
+ ones analyzed in vect_loop_analyze, leading to different
+ vectorization. */
op = simplify_replace_tree (op, NULL_TREE, NULL_TREE,
- &find_in_mapping, &mapping);
+ &find_in_mapping, &mapping, false);
gimple_set_op (stmt, j, op);
}
}

197
Simplify-X-C1-C2.patch Normal file
View File

@ -0,0 +1,197 @@
This backport contains 2 patches from the GCC mainstream tree.
The commit ids of these patches are listed below in chronological order.
0001-Simplify-X-C1-C2-with-undefined-overflow.patch
ca2b8c082c4f16919071c9f8de8db0b33b54c405
0002-Simplify-X-C1-C2-with-wrapping-overflow.patch
287522613d661b4c5ba8403b051eb470c1674cba
diff -Nurp a/gcc/expr.c b/gcc/expr.c
--- a/gcc/expr.c 2021-03-17 16:34:24.700000000 +0800
+++ b/gcc/expr.c 2021-03-17 10:30:11.500000000 +0800
@@ -11706,38 +11706,6 @@ string_constant (tree arg, tree *ptr_off
return init;
}
-/* Compute the modular multiplicative inverse of A modulo M
- using extended Euclid's algorithm. Assumes A and M are coprime. */
-static wide_int
-mod_inv (const wide_int &a, const wide_int &b)
-{
- /* Verify the assumption. */
- gcc_checking_assert (wi::eq_p (wi::gcd (a, b), 1));
-
- unsigned int p = a.get_precision () + 1;
- gcc_checking_assert (b.get_precision () + 1 == p);
- wide_int c = wide_int::from (a, p, UNSIGNED);
- wide_int d = wide_int::from (b, p, UNSIGNED);
- wide_int x0 = wide_int::from (0, p, UNSIGNED);
- wide_int x1 = wide_int::from (1, p, UNSIGNED);
-
- if (wi::eq_p (b, 1))
- return wide_int::from (1, p, UNSIGNED);
-
- while (wi::gt_p (c, 1, UNSIGNED))
- {
- wide_int t = d;
- wide_int q = wi::divmod_trunc (c, d, UNSIGNED, &d);
- c = t;
- wide_int s = x0;
- x0 = wi::sub (x1, wi::mul (q, x0));
- x1 = s;
- }
- if (wi::lt_p (x1, 0, SIGNED))
- x1 += d;
- return x1;
-}
-
/* Optimize x % C1 == C2 for signed modulo if C1 is a power of two and C2
is non-zero and C3 ((1<<(prec-1)) | (C1 - 1)):
for C2 > 0 to x & C3 == C2
@@ -11948,7 +11916,7 @@ maybe_optimize_mod_cmp (enum tree_code c
w = wi::lrshift (w, shift);
wide_int a = wide_int::from (w, prec + 1, UNSIGNED);
wide_int b = wi::shifted_mask (prec, 1, false, prec + 1);
- wide_int m = wide_int::from (mod_inv (a, b), prec, UNSIGNED);
+ wide_int m = wide_int::from (wi::mod_inv (a, b), prec, UNSIGNED);
tree c3 = wide_int_to_tree (type, m);
tree c5 = NULL_TREE;
wide_int d, e;
diff -Nurp a/gcc/match.pd b/gcc/match.pd
--- a/gcc/match.pd 2021-03-17 16:34:19.320000000 +0800
+++ b/gcc/match.pd 2021-03-17 10:30:11.500000000 +0800
@@ -3290,6 +3290,35 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
(scmp @0 @2)
(cmp @0 @2))))))
+/* For integral types with undefined overflow fold
+ x * C1 == C2 into x == C2 / C1 or false.
+ If overflow wraps and C1 is odd, simplify to x == C2 / C1 in the ring
+ Z / 2^n Z. */
+(for cmp (eq ne)
+ (simplify
+ (cmp (mult @0 INTEGER_CST@1) INTEGER_CST@2)
+ (if (INTEGRAL_TYPE_P (TREE_TYPE (@0))
+ && TYPE_OVERFLOW_UNDEFINED (TREE_TYPE (@0))
+ && wi::to_wide (@1) != 0)
+ (with { widest_int quot; }
+ (if (wi::multiple_of_p (wi::to_widest (@2), wi::to_widest (@1),
+ TYPE_SIGN (TREE_TYPE (@0)), &quot))
+ (cmp @0 { wide_int_to_tree (TREE_TYPE (@0), quot); })
+ { constant_boolean_node (cmp == NE_EXPR, type); }))
+ (if (INTEGRAL_TYPE_P (TREE_TYPE (@0))
+ && TYPE_OVERFLOW_WRAPS (TREE_TYPE (@0))
+ && (wi::bit_and (wi::to_wide (@1), 1) == 1))
+ (cmp @0
+ {
+ tree itype = TREE_TYPE (@0);
+ int p = TYPE_PRECISION (itype);
+ wide_int m = wi::one (p + 1) << p;
+ wide_int a = wide_int::from (wi::to_wide (@1), p + 1, UNSIGNED);
+ wide_int i = wide_int::from (wi::mod_inv (a, m),
+ p, TYPE_SIGN (itype));
+ wide_int_to_tree (itype, wi::mul (i, wi::to_wide (@2)));
+ })))))
+
/* Simplify comparison of something with itself. For IEEE
floating-point, we can only do some of these simplifications. */
(for cmp (eq ge le)
diff -Nurp a/gcc/testsuite/gcc.c-torture/execute/pr23135.c b/gcc/testsuite/gcc.c-torture/execute/pr23135.c
--- a/gcc/testsuite/gcc.c-torture/execute/pr23135.c 2021-03-17 16:34:24.016000000 +0800
+++ b/gcc/testsuite/gcc.c-torture/execute/pr23135.c 2021-03-17 10:30:13.572000000 +0800
@@ -1,7 +1,7 @@
/* Based on execute/simd-1.c, modified by joern.rennecke@st.com to
trigger a reload bug. Verified for gcc mainline from 20050722 13:00 UTC
for sh-elf -m4 -O2. */
-/* { dg-options "-Wno-psabi" } */
+/* { dg-options "-Wno-psabi -fwrapv" } */
/* { dg-add-options stack_size } */
#ifndef STACK_SIZE
diff -Nurp a/gcc/testsuite/gcc.dg/tree-ssa/pr95433-2.c b/gcc/testsuite/gcc.dg/tree-ssa/pr95433-2.c
--- a/gcc/testsuite/gcc.dg/tree-ssa/pr95433-2.c 1970-01-01 08:00:00.000000000 +0800
+++ b/gcc/testsuite/gcc.dg/tree-ssa/pr95433-2.c 2021-03-17 10:30:13.276000000 +0800
@@ -0,0 +1,15 @@
+/* { dg-do compile } */
+/* { dg-options "-O -fwrapv -fdump-tree-gimple" } */
+
+typedef __INT32_TYPE__ int32_t;
+typedef unsigned __INT32_TYPE__ uint32_t;
+
+int e(int32_t x){return 3*x==5;}
+int f(int32_t x){return 3*x==-5;}
+int g(int32_t x){return -3*x==5;}
+int h(int32_t x){return 7*x==3;}
+int i(uint32_t x){return 7*x==3;}
+
+/* { dg-final { scan-tree-dump-times "== 1431655767" 1 "gimple" } } */
+/* { dg-final { scan-tree-dump-times "== -1431655767" 2 "gimple" } } */
+/* { dg-final { scan-tree-dump-times "== 613566757" 2 "gimple" } } */
diff -Nurp a/gcc/testsuite/gcc.dg/tree-ssa/pr95433.c b/gcc/testsuite/gcc.dg/tree-ssa/pr95433.c
--- a/gcc/testsuite/gcc.dg/tree-ssa/pr95433.c 1970-01-01 08:00:00.000000000 +0800
+++ b/gcc/testsuite/gcc.dg/tree-ssa/pr95433.c 2021-03-17 10:30:13.276000000 +0800
@@ -0,0 +1,8 @@
+/* { dg-do compile } */
+/* { dg-options "-O -fdump-tree-optimized" } */
+
+int f(int x){return x*7==17;}
+int g(int x){return x*3==15;}
+
+/* { dg-final { scan-tree-dump "return 0;" "optimized" } } */
+/* { dg-final { scan-tree-dump "== 5;" "optimized" } } */
diff -Nurp a/gcc/wide-int.cc b/gcc/wide-int.cc
--- a/gcc/wide-int.cc 2021-03-17 16:34:24.488000000 +0800
+++ b/gcc/wide-int.cc 2021-03-17 10:30:11.500000000 +0800
@@ -2223,6 +2223,39 @@ wi::round_up_for_mask (const wide_int &v
return (val | tmp) & -tmp;
}
+/* Compute the modular multiplicative inverse of A modulo B
+ using extended Euclid's algorithm. Assumes A and B are coprime,
+ and that A and B have the same precision. */
+wide_int
+wi::mod_inv (const wide_int &a, const wide_int &b)
+{
+ /* Verify the assumption. */
+ gcc_checking_assert (wi::eq_p (wi::gcd (a, b), 1));
+
+ unsigned int p = a.get_precision () + 1;
+ gcc_checking_assert (b.get_precision () + 1 == p);
+ wide_int c = wide_int::from (a, p, UNSIGNED);
+ wide_int d = wide_int::from (b, p, UNSIGNED);
+ wide_int x0 = wide_int::from (0, p, UNSIGNED);
+ wide_int x1 = wide_int::from (1, p, UNSIGNED);
+
+ if (wi::eq_p (b, 1))
+ return wide_int::from (1, p, UNSIGNED);
+
+ while (wi::gt_p (c, 1, UNSIGNED))
+ {
+ wide_int t = d;
+ wide_int q = wi::divmod_trunc (c, d, UNSIGNED, &d);
+ c = t;
+ wide_int s = x0;
+ x0 = wi::sub (x1, wi::mul (q, x0));
+ x1 = s;
+ }
+ if (wi::lt_p (x1, 0, SIGNED))
+ x1 += d;
+ return x1;
+}
+
/*
* Private utilities.
*/
diff -Nurp a/gcc/wide-int.h b/gcc/wide-int.h
--- a/gcc/wide-int.h 2021-03-17 16:34:14.792000000 +0800
+++ b/gcc/wide-int.h 2021-03-17 10:30:11.500000000 +0800
@@ -3368,6 +3368,8 @@ namespace wi
wide_int round_down_for_mask (const wide_int &, const wide_int &);
wide_int round_up_for_mask (const wide_int &, const wide_int &);
+ wide_int mod_inv (const wide_int &a, const wide_int &b);
+
template <typename T>
T mask (unsigned int, bool);

View File

@ -0,0 +1,52 @@
--- a/gcc/haifa-sched.c 2021-03-08 14:46:59.204000000 +0800
+++ b/gcc/haifa-sched.c 2021-03-09 13:32:40.656000000 +0800
@@ -2036,8 +2036,10 @@ model_start_update_pressure (struct mode
/* The instruction wasn't part of the model schedule; it was moved
from a different block. Update the pressure for the end of
the model schedule. */
- MODEL_REF_PRESSURE (group, point, pci) += delta;
- MODEL_MAX_PRESSURE (group, point, pci) += delta;
+ if (MODEL_REF_PRESSURE (group, point, pci) != -1 || delta > 0)
+ MODEL_REF_PRESSURE (group, point, pci) += delta;
+ if (MODEL_MAX_PRESSURE (group, point, pci) != -1 || delta > 0)
+ MODEL_MAX_PRESSURE (group, point, pci) += delta;
}
else
{
diff -uprN a/gcc/testsuite/gcc.dg/sche1-pressure-check.c b/gcc/testsuite/gcc.dg/sche1-pressure-check.c
--- a/gcc/testsuite/gcc.dg/sche1-pressure-check.c 1970-01-01 08:00:00.000000000 +0800
+++ b/gcc/testsuite/gcc.dg/sche1-pressure-check.c 2021-03-09 13:40:34.036000000 +0800
@@ -0,0 +1,33 @@
+/* { dg-do compile } */
+/* { dg-options "-O3" } */
+
+int a, g, h;
+char b, c;
+short d;
+static int e;
+int *volatile f;
+void i() {
+ int j = 0;
+ int *k = &a;
+ for (; c; c--) {
+ g && (d = 0);
+ j ^= 10;
+ {
+ int l[2];
+ l;
+ h = l[1];
+ }
+ e = 1;
+ for (; e <= 7; e++) {
+ *k = 6;
+ *f = b = 0;
+ for (; b <= 7; b++) {
+ int m = 5;
+ if (g)
+ *k &= m ^= j;
+ }
+ }
+ }
+}
+int main() {}
+

376
add-fp-model-options.patch Normal file
View File

@ -0,0 +1,376 @@
diff -Nurp a/gcc/common.opt b/gcc/common.opt
--- a/gcc/common.opt 2021-02-18 21:22:07.216000000 +0800
+++ b/gcc/common.opt 2021-02-19 16:04:17.876000000 +0800
@@ -1506,6 +1506,32 @@ ffp-int-builtin-inexact
Common Report Var(flag_fp_int_builtin_inexact) Init(1) Optimization
Allow built-in functions ceil, floor, round, trunc to raise \"inexact\" exceptions.
+fftz
+Common Report Var(flag_ftz) Optimization
+Control fpcr register for flush to zero.
+
+fp-model=
+Common Joined RejectNegative Enum(fp_model) Var(flag_fp_model) Init(FP_MODEL_NORMAL) Optimization
+-fp-model=[normal|fast|precise|except|strict] Perform floating-point precision control.
+
+Enum
+Name(fp_model) Type(enum fp_model) UnknownError(unknown floating point precision model %qs)
+
+EnumValue
+Enum(fp_model) String(normal) Value(FP_MODEL_NORMAL)
+
+EnumValue
+Enum(fp_model) String(fast) Value(FP_MODEL_FAST)
+
+EnumValue
+Enum(fp_model) String(precise) Value(FP_MODEL_PRECISE)
+
+EnumValue
+Enum(fp_model) String(except) Value(FP_MODEL_EXCEPT)
+
+EnumValue
+Enum(fp_model) String(strict) Value(FP_MODEL_STRICT)
+
; Nonzero means don't put addresses of constant functions in registers.
; Used for compiling the Unix kernel, where strange substitutions are
; done on the assembly output.
diff -Nurp a/gcc/config/aarch64/aarch64-linux.h b/gcc/config/aarch64/aarch64-linux.h
--- a/gcc/config/aarch64/aarch64-linux.h 2021-02-18 21:22:07.220000000 +0800
+++ b/gcc/config/aarch64/aarch64-linux.h 2021-02-18 21:23:55.932000000 +0800
@@ -50,7 +50,8 @@
#define LINK_SPEC LINUX_TARGET_LINK_SPEC AARCH64_ERRATA_LINK_SPEC
#define GNU_USER_TARGET_MATHFILE_SPEC \
- "%{Ofast|ffast-math|funsafe-math-optimizations:crtfastmath.o%s}"
+ "%{Ofast|ffast-math|funsafe-math-optimizations|fp-model=fast|fftz:\
+ %{!fno-ftz:crtfastmath.o%s}}"
#undef ENDFILE_SPEC
#define ENDFILE_SPEC \
diff -Nurp a/gcc/flag-types.h b/gcc/flag-types.h
--- a/gcc/flag-types.h 2020-03-12 19:07:21.000000000 +0800
+++ b/gcc/flag-types.h 2021-02-18 21:23:55.932000000 +0800
@@ -207,6 +207,15 @@ enum fp_contract_mode {
FP_CONTRACT_FAST = 2
};
+/* Floating-point precision mode. */
+enum fp_model {
+ FP_MODEL_NORMAL = 0,
+ FP_MODEL_FAST = 1,
+ FP_MODEL_PRECISE = 2,
+ FP_MODEL_EXCEPT = 3,
+ FP_MODEL_STRICT = 4
+};
+
/* Scalar storage order kind. */
enum scalar_storage_order_kind {
SSO_NATIVE = 0,
diff -Nurp a/gcc/fortran/options.c b/gcc/fortran/options.c
--- a/gcc/fortran/options.c 2020-03-12 19:07:21.000000000 +0800
+++ b/gcc/fortran/options.c 2021-02-18 21:23:55.932000000 +0800
@@ -247,6 +247,7 @@ form_from_filename (const char *filename
return f_form;
}
+static void gfc_handle_fpe_option (const char *arg, bool trap);
/* Finalize commandline options. */
@@ -274,6 +275,13 @@ gfc_post_options (const char **pfilename
if (flag_protect_parens == -1)
flag_protect_parens = !optimize_fast;
+ /* If fp-model=except/strict, turn on all ffpe-trap and ffpe-summary. */
+ if (flag_fp_model == FP_MODEL_EXCEPT || flag_fp_model == FP_MODEL_STRICT)
+ {
+ gfc_handle_fpe_option ("all", false);
+ gfc_handle_fpe_option ("invalid,zero,overflow,underflow", true);
+ }
+
/* -Ofast sets implies -fstack-arrays unless an explicit size is set for
stack arrays. */
if (flag_stack_arrays == -1 && flag_max_stack_var_size == -2)
diff -Nurp a/gcc/opts.c b/gcc/opts.c
--- a/gcc/opts.c 2021-02-18 21:22:07.424000000 +0800
+++ b/gcc/opts.c 2021-02-19 16:00:08.628000000 +0800
@@ -196,6 +196,7 @@ static void set_debug_level (enum debug_
struct gcc_options *opts_set,
location_t loc);
static void set_fast_math_flags (struct gcc_options *opts, int set);
+static void set_fp_model_flags (struct gcc_options *opts, int set);
static void decode_d_option (const char *arg, struct gcc_options *opts,
location_t loc, diagnostic_context *dc);
static void set_unsafe_math_optimizations_flags (struct gcc_options *opts,
@@ -2433,6 +2434,10 @@ common_handle_option (struct gcc_options
set_fast_math_flags (opts, value);
break;
+ case OPT_fp_model_:
+ set_fp_model_flags (opts, value);
+ break;
+
case OPT_funsafe_math_optimizations:
set_unsafe_math_optimizations_flags (opts, value);
break;
@@ -2905,6 +2910,69 @@ set_fast_math_flags (struct gcc_options
}
}
+/* Handle fp-model options. */
+static void
+set_fp_model_flags (struct gcc_options *opts, int set)
+{
+ enum fp_model model = (enum fp_model) set;
+ switch (model)
+ {
+ case FP_MODEL_FAST:
+ /* Equivalent to open ffast-math. */
+ set_fast_math_flags (opts, 1);
+ break;
+
+ case FP_MODEL_PRECISE:
+ /* Equivalent to close ffast-math. */
+ set_fast_math_flags (opts, 0);
+ /* Turn on -frounding-math -fsignaling-nans. */
+ if (!opts->frontend_set_flag_signaling_nans)
+ opts->x_flag_signaling_nans = 1;
+ if (!opts->frontend_set_flag_rounding_math)
+ opts->x_flag_rounding_math = 1;
+ opts->x_flag_expensive_optimizations = 0;
+ opts->x_flag_code_hoisting = 0;
+ opts->x_flag_predictive_commoning = 0;
+ opts->x_flag_fp_contract_mode = FP_CONTRACT_OFF;
+ break;
+
+ case FP_MODEL_EXCEPT:
+ if (!opts->frontend_set_flag_signaling_nans)
+ opts->x_flag_signaling_nans = 1;
+ if (!opts->frontend_set_flag_errno_math)
+ opts->x_flag_errno_math = 1;
+ if (!opts->frontend_set_flag_trapping_math)
+ opts->x_flag_trapping_math = 1;
+ opts->x_flag_fp_int_builtin_inexact = 1;
+ /* Also turn on ffpe-trap in fortran. */
+ break;
+
+ case FP_MODEL_STRICT:
+ /* Turn on both precise and except. */
+ if (!opts->frontend_set_flag_signaling_nans)
+ opts->x_flag_signaling_nans = 1;
+ if (!opts->frontend_set_flag_rounding_math)
+ opts->x_flag_rounding_math = 1;
+ opts->x_flag_expensive_optimizations = 0;
+ opts->x_flag_code_hoisting = 0;
+ opts->x_flag_predictive_commoning = 0;
+ if (!opts->frontend_set_flag_errno_math)
+ opts->x_flag_errno_math = 1;
+ if (!opts->frontend_set_flag_trapping_math)
+ opts->x_flag_trapping_math = 1;
+ opts->x_flag_fp_int_builtin_inexact = 1;
+ opts->x_flag_fp_contract_mode = FP_CONTRACT_OFF;
+ break;
+
+ case FP_MODEL_NORMAL:
+ /* Do nothing. */
+ break;
+
+ default:
+ gcc_unreachable ();
+ }
+}
+
/* When -funsafe-math-optimizations is set the following
flags are set as well. */
static void
diff -Nurp a/gcc/opts-common.c b/gcc/opts-common.c
--- a/gcc/opts-common.c 2020-03-12 19:07:21.000000000 +0800
+++ b/gcc/opts-common.c 2021-02-19 09:49:18.880000000 +0800
@@ -26,7 +26,8 @@ along with GCC; see the file COPYING3.
#include "diagnostic.h"
#include "spellcheck.h"
-static void prune_options (struct cl_decoded_option **, unsigned int *);
+static void prune_options (struct cl_decoded_option **, unsigned int *,
+ unsigned int);
/* An option that is undocumented, that takes a joined argument, and
that doesn't fit any of the classes of uses (language/common,
@@ -968,7 +969,7 @@ decode_cmdline_options_to_array (unsigne
*decoded_options = opt_array;
*decoded_options_count = num_decoded_options;
- prune_options (decoded_options, decoded_options_count);
+ prune_options (decoded_options, decoded_options_count, lang_mask);
}
/* Return true if NEXT_OPT_IDX cancels OPT_IDX. Return false if the
@@ -989,11 +990,108 @@ cancel_option (int opt_idx, int next_opt
return false;
}
+/* Check whether opt_idx exists in decoded_options array between index
+ start and end. If found, return its index in decoded_options,
+ else return end. */
+static unsigned int
+find_opt_idx (struct cl_decoded_option *decoded_options,
+ unsigned int decoded_options_count,
+ unsigned int start, unsigned int end, unsigned int opt_idx)
+{
+ gcc_assert (end <= decoded_options_count);
+ gcc_assert (opt_idx < cl_options_count);
+ unsigned int k;
+ for (k = start; k < end; k++)
+ {
+ if (decoded_options[k].opt_index == opt_idx)
+ {
+ return k;
+ }
+ }
+ return k;
+}
+
+/* Remove the opt_index element from the decoded_options array. */
+static unsigned int
+remove_option (struct cl_decoded_option *decoded_options,
+ unsigned int decoded_options_count,
+ unsigned int opt_index)
+{
+ gcc_assert (opt_index < decoded_options_count);
+ unsigned int i;
+ for (i = opt_index; i < decoded_options_count - 1; i++)
+ {
+ decoded_options[i] = decoded_options[i + 1];
+ }
+ return decoded_options_count - 1;
+}
+
+/* Handle the priority between fp-model, Ofast, and
+ ffast-math. */
+static unsigned int
+handle_fp_model_driver (struct cl_decoded_option *decoded_options,
+ unsigned int decoded_options_count,
+ unsigned int fp_model_index,
+ unsigned int lang_mask)
+{
+ struct cl_decoded_option fp_model_opt = decoded_options[fp_model_index];
+ enum fp_model model = (enum fp_model) fp_model_opt.value;
+ if (model == FP_MODEL_PRECISE || model == FP_MODEL_STRICT)
+ {
+ /* If found Ofast, override Ofast with O3. */
+ unsigned int Ofast_index;
+ Ofast_index = find_opt_idx (decoded_options, decoded_options_count,
+ 0, decoded_options_count, OPT_Ofast);
+ while (Ofast_index != decoded_options_count)
+ {
+ const char *tmp_argv = "-O3";
+ decode_cmdline_option (&tmp_argv, lang_mask,
+ &decoded_options[Ofast_index]);
+ warning (0, "'-Ofast' is degraded to '-O3' due to %qs",
+ fp_model_opt.orig_option_with_args_text);
+ Ofast_index = find_opt_idx (decoded_options, decoded_options_count,
+ 0, decoded_options_count, OPT_Ofast);
+ }
+ /* If ffast-math is found before fp-model=precise/strict,
+ cancel it. */
+ unsigned int ffast_math_index;
+ ffast_math_index
+ = find_opt_idx (decoded_options, decoded_options_count, 0,
+ fp_model_index, OPT_ffast_math);
+ if (ffast_math_index != fp_model_index)
+ {
+ decoded_options_count
+ = remove_option (decoded_options, decoded_options_count,
+ ffast_math_index);
+ warning (0, "'-ffast-math' before %qs is canceled",
+ fp_model_opt.orig_option_with_args_text);
+ }
+ }
+ if (model == FP_MODEL_FAST)
+ {
+ /* If found -fno-fast-math after fp-model=fast, cancel this one. */
+ unsigned int fno_fast_math_index;
+ fno_fast_math_index
+ = find_opt_idx (decoded_options, decoded_options_count, fp_model_index,
+ decoded_options_count, OPT_ffast_math);
+ if (fno_fast_math_index != decoded_options_count
+ && decoded_options[fno_fast_math_index].value == 0)
+ {
+ decoded_options_count
+ = remove_option (decoded_options, decoded_options_count,
+ fp_model_index);
+ warning (0, "'-fp-model=fast' before '-fno-fast-math' is canceled");
+ }
+ }
+ return decoded_options_count;
+}
+
/* Filter out options canceled by the ones after them. */
static void
prune_options (struct cl_decoded_option **decoded_options,
- unsigned int *decoded_options_count)
+ unsigned int *decoded_options_count,
+ unsigned int lang_mask)
{
unsigned int old_decoded_options_count = *decoded_options_count;
struct cl_decoded_option *old_decoded_options = *decoded_options;
@@ -1005,6 +1103,8 @@ prune_options (struct cl_decoded_option
unsigned int fdiagnostics_color_idx = 0;
/* Remove arguments which are negated by others after them. */
+
+ unsigned int fp_model_index = old_decoded_options_count;
new_decoded_options_count = 0;
for (i = 0; i < old_decoded_options_count; i++)
{
@@ -1028,6 +1128,34 @@ prune_options (struct cl_decoded_option
fdiagnostics_color_idx = i;
continue;
+ case OPT_fp_model_:
+ /* Only the last fp-model option will take effect. */
+ unsigned int next_fp_model_idx;
+ next_fp_model_idx = find_opt_idx (old_decoded_options,
+ old_decoded_options_count,
+ i + 1,
+ old_decoded_options_count,
+ OPT_fp_model_);
+ if (next_fp_model_idx != old_decoded_options_count)
+ {
+ /* Found more than one fp-model, cancel this one. */
+ if (old_decoded_options[i].value
+ != old_decoded_options[next_fp_model_idx].value)
+ {
+ warning (0, "%qs is overrided by %qs",
+ old_decoded_options[i].
+ orig_option_with_args_text,
+ old_decoded_options[next_fp_model_idx].
+ orig_option_with_args_text);
+ }
+ break;
+ }
+ else
+ {
+ /* Found the last fp-model option. */
+ fp_model_index = new_decoded_options_count;
+ }
+ /* FALLTHRU. */
default:
gcc_assert (opt_idx < cl_options_count);
option = &cl_options[opt_idx];
@@ -1067,6 +1195,14 @@ keep:
break;
}
}
+ if (fp_model_index < new_decoded_options_count)
+ {
+ new_decoded_options_count
+ = handle_fp_model_driver (new_decoded_options,
+ new_decoded_options_count,
+ fp_model_index,
+ lang_mask);
+ }
if (fdiagnostics_color_idx >= 1)
{

View File

@ -1,7 +1,35 @@
diff -Nurp a/gcc/c-family/c-opts.c b/gcc/c-family/c-opts.c
--- a/gcc/c-family/c-opts.c 2021-01-07 17:32:31.856000000 +0800
+++ b/gcc/c-family/c-opts.c 2021-01-07 17:05:02.524000000 +0800
@@ -783,6 +783,10 @@ c_common_post_options (const char **pfil
if (cpp_opts->deps.style == DEPS_NONE)
check_deps_environment_vars ();
+ if (flag_simdmath)
+ {
+ defer_opt (OPT_include, "simdmath.h");
+ }
handle_deferred_opts ();
sanitize_cpp_opts ();
diff -Nurp a/gcc/common.opt b/gcc/common.opt
--- a/gcc/common.opt 2021-01-07 17:30:43.912000000 +0800
+++ b/gcc/common.opt 2021-01-07 17:38:38.612000000 +0800
@@ -1935,6 +1935,10 @@ fmath-errno
Common Report Var(flag_errno_math) Init(1) Optimization SetByCombined
Set errno after built-in math functions.
+fsimdmath
+Common Report Var(flag_simdmath) Init(0) Optimization
+Enable auto-vectorize math functions for mathlib. This option will turn on -fno-math-errno and -fopenmp-simd.
+
fmax-errors=
Common Joined RejectNegative UInteger Var(flag_max_errors)
-fmax-errors=<number> Maximum number of errors to report.
diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
--- a/gcc/config/aarch64/aarch64.c 2020-07-06 17:20:30.368000000 +0800 --- a/gcc/config/aarch64/aarch64.c 2021-01-07 17:30:43.912000000 +0800
+++ b/gcc/config/aarch64/aarch64.c 2020-07-06 20:02:39.480000000 +0800 +++ b/gcc/config/aarch64/aarch64.c 2021-01-05 15:17:21.580000000 +0800
@@ -18860,8 +18860,12 @@ aarch64_simd_clone_compute_vecsize_and_s @@ -21588,8 +21588,12 @@ aarch64_simd_clone_compute_vecsize_and_s
elt_bits = GET_MODE_BITSIZE (SCALAR_TYPE_MODE (base_type)); elt_bits = GET_MODE_BITSIZE (SCALAR_TYPE_MODE (base_type));
if (clonei->simdlen == 0) if (clonei->simdlen == 0)
{ {
@ -17,9 +45,9 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
} }
else else
diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt
--- a/gcc/config/aarch64/aarch64.opt 2020-07-06 17:20:30.364000000 +0800 --- a/gcc/config/aarch64/aarch64.opt 2021-01-07 17:30:43.912000000 +0800
+++ b/gcc/config/aarch64/aarch64.opt 2020-07-06 20:02:39.480000000 +0800 +++ b/gcc/config/aarch64/aarch64.opt 2021-01-05 15:17:21.448000000 +0800
@@ -186,6 +186,12 @@ precision of square root results to abou @@ -197,6 +197,12 @@ precision of square root results to abou
single precision and to 32 bits for double precision. single precision and to 32 bits for double precision.
If enabled, it implies -mlow-precision-recip-sqrt. If enabled, it implies -mlow-precision-recip-sqrt.
@ -32,3 +60,199 @@ diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt
mlow-precision-div mlow-precision-div
Target Var(flag_mlow_precision_div) Optimization Target Var(flag_mlow_precision_div) Optimization
Enable the division approximation. Enabling this reduces Enable the division approximation. Enabling this reduces
diff -Nurp a/gcc/fortran/scanner.c b/gcc/fortran/scanner.c
--- a/gcc/fortran/scanner.c 2021-01-07 17:31:59.264000000 +0800
+++ b/gcc/fortran/scanner.c 2021-01-07 17:05:28.776000000 +0800
@@ -2702,6 +2702,10 @@ gfc_new_file (void)
&& !load_file (flag_pre_include, NULL, false))
exit (FATAL_EXIT_CODE);
+ if (flag_simdmath
+ && !load_file ("simdmath_f.h", NULL, false))
+ exit (FATAL_EXIT_CODE);
+
if (gfc_cpp_enabled ())
{
result = gfc_cpp_preprocess (gfc_source_file);
diff -Nurp a/gcc/opts.c b/gcc/opts.c
--- a/gcc/opts.c 2021-01-07 17:30:57.740000000 +0800
+++ b/gcc/opts.c 2021-01-05 15:17:21.068000000 +0800
@@ -190,6 +190,7 @@ typedef char *char_p; /* For DEF_VEC_P.
static void handle_param (struct gcc_options *opts,
struct gcc_options *opts_set, location_t loc,
const char *carg);
+static void set_simdmath_flags (struct gcc_options *opts, int set);
static void set_debug_level (enum debug_info_type type, int extended,
const char *arg, struct gcc_options *opts,
struct gcc_options *opts_set,
@@ -2420,6 +2421,10 @@ common_handle_option (struct gcc_options
dc->min_margin_width = value;
break;
+ case OPT_fsimdmath:
+ set_simdmath_flags (opts, value);
+ break;
+
case OPT_fdump_:
/* Deferred. */
break;
@@ -2843,6 +2848,18 @@ handle_param (struct gcc_options *opts,
free (arg);
}
+/* The following routines are used to set -fno-math-errno and -fopenmp-simd
+ to enable vector mathlib. */
+static void
+set_simdmath_flags (struct gcc_options *opts, int set)
+{
+ if (set)
+ {
+ opts->x_flag_errno_math = 0;
+ opts->x_flag_openmp_simd = 1;
+ }
+}
+
/* Used to set the level of strict aliasing warnings in OPTS,
when no level is specified (i.e., when -Wstrict-aliasing, and not
-Wstrict-aliasing=level was given).
diff -Nurp a/libgomp/configure b/libgomp/configure
--- a/libgomp/configure 2021-01-07 17:40:08.216000000 +0800
+++ b/libgomp/configure 2021-01-07 16:29:45.628000000 +0800
@@ -17258,7 +17258,7 @@ fi
-ac_config_files="$ac_config_files omp.h omp_lib.h omp_lib.f90 libgomp_f.h"
+ac_config_files="$ac_config_files omp.h omp_lib.h simdmath.h simdmath_f.h omp_lib.f90 libgomp_f.h"
ac_config_files="$ac_config_files Makefile testsuite/Makefile libgomp.spec"
@@ -18426,6 +18426,8 @@ do
"gstdint.h") CONFIG_COMMANDS="$CONFIG_COMMANDS gstdint.h" ;;
"omp.h") CONFIG_FILES="$CONFIG_FILES omp.h" ;;
"omp_lib.h") CONFIG_FILES="$CONFIG_FILES omp_lib.h" ;;
+ "simdmath.h") CONFIG_FILES="$CONFIG_FILES simdmath.h" ;;
+ "simdmath_f.h") CONFIG_FILES="$CONFIG_FILES simdmath_f.h" ;;
"omp_lib.f90") CONFIG_FILES="$CONFIG_FILES omp_lib.f90" ;;
"libgomp_f.h") CONFIG_FILES="$CONFIG_FILES libgomp_f.h" ;;
"Makefile") CONFIG_FILES="$CONFIG_FILES Makefile" ;;
diff -Nurp a/libgomp/configure.ac b/libgomp/configure.ac
--- a/libgomp/configure.ac 2021-01-07 17:40:08.216000000 +0800
+++ b/libgomp/configure.ac 2021-01-07 16:26:26.560000000 +0800
@@ -422,7 +422,7 @@ CFLAGS="$save_CFLAGS"
# Determine what GCC version number to use in filesystem paths.
GCC_BASE_VER
-AC_CONFIG_FILES(omp.h omp_lib.h omp_lib.f90 libgomp_f.h)
+AC_CONFIG_FILES(omp.h omp_lib.h simdmath.h simdmath_f.h omp_lib.f90 libgomp_f.h)
AC_CONFIG_FILES(Makefile testsuite/Makefile libgomp.spec)
AC_CONFIG_FILES([testsuite/libgomp-test-support.pt.exp:testsuite/libgomp-test-support.exp.in])
AC_OUTPUT
diff -Nurp a/libgomp/Makefile.am b/libgomp/Makefile.am
--- a/libgomp/Makefile.am 2021-01-07 17:40:08.168000000 +0800
+++ b/libgomp/Makefile.am 2021-01-07 16:27:39.776000000 +0800
@@ -74,9 +74,9 @@ libgomp_la_SOURCES += openacc.f90
endif
nodist_noinst_HEADERS = libgomp_f.h
-nodist_libsubinclude_HEADERS = omp.h openacc.h
+nodist_libsubinclude_HEADERS = omp.h openacc.h simdmath.h
if USE_FORTRAN
-nodist_finclude_HEADERS = omp_lib.h omp_lib.f90 omp_lib.mod omp_lib_kinds.mod \
+nodist_finclude_HEADERS = omp_lib.h simdmath_f.h omp_lib.f90 omp_lib.mod omp_lib_kinds.mod \
openacc_lib.h openacc.f90 openacc.mod openacc_kinds.mod
endif
diff -Nurp a/libgomp/Makefile.in b/libgomp/Makefile.in
--- a/libgomp/Makefile.in 2021-01-07 17:40:08.208000000 +0800
+++ b/libgomp/Makefile.in 2021-01-07 16:50:28.820000000 +0800
@@ -145,7 +145,7 @@ am__CONFIG_DISTCLEAN_FILES = config.stat
configure.lineno config.status.lineno
mkinstalldirs = $(SHELL) $(top_srcdir)/../mkinstalldirs
CONFIG_HEADER = config.h
-CONFIG_CLEAN_FILES = omp.h omp_lib.h omp_lib.f90 libgomp_f.h \
+CONFIG_CLEAN_FILES = omp.h omp_lib.h simdmath.h simdmath_f.h omp_lib.f90 libgomp_f.h \
libgomp.spec
CONFIG_CLEAN_VPATH_FILES =
am__vpath_adj_setup = srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`;
@@ -575,8 +575,8 @@ libgomp_la_SOURCES = alloc.c atomic.c ba
@PLUGIN_HSA_TRUE@libgomp_plugin_hsa_la_LIBADD = libgomp.la $(PLUGIN_HSA_LIBS)
@PLUGIN_HSA_TRUE@libgomp_plugin_hsa_la_LIBTOOLFLAGS = --tag=disable-static
nodist_noinst_HEADERS = libgomp_f.h
-nodist_libsubinclude_HEADERS = omp.h openacc.h
-@USE_FORTRAN_TRUE@nodist_finclude_HEADERS = omp_lib.h omp_lib.f90 omp_lib.mod omp_lib_kinds.mod \
+nodist_libsubinclude_HEADERS = omp.h openacc.h simdmath.h
+@USE_FORTRAN_TRUE@nodist_finclude_HEADERS = omp_lib.h simdmath_f.h omp_lib.f90 omp_lib.mod omp_lib_kinds.mod \
@USE_FORTRAN_TRUE@ openacc_lib.h openacc.f90 openacc.mod openacc_kinds.mod
LTLDFLAGS = $(shell $(SHELL) $(top_srcdir)/../libtool-ldflags $(LDFLAGS))
@@ -668,6 +668,10 @@ omp.h: $(top_builddir)/config.status $(s
cd $(top_builddir) && $(SHELL) ./config.status $@
omp_lib.h: $(top_builddir)/config.status $(srcdir)/omp_lib.h.in
cd $(top_builddir) && $(SHELL) ./config.status $@
+simdmath_f.h: $(top_builddir)/config.status $(srcdir)/simdmath_f.h.in
+ cd $(top_builddir) && $(SHELL) ./config.status $@
+simdmath.h: $(top_builddir)/config.status $(srcdir)/simdmath.h.in
+ cd $(top_builddir) && $(SHELL) ./config.status $@
omp_lib.f90: $(top_builddir)/config.status $(srcdir)/omp_lib.f90.in
cd $(top_builddir) && $(SHELL) ./config.status $@
libgomp_f.h: $(top_builddir)/config.status $(srcdir)/libgomp_f.h.in
diff -Nurp a/libgomp/simdmath_f.h.in b/libgomp/simdmath_f.h.in
--- a/libgomp/simdmath_f.h.in 1970-01-01 08:00:00.000000000 +0800
+++ b/libgomp/simdmath_f.h.in 2021-01-07 16:13:23.196000000 +0800
@@ -0,0 +1,11 @@
+!GCC$ builtin (cos) attributes simd (notinbranch)
+!GCC$ builtin (cosf) attributes simd (notinbranch)
+!GCC$ builtin (sin) attributes simd (notinbranch)
+!GCC$ builtin (sinf) attributes simd (notinbranch)
+!GCC$ builtin (exp) attributes simd (notinbranch)
+!GCC$ builtin (expf) attributes simd (notinbranch)
+!GCC$ builtin (exp2f) attributes simd (notinbranch)
+!GCC$ builtin (log) attributes simd (notinbranch)
+!GCC$ builtin (logf) attributes simd (notinbranch)
+!GCC$ builtin (pow) attributes simd (notinbranch)
+!GCC$ builtin (powf) attributes simd (notinbranch)
diff -Nurp a/libgomp/simdmath.h.in b/libgomp/simdmath.h.in
--- a/libgomp/simdmath.h.in 1970-01-01 08:00:00.000000000 +0800
+++ b/libgomp/simdmath.h.in 2021-01-07 16:13:56.144000000 +0800
@@ -0,0 +1,40 @@
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#pragma omp declare simd simdlen(2) notinbranch
+double cos (double x);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float cosf (float x);
+
+#pragma omp declare simd simdlen(2) notinbranch
+double sin (double x);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float sinf (float x);
+
+#pragma omp declare simd simdlen(2) notinbranch
+double exp (double x);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float expf (float x);
+
+#pragma omp declare simd simdlen(2) notinbranch
+double log (double x);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float logf (float x);
+
+#pragma omp declare simd simdlen(2) notinbranch
+double pow (double x, double y);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float powf (float x, float y);
+
+#pragma omp declare simd simdlen(4) notinbranch
+float exp2f (float x);
+
+#ifdef __cplusplus
+} // extern "C"
+#endif

View File

@ -0,0 +1,18 @@
This backport contains 1 patch from gcc main stream tree.
The commit IDs of these patches are listed below in chronological order.
0001-fix-CTOR-vectorization.patch
3d42842c07f4143042f3dcc39a050b262bcf1b55
diff --git a/gcc/tree-vect-slp.c b/gcc/tree-vect-slp.c
index 9d17e3386fa..fb13af7965e 100644
--- a/gcc/tree-vect-slp.c
+++ b/gcc/tree-vect-slp.c
@@ -2257,6 +2257,7 @@ vect_analyze_slp_instance (vec_info *vinfo,
/* Value is defined in another basic block. */
if (!def_info)
return false;
+ def_info = vect_stmt_to_vectorize (def_info);
scalar_stmts.safe_push (def_info);
}
else

View File

@ -0,0 +1,79 @@
commit ee80f0c6ba50ebf0300fb0cfe1079a1321295749
Author: Richard Biener <rguenther@suse.de>
Date: Thu Oct 24 11:23:54 2019 +0000
re PR tree-optimization/92203 (ICE in eliminate_stmt, at tree-ssa-sccvn.c:5492)
2019-10-24 Richard Biener <rguenther@suse.de>
PR tree-optimization/92203
* treee-ssa-sccvn.c (eliminate_dom_walker::eliminate_stmt):
Skip eliminating conversion stmts inserted by insertion.
* gcc.dg/torture/pr92203.c: New testcase.
From-SVN: r277374
diff --git a/gcc/testsuite/gcc.dg/torture/pr92203.c b/gcc/testsuite/gcc.dg/torture/pr92203.c
new file mode 100644
index 00000000000..c752969d5e5
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/torture/pr92203.c
@@ -0,0 +1,37 @@
+/* { dg-do compile } */
+/* { dg-additional-options "-Wno-div-by-zero" } */
+
+unsigned long int rr;
+
+void
+cw (int z9)
+{
+ int m5;
+ unsigned long int vz = 0;
+ long int *na;
+
+ if (z9 == 0)
+ rr = 0;
+ else
+ {
+ na = (long int *) &m5;
+ for (*na = 0; *na < 1; ++*na)
+ {
+ na = (long int *) &vz;
+ rr /= 0;
+ }
+ }
+
+ m5 = rr / 5;
+ ++vz;
+ if (vz != 0)
+ while (z9 < 1)
+ {
+ if (m5 >= 0)
+ rr += m5;
+
+ na = (long int *) &rr;
+ if (*na >= 0)
+ rr = 0;
+ }
+}
diff --git a/gcc/tree-ssa-sccvn.c b/gcc/tree-ssa-sccvn.c
index 57331ab44dc..3872168a4ed 100644
--- a/gcc/tree-ssa-sccvn.c
+++ b/gcc/tree-ssa-sccvn.c
@@ -5459,8 +5459,13 @@ eliminate_dom_walker::eliminate_stmt (basic_block b, gimple_stmt_iterator *gsi)
/* If this is an assignment from our leader (which
happens in the case the value-number is a constant)
- then there is nothing to do. */
- if (gimple_assign_single_p (stmt)
+ then there is nothing to do. Likewise if we run into
+ inserted code that needed a conversion because of
+ our type-agnostic value-numbering of loads. */
+ if ((gimple_assign_single_p (stmt)
+ || (is_gimple_assign (stmt)
+ && (CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt))
+ || gimple_assign_rhs_code (stmt) == VIEW_CONVERT_EXPR)))
&& sprime == gimple_assign_rhs1 (stmt))
return;

1037
fix-ICE-in-vect.patch Normal file

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,74 @@
This backport contains 1 patch from gcc main stream tree.
The commit IDs of these patches are listed below in chronological order.
0001-tree-optimization-98117-fix-range-set-by-vectorizati.patch
cdcbef3c3310a14f2994982b44cb1f8e14c77232
diff --git a/gcc/testsuite/gcc.dg/torture/pr98117.c b/gcc/testsuite/gcc.dg/torture/pr98117.c
new file mode 100644
index 00000000000..f2160257263
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/torture/pr98117.c
@@ -0,0 +1,19 @@
+/* { dg-do run } */
+/* { dg-additional-options "-fno-tree-scev-cprop" } */
+
+unsigned char c;
+void __attribute__((noipa))
+e()
+{
+ do
+ {
+ }
+ while (++c);
+}
+int main()
+{
+ e();
+ if (c != 0)
+ __builtin_abort ();
+ return 0;
+}
diff --git a/gcc/tree-vect-loop-manip.c b/gcc/tree-vect-loop-manip.c
index 36179188f6d..2370b879b21 100644
--- a/gcc/tree-vect-loop-manip.c
+++ b/gcc/tree-vect-loop-manip.c
@@ -2034,13 +2034,29 @@ vect_gen_vector_loop_niters (loop_vec_info loop_vinfo, tree niters,
niters_vector = force_gimple_operand (niters_vector, &stmts, true, var);
gsi_insert_seq_on_edge_immediate (pe, stmts);
/* Peeling algorithm guarantees that vector loop bound is at least ONE,
- we set range information to make niters analyzer's life easier. */
+ we set range information to make niters analyzer's life easier.
+ Note the number of latch iteration value can be TYPE_MAX_VALUE so
+ we have to represent the vector niter TYPE_MAX_VALUE + 1 >> log_vf. */
if (stmts != NULL && log_vf)
- set_range_info (niters_vector, VR_RANGE,
- wi::to_wide (build_int_cst (type, 1)),
- wi::to_wide (fold_build2 (RSHIFT_EXPR, type,
- TYPE_MAX_VALUE (type),
- log_vf)));
+ {
+ if (niters_no_overflow)
+ set_range_info (niters_vector, VR_RANGE,
+ wi::one (TYPE_PRECISION (type)),
+ wi::rshift (wi::max_value (TYPE_PRECISION (type),
+ TYPE_SIGN (type)),
+ exact_log2 (const_vf),
+ TYPE_SIGN (type)));
+ /* For VF == 1 the vector IV might also overflow so we cannot
+ assert a minimum value of 1. */
+ else if (const_vf > 1)
+ set_range_info (niters_vector, VR_RANGE,
+ wi::one (TYPE_PRECISION (type)),
+ wi::rshift (wi::max_value (TYPE_PRECISION (type),
+ TYPE_SIGN (type))
+ - (const_vf - 1),
+ exact_log2 (const_vf), TYPE_SIGN (type))
+ + 1);
+ }
}
*niters_vector_ptr = niters_vector;
*step_vector_ptr = step_vector;
--
2.19.1

View File

@ -1,4 +1,4 @@
%global DATE 20210204 %global DATE 20210428
%global gcc_version 9.3.1 %global gcc_version 9.3.1
%global gcc_major 9.3.1 %global gcc_major 9.3.1
@ -59,7 +59,7 @@
Summary: Various compilers (C, C++, Objective-C, ...) Summary: Various compilers (C, C++, Objective-C, ...)
Name: gcc Name: gcc
Version: %{gcc_version} Version: %{gcc_version}
Release: %{DATE}.18 Release: %{DATE}.19
License: GPLv3+ and GPLv3+ with exceptions and GPLv2+ with exceptions and LGPLv2+ and BSD License: GPLv3+ and GPLv3+ with exceptions and GPLv2+ with exceptions and LGPLv2+ and BSD
URL: https://gcc.gnu.org URL: https://gcc.gnu.org
@ -221,10 +221,21 @@ Patch104: fix-avx512vl-vcvttpd2dq-2-fail.patch
Patch105: fix-issue604-ldist-dependency-fixup.patch Patch105: fix-issue604-ldist-dependency-fixup.patch
Patch106: Apply-maximum-nunits-for-BB-SLP.patch Patch106: Apply-maximum-nunits-for-BB-SLP.patch
Patch107: Fix-interaction-between-aka-changes-and-DR1558.patch Patch107: Fix-interaction-between-aka-changes-and-DR1558.patch
Patch108: Handle-POLY_INT_CSTs-in-declare_return_value.patch Patch108: fix-range-set-by-vectorization-on-niter-IVs.patch
Patch109: Handle-POLY_INT_CST-in-copy_reference_ops_from_ref.patch Patch109: optabs-Dont-use-scalar-conversions-for-vectors.patch
Patch110: fix-strncpy-inline-warning.patch Patch110: add-fp-model-options.patch
Patch111: fix-CTOR-vectorization.patch
Patch112: PR92429-do-not-fold-when-updating.patch
Patch113: Handle-POLY_INT_CSTs-in-declare_return_value.patch
Patch114: Handle-POLY_INT_CST-in-copy_reference_ops_from_ref.patch
Patch115: fix-strncpy-inline-warning.patch
Patch116: fix-ICE-in-vect.patch
Patch118: Fix-type-mismatch-in-SLPed-constructors.patch
Patch119: add-check-for-pressure-in-sche1.patch
Patch120: revert-moutline-atomics.patch
Patch121: fix-ICE-in-eliminate-stmt.patch
Patch122: revise-type-before-build-MULT.patch
Patch123: Simplify-X-C1-C2.patch
%global gcc_target_platform %{_arch}-linux-gnu %global gcc_target_platform %{_arch}-linux-gnu
@ -777,6 +788,18 @@ not stable, so plugins must be rebuilt any time GCC is updated.
%patch108 -p1 %patch108 -p1
%patch109 -p1 %patch109 -p1
%patch110 -p1 %patch110 -p1
%patch111 -p1
%patch112 -p1
%patch113 -p1
%patch114 -p1
%patch115 -p1
%patch116 -p1
%patch118 -p1
%patch119 -p1
%patch120 -p1
%patch121 -p1
%patch122 -p1
%patch123 -p1
%build %build
@ -1803,6 +1826,7 @@ end
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/stdnoreturn.h %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/stdnoreturn.h
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/stdatomic.h %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/stdatomic.h
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/gcov.h %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/gcov.h
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/simdmath.h
%ifarch %{ix86} x86_64 %ifarch %{ix86} x86_64
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/mmintrin.h %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/mmintrin.h
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/xmmintrin.h %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/include/xmmintrin.h
@ -2230,6 +2254,7 @@ end
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_arithmetic.mod %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_arithmetic.mod
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_exceptions.mod %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_exceptions.mod
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_features.mod %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/ieee_features.mod
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/finclude/simdmath_f.h
%{_prefix}/libexec/gcc/%{gcc_target_platform}/%{gcc_major}/f951 %{_prefix}/libexec/gcc/%{gcc_target_platform}/%{gcc_major}/f951
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/libgfortran.spec %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/libgfortran.spec
%{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/libcaf_single.a %{_prefix}/lib/gcc/%{gcc_target_platform}/%{gcc_major}/libcaf_single.a
@ -2707,6 +2732,24 @@ end
%doc rpm.doc/changelogs/libcc1/ChangeLog* %doc rpm.doc/changelogs/libcc1/ChangeLog*
%changelog %changelog
* Wed Apr 28 2021 eastb233 <xiezhiheng@huawei.com> - 9.3.1-20210428.19
- add-fp-model-options.patch: New file
- enable-simd-math.patch: Enable simd math library in C and Fortran
- fix-CTOR-vectorization.patch: New file
- fix-range-set-by-vectorization-on-niter-IVs.patch: New file
- medium-code-mode.patch: Fix bugs when used with fpic
- optabs-Dont-use-scalar-conversions-for-vectors.patch: New file
- PR92429-do-not-fold-when-updating.patch: New file
- redundant-loop-elimination.patch: Fix some programming specifications
- fix-ICE-in-vect.patch: New file
- Fix-type-mismatch-in-SLPed-constructors.patch: New file
- add-check-for-pressure-in-sche1.patch: New file
- revert-moutline-atomics.patch: New file
- fix-ICE-in-eliminate-stmt.patch: New file
- revise-type-before-build-MULT.patch: New file
- Simplify-X-C1-C2.patch: New file
- gcc.spec: Add new patches
* Wed Apr 21 2021 eastb233 <xiezhiheng@huawei.com> - 9.3.1-20210204.18 * Wed Apr 21 2021 eastb233 <xiezhiheng@huawei.com> - 9.3.1-20210204.18
- Type:bugfix - Type:bugfix
- ID:NA - ID:NA

View File

@ -1,7 +1,7 @@
diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
--- a/gcc/config/aarch64/aarch64.c 2020-07-16 14:54:30.588000000 +0800 --- a/gcc/config/aarch64/aarch64.c 2021-02-18 11:03:29.728000000 +0800
+++ b/gcc/config/aarch64/aarch64.c 2020-07-16 15:06:33.000000000 +0800 +++ b/gcc/config/aarch64/aarch64.c 2021-02-18 14:59:54.432000000 +0800
@@ -2030,6 +2030,32 @@ aarch64_load_symref_appropriately (rtx d @@ -2417,6 +2417,29 @@ aarch64_load_symref_appropriately (rtx d
emit_insn (gen_add_losym (dest, tmp_reg, imm)); emit_insn (gen_add_losym (dest, tmp_reg, imm));
return; return;
} }
@ -16,25 +16,22 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ +
+ if (mode == DImode) + if (mode == DImode)
+ { + {
+ emit_insn ( + emit_insn (gen_load_symbol_medium_di (dest, tmp_reg, imm));
+ gen_load_symbol_medium_di (dest, tmp_reg, imm));
+ } + }
+ else + else
+ { + {
+ emit_insn ( + emit_insn (gen_load_symbol_medium_si (dest, tmp_reg, imm));
+ gen_load_symbol_medium_si (dest, tmp_reg, imm));
+ } + }
+ if (REG_P (dest)) + if (REG_P (dest))
+ { + {
+ set_unique_reg_note ( + set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (imm));
+ get_last_insn (), REG_EQUIV, copy_rtx (imm));
+ } + }
+ return; + return;
+ } + }
case SYMBOL_TINY_ABSOLUTE: case SYMBOL_TINY_ABSOLUTE:
emit_insn (gen_rtx_SET (dest, imm)); emit_insn (gen_rtx_SET (dest, imm));
@@ -2152,6 +2178,64 @@ aarch64_load_symref_appropriately (rtx d @@ -2539,6 +2562,60 @@ aarch64_load_symref_appropriately (rtx d
return; return;
} }
@ -52,18 +49,15 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ +
+ if (mode == DImode) + if (mode == DImode)
+ { + {
+ emit_insn ( + emit_insn (gen_load_symbol_medium_di (tmp_reg, dest, s));
+ gen_load_symbol_medium_di (tmp_reg, dest, s));
+ } + }
+ else + else
+ { + {
+ emit_insn ( + emit_insn (gen_load_symbol_medium_si (tmp_reg, dest, s));
+ gen_load_symbol_medium_si (tmp_reg, dest, s));
+ } + }
+ if (REG_P (dest)) + if (REG_P (dest))
+ { + {
+ set_unique_reg_note ( + set_unique_reg_note (get_last_insn (), REG_EQUAL, copy_rtx (s));
+ get_last_insn (), REG_EQUIV, copy_rtx (s));
+ } + }
+ +
+ if (mode == ptr_mode) + if (mode == ptr_mode)
@ -71,14 +65,12 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ if (mode == DImode) + if (mode == DImode)
+ { + {
+ emit_insn (gen_get_gotoff_di (dest, imm)); + emit_insn (gen_get_gotoff_di (dest, imm));
+ insn = gen_ldr_got_medium_di ( + insn = gen_ldr_got_medium_di (dest, tmp_reg, dest);
+ dest, tmp_reg, dest);
+ } + }
+ else + else
+ { + {
+ emit_insn (gen_get_gotoff_si (dest, imm)); + emit_insn (gen_get_gotoff_si (dest, imm));
+ insn = gen_ldr_got_medium_si ( + insn = gen_ldr_got_medium_si (dest, tmp_reg, dest);
+ dest, tmp_reg, dest);
+ } + }
+ mem = XVECEXP (SET_SRC (insn), 0, 0); + mem = XVECEXP (SET_SRC (insn), 0, 0);
+ } + }
@ -96,10 +88,11 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ emit_insn (insn); + emit_insn (insn);
+ return; + return;
+ } + }
+
case SYMBOL_SMALL_TLSGD: case SYMBOL_SMALL_TLSGD:
{ {
rtx_insn *insns; rtx_insn *insns;
@@ -3372,11 +3456,12 @@ aarch64_expand_mov_immediate (rtx dest, @@ -4531,11 +4608,12 @@ aarch64_expand_mov_immediate (rtx dest,
return; return;
@ -114,7 +107,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
case SYMBOL_TINY_GOT: case SYMBOL_TINY_GOT:
case SYMBOL_TINY_TLSIE: case SYMBOL_TINY_TLSIE:
if (const_offset != 0) if (const_offset != 0)
@@ -3395,6 +3480,7 @@ aarch64_expand_mov_immediate (rtx dest, @@ -4554,6 +4632,7 @@ aarch64_expand_mov_immediate (rtx dest,
case SYMBOL_TLSLE24: case SYMBOL_TLSLE24:
case SYMBOL_TLSLE32: case SYMBOL_TLSLE32:
case SYMBOL_TLSLE48: case SYMBOL_TLSLE48:
@ -122,7 +115,38 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
aarch64_load_symref_appropriately (dest, imm, sty); aarch64_load_symref_appropriately (dest, imm, sty);
return; return;
@@ -10334,6 +10420,13 @@ cost_plus: @@ -8450,7 +8529,14 @@ aarch64_classify_address (struct aarch64
split_const (info->offset, &sym, &offs);
if (GET_CODE (sym) == SYMBOL_REF
&& (aarch64_classify_symbol (sym, INTVAL (offs))
- == SYMBOL_SMALL_ABSOLUTE))
+ == SYMBOL_SMALL_ABSOLUTE
+ /* Fix fail on dbl_mov_immediate_1.c. If end up here with
+ MEDIUM_ABSOLUTE, the symbol is a constant number that is
+ forced to memory in reload pass, which is ok to go on with
+ the original design that subtitude the mov to
+ 'adrp and ldr :losum'. */
+ || aarch64_classify_symbol (sym, INTVAL (offs))
+ == SYMBOL_MEDIUM_ABSOLUTE))
{
/* The symbol and offset must be aligned to the access size. */
unsigned int align;
@@ -10365,7 +10451,13 @@ static inline bool
aarch64_can_use_per_function_literal_pools_p (void)
{
return (aarch64_pcrelative_literal_loads
- || aarch64_cmodel == AARCH64_CMODEL_LARGE);
+ || aarch64_cmodel == AARCH64_CMODEL_LARGE
+ /* Fix const9.C so that constants goes to function_literal_pools.
+ According to the orignal design of aarch64 mcmodel=medium, we
+ don't care where this symbol is put. For the benefit of code size
+ and behaviour consistent with other mcmodel, put it into
+ function_literal_pools. */
+ || aarch64_cmodel == AARCH64_CMODEL_MEDIUM);
}
static bool
@@ -11993,6 +12085,13 @@ cost_plus:
if (speed) if (speed)
*cost += extra_cost->alu.arith; *cost += extra_cost->alu.arith;
} }
@ -136,7 +160,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
if (flag_pic) if (flag_pic)
{ {
@@ -10341,6 +10434,8 @@ cost_plus: @@ -12000,6 +12099,8 @@ cost_plus:
*cost += COSTS_N_INSNS (1); *cost += COSTS_N_INSNS (1);
if (speed) if (speed)
*cost += extra_cost->ldst.load; *cost += extra_cost->ldst.load;
@ -145,7 +169,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
} }
return true; return true;
@@ -11395,6 +11490,7 @@ initialize_aarch64_tls_size (struct gcc_ @@ -13176,6 +13277,7 @@ initialize_aarch64_tls_size (struct gcc_
if (aarch64_tls_size > 32) if (aarch64_tls_size > 32)
aarch64_tls_size = 32; aarch64_tls_size = 32;
break; break;
@ -153,7 +177,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
case AARCH64_CMODEL_LARGE: case AARCH64_CMODEL_LARGE:
/* The maximum TLS size allowed under large is 16E. /* The maximum TLS size allowed under large is 16E.
FIXME: 16E should be 64bit, we only support 48bit offset now. */ FIXME: 16E should be 64bit, we only support 48bit offset now. */
@@ -12187,6 +12283,9 @@ initialize_aarch64_code_model (struct gc @@ -13968,6 +14070,9 @@ initialize_aarch64_code_model (struct gc
aarch64_cmodel = AARCH64_CMODEL_SMALL_PIC; aarch64_cmodel = AARCH64_CMODEL_SMALL_PIC;
#endif #endif
break; break;
@ -163,7 +187,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
case AARCH64_CMODEL_LARGE: case AARCH64_CMODEL_LARGE:
sorry ("code model %qs with %<-f%s%>", "large", sorry ("code model %qs with %<-f%s%>", "large",
opts->x_flag_pic > 1 ? "PIC" : "pic"); opts->x_flag_pic > 1 ? "PIC" : "pic");
@@ -12205,6 +12304,7 @@ static void @@ -13986,6 +14091,7 @@ static void
aarch64_option_save (struct cl_target_option *ptr, struct gcc_options *opts) aarch64_option_save (struct cl_target_option *ptr, struct gcc_options *opts)
{ {
ptr->x_aarch64_override_tune_string = opts->x_aarch64_override_tune_string; ptr->x_aarch64_override_tune_string = opts->x_aarch64_override_tune_string;
@ -171,7 +195,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
ptr->x_aarch64_branch_protection_string ptr->x_aarch64_branch_protection_string
= opts->x_aarch64_branch_protection_string; = opts->x_aarch64_branch_protection_string;
} }
@@ -12220,6 +12320,7 @@ aarch64_option_restore (struct gcc_optio @@ -14001,6 +14107,7 @@ aarch64_option_restore (struct gcc_optio
opts->x_explicit_arch = ptr->x_explicit_arch; opts->x_explicit_arch = ptr->x_explicit_arch;
selected_arch = aarch64_get_arch (ptr->x_explicit_arch); selected_arch = aarch64_get_arch (ptr->x_explicit_arch);
opts->x_aarch64_override_tune_string = ptr->x_aarch64_override_tune_string; opts->x_aarch64_override_tune_string = ptr->x_aarch64_override_tune_string;
@ -179,7 +203,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
opts->x_aarch64_branch_protection_string opts->x_aarch64_branch_protection_string
= ptr->x_aarch64_branch_protection_string; = ptr->x_aarch64_branch_protection_string;
if (opts->x_aarch64_branch_protection_string) if (opts->x_aarch64_branch_protection_string)
@@ -13067,6 +13168,8 @@ aarch64_classify_symbol (rtx x, HOST_WID @@ -14868,6 +14975,8 @@ aarch64_classify_symbol (rtx x, HOST_WID
case AARCH64_CMODEL_SMALL_SPIC: case AARCH64_CMODEL_SMALL_SPIC:
case AARCH64_CMODEL_SMALL_PIC: case AARCH64_CMODEL_SMALL_PIC:
@ -188,7 +212,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
case AARCH64_CMODEL_SMALL: case AARCH64_CMODEL_SMALL:
return SYMBOL_SMALL_ABSOLUTE; return SYMBOL_SMALL_ABSOLUTE;
@@ -13100,6 +13203,7 @@ aarch64_classify_symbol (rtx x, HOST_WID @@ -14904,6 +15013,7 @@ aarch64_classify_symbol (rtx x, HOST_WID
return SYMBOL_TINY_ABSOLUTE; return SYMBOL_TINY_ABSOLUTE;
case AARCH64_CMODEL_SMALL: case AARCH64_CMODEL_SMALL:
@ -196,7 +220,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
/* Same reasoning as the tiny code model, but the offset cap here is /* Same reasoning as the tiny code model, but the offset cap here is
1MB, allowing +/-3.9GB for the offset to the symbol. */ 1MB, allowing +/-3.9GB for the offset to the symbol. */
@@ -13121,7 +13225,48 @@ aarch64_classify_symbol (rtx x, HOST_WID @@ -14927,7 +15037,50 @@ aarch64_classify_symbol (rtx x, HOST_WID
? SYMBOL_SMALL_GOT_28K : SYMBOL_SMALL_GOT_4G); ? SYMBOL_SMALL_GOT_28K : SYMBOL_SMALL_GOT_4G);
return SYMBOL_SMALL_ABSOLUTE; return SYMBOL_SMALL_ABSOLUTE;
@ -206,8 +230,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ if (decl_local != NULL + if (decl_local != NULL
+ && tree_fits_uhwi_p (DECL_SIZE_UNIT (decl_local))) + && tree_fits_uhwi_p (DECL_SIZE_UNIT (decl_local)))
+ { + {
+ HOST_WIDE_INT size = tree_to_uhwi ( + HOST_WIDE_INT size = tree_to_uhwi (DECL_SIZE_UNIT (decl_local));
+ DECL_SIZE_UNIT (decl_local));
+ /* If the data is smaller than the threshold, goto + /* If the data is smaller than the threshold, goto
+ the small code model. Else goto the large code + the small code model. Else goto the large code
+ model. */ + model. */
@ -223,13 +246,15 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ if (decl_local != NULL + if (decl_local != NULL
+ && tree_fits_uhwi_p (DECL_SIZE_UNIT (decl_local))) + && tree_fits_uhwi_p (DECL_SIZE_UNIT (decl_local)))
+ { + {
+ HOST_WIDE_INT size = tree_to_uhwi ( + HOST_WIDE_INT size = tree_to_uhwi (DECL_SIZE_UNIT (decl_local));
+ DECL_SIZE_UNIT (decl_local));
+ if (size < HOST_WIDE_INT (aarch64_data_threshold)) + if (size < HOST_WIDE_INT (aarch64_data_threshold))
+ { + {
+ if (!aarch64_symbol_binds_local_p (x)) + if (!aarch64_symbol_binds_local_p (x))
+ { + {
+ return SYMBOL_SMALL_GOT_4G; + /* flag_pic is 2 only when -fPIC is on, when we should
+ use 4G GOT. */
+ return flag_pic == 2 ? SYMBOL_SMALL_GOT_4G
+ : SYMBOL_SMALL_GOT_28K ;
+ } + }
+ return SYMBOL_SMALL_ABSOLUTE; + return SYMBOL_SMALL_ABSOLUTE;
+ } + }
@ -240,12 +265,13 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
+ } + }
+ return SYMBOL_MEDIUM_ABSOLUTE; + return SYMBOL_MEDIUM_ABSOLUTE;
+ } + }
+
case AARCH64_CMODEL_LARGE: case AARCH64_CMODEL_LARGE:
+ AARCH64_LARGE_ROUTINE: + AARCH64_LARGE_ROUTINE:
/* This is alright even in PIC code as the constant /* This is alright even in PIC code as the constant
pool reference is always PC relative and within pool reference is always PC relative and within
the same translation unit. */ the same translation unit. */
@@ -15364,6 +15509,8 @@ aarch64_asm_preferred_eh_data_format (in @@ -17789,6 +17942,8 @@ aarch64_asm_preferred_eh_data_format (in
case AARCH64_CMODEL_SMALL: case AARCH64_CMODEL_SMALL:
case AARCH64_CMODEL_SMALL_PIC: case AARCH64_CMODEL_SMALL_PIC:
case AARCH64_CMODEL_SMALL_SPIC: case AARCH64_CMODEL_SMALL_SPIC:
@ -254,17 +280,23 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
/* text+got+data < 4Gb. 4-byte signed relocs are sufficient /* text+got+data < 4Gb. 4-byte signed relocs are sufficient
for everything. */ for everything. */
type = DW_EH_PE_sdata4; type = DW_EH_PE_sdata4;
@@ -18454,7 +18601,8 @@ aarch64_empty_mask_is_expensive (unsigne @@ -21014,7 +21169,14 @@ aarch64_empty_mask_is_expensive (unsigne
bool bool
aarch64_use_pseudo_pic_reg (void) aarch64_use_pseudo_pic_reg (void)
{ {
- return aarch64_cmodel == AARCH64_CMODEL_SMALL_SPIC; - return aarch64_cmodel == AARCH64_CMODEL_SMALL_SPIC;
+ /* flag_pic is 2 when -fPIC is on, where we do not need the pseudo
+ pic reg. In medium code mode, when combine with -fpie/-fpic, there are
+ possibility that some symbol size smaller than the -mlarge-data-threshold
+ will still use SMALL_SPIC relocation, which need the pseudo pic reg.
+ Fix spill_1.c fail. */
+ return aarch64_cmodel == AARCH64_CMODEL_SMALL_SPIC + return aarch64_cmodel == AARCH64_CMODEL_SMALL_SPIC
+ || aarch64_cmodel == AARCH64_CMODEL_MEDIUM_PIC ; + || (aarch64_cmodel == AARCH64_CMODEL_MEDIUM_PIC
+ && flag_pic != 2);
} }
/* Implement TARGET_UNSPEC_MAY_TRAP_P. */ /* Implement TARGET_UNSPEC_MAY_TRAP_P. */
@@ -18464,6 +18612,7 @@ aarch64_unspec_may_trap_p (const_rtx x, @@ -21024,6 +21186,7 @@ aarch64_unspec_may_trap_p (const_rtx x,
{ {
switch (XINT (x, 1)) switch (XINT (x, 1))
{ {
@ -273,8 +305,8 @@ diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
case UNSPEC_GOTSMALLPIC28K: case UNSPEC_GOTSMALLPIC28K:
case UNSPEC_GOTTINYPIC: case UNSPEC_GOTTINYPIC:
diff -Nurp a/gcc/config/aarch64/aarch64.h b/gcc/config/aarch64/aarch64.h diff -Nurp a/gcc/config/aarch64/aarch64.h b/gcc/config/aarch64/aarch64.h
--- a/gcc/config/aarch64/aarch64.h 2020-07-16 14:54:30.592000000 +0800 --- a/gcc/config/aarch64/aarch64.h 2021-02-18 11:03:28.336000000 +0800
+++ b/gcc/config/aarch64/aarch64.h 2020-07-16 14:55:05.672000000 +0800 +++ b/gcc/config/aarch64/aarch64.h 2021-02-18 10:57:45.488000000 +0800
@@ -33,6 +33,10 @@ @@ -33,6 +33,10 @@
#define REGISTER_TARGET_PRAGMAS() aarch64_register_pragmas () #define REGISTER_TARGET_PRAGMAS() aarch64_register_pragmas ()
@ -287,9 +319,9 @@ diff -Nurp a/gcc/config/aarch64/aarch64.h b/gcc/config/aarch64/aarch64.h
#define PROMOTE_MODE(MODE, UNSIGNEDP, TYPE) \ #define PROMOTE_MODE(MODE, UNSIGNEDP, TYPE) \
diff -Nurp a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md diff -Nurp a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
--- a/gcc/config/aarch64/aarch64.md 2020-07-16 14:54:30.588000000 +0800 --- a/gcc/config/aarch64/aarch64.md 2021-02-18 11:03:28.340000000 +0800
+++ b/gcc/config/aarch64/aarch64.md 2020-07-16 14:55:05.676000000 +0800 +++ b/gcc/config/aarch64/aarch64.md 2021-02-18 10:57:45.488000000 +0800
@@ -209,6 +209,11 @@ @@ -224,6 +224,11 @@
UNSPEC_RSQRTS UNSPEC_RSQRTS
UNSPEC_NZCV UNSPEC_NZCV
UNSPEC_XPACLRI UNSPEC_XPACLRI
@ -301,7 +333,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
UNSPEC_LD1_SVE UNSPEC_LD1_SVE
UNSPEC_ST1_SVE UNSPEC_ST1_SVE
UNSPEC_LDNT1_SVE UNSPEC_LDNT1_SVE
@@ -6548,6 +6553,39 @@ @@ -6689,6 +6694,39 @@
[(set_attr "type" "load_4")] [(set_attr "type" "load_4")]
) )
@ -341,7 +373,7 @@ diff -Nurp a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
(define_insn "ldr_got_small_28k_<mode>" (define_insn "ldr_got_small_28k_<mode>"
[(set (match_operand:PTR 0 "register_operand" "=r") [(set (match_operand:PTR 0 "register_operand" "=r")
(unspec:PTR [(mem:PTR (lo_sum:PTR (unspec:PTR [(mem:PTR (lo_sum:PTR
@@ -6709,6 +6747,23 @@ @@ -6852,6 +6890,23 @@
(set_attr "length" "12")] (set_attr "length" "12")]
) )
@ -366,8 +398,8 @@ diff -Nurp a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
[(unspec:PTR [(match_operand 0 "aarch64_valid_symref")] UNSPEC_TLSDESC)] [(unspec:PTR [(match_operand 0 "aarch64_valid_symref")] UNSPEC_TLSDESC)]
"TARGET_TLS_DESC" "TARGET_TLS_DESC"
diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt
--- a/gcc/config/aarch64/aarch64.opt 2020-07-16 14:54:30.580000000 +0800 --- a/gcc/config/aarch64/aarch64.opt 2021-02-18 11:03:28.340000000 +0800
+++ b/gcc/config/aarch64/aarch64.opt 2020-07-16 14:55:05.676000000 +0800 +++ b/gcc/config/aarch64/aarch64.opt 2021-02-18 10:57:45.488000000 +0800
@@ -27,6 +27,10 @@ enum aarch64_processor explicit_tune_cor @@ -27,6 +27,10 @@ enum aarch64_processor explicit_tune_cor
TargetVariable TargetVariable
enum aarch64_arch explicit_arch = aarch64_no_arch enum aarch64_arch explicit_arch = aarch64_no_arch
@ -396,8 +428,8 @@ diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt
Target Report RejectNegative Mask(BIG_END) Target Report RejectNegative Mask(BIG_END)
Assume target CPU is configured as big endian. Assume target CPU is configured as big endian.
diff -Nurp a/gcc/config/aarch64/aarch64-opts.h b/gcc/config/aarch64/aarch64-opts.h diff -Nurp a/gcc/config/aarch64/aarch64-opts.h b/gcc/config/aarch64/aarch64-opts.h
--- a/gcc/config/aarch64/aarch64-opts.h 2020-07-16 14:54:30.584000000 +0800 --- a/gcc/config/aarch64/aarch64-opts.h 2020-03-12 19:07:21.000000000 +0800
+++ b/gcc/config/aarch64/aarch64-opts.h 2020-07-16 14:55:05.676000000 +0800 +++ b/gcc/config/aarch64/aarch64-opts.h 2021-02-18 10:57:45.488000000 +0800
@@ -66,6 +66,10 @@ enum aarch64_code_model { @@ -66,6 +66,10 @@ enum aarch64_code_model {
/* -fpic for small memory model. /* -fpic for small memory model.
GOT size to 28KiB (4K*8-4K) or 3580 entries. */ GOT size to 28KiB (4K*8-4K) or 3580 entries. */
@ -410,8 +442,8 @@ diff -Nurp a/gcc/config/aarch64/aarch64-opts.h b/gcc/config/aarch64/aarch64-opts
The PIC variant is not yet implemented. */ The PIC variant is not yet implemented. */
AARCH64_CMODEL_LARGE AARCH64_CMODEL_LARGE
diff -Nurp a/gcc/config/aarch64/aarch64-protos.h b/gcc/config/aarch64/aarch64-protos.h diff -Nurp a/gcc/config/aarch64/aarch64-protos.h b/gcc/config/aarch64/aarch64-protos.h
--- a/gcc/config/aarch64/aarch64-protos.h 2020-07-16 14:54:30.584000000 +0800 --- a/gcc/config/aarch64/aarch64-protos.h 2021-02-18 11:03:29.432000000 +0800
+++ b/gcc/config/aarch64/aarch64-protos.h 2020-07-16 14:55:05.676000000 +0800 +++ b/gcc/config/aarch64/aarch64-protos.h 2021-02-18 10:57:45.488000000 +0800
@@ -95,9 +95,11 @@ @@ -95,9 +95,11 @@
*/ */
enum aarch64_symbol_type enum aarch64_symbol_type

View File

@ -0,0 +1,69 @@
This backport contains 1 patch from the GCC mainstream (upstream) tree.
The commit IDs of these patches are listed below in chronological order.
0001-optabs-Don-t-use-scalar-conversions-for-vectors-PR93.patch
b6268016bf46dd63227dcbb73d13c30a3b4b9d2a
diff --git a/gcc/optabs-tree.c b/gcc/optabs-tree.c
index 3d829c27826..badd30bfda8 100644
--- a/gcc/optabs-tree.c
+++ b/gcc/optabs-tree.c
@@ -284,9 +284,14 @@ supportable_convert_operation (enum tree_code code,
machine_mode m1,m2;
bool truncp;
+ gcc_assert (VECTOR_TYPE_P (vectype_out) && VECTOR_TYPE_P (vectype_in));
+
m1 = TYPE_MODE (vectype_out);
m2 = TYPE_MODE (vectype_in);
+ if (!VECTOR_MODE_P (m1) || !VECTOR_MODE_P (m2))
+ return false;
+
/* First check if we can done conversion directly. */
if ((code == FIX_TRUNC_EXPR
&& can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
diff --git a/gcc/testsuite/gcc.dg/vect/pr93843-1.c b/gcc/testsuite/gcc.dg/vect/pr93843-1.c
new file mode 100644
index 00000000000..23a79ca4c96
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr93843-1.c
@@ -0,0 +1,21 @@
+char a;
+struct S { short b, c; } d;
+
+__attribute__((noipa)) void
+foo (int x)
+{
+ if (x != 4)
+ __builtin_abort ();
+}
+
+int
+main ()
+{
+ short *g = &d.c, *h = &d.b;
+ char e = 4 - a;
+ int f;
+ *h = *g = e;
+ for (f = 0; f < 2; f++)
+ foo (d.c);
+ return 0;
+}
diff --git a/gcc/testsuite/gcc.dg/vect/pr93843-2.c b/gcc/testsuite/gcc.dg/vect/pr93843-2.c
new file mode 100644
index 00000000000..5fae3e5be17
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr93843-2.c
@@ -0,0 +1,11 @@
+char in[2] = {2, 2};
+short out[2] = {};
+
+int
+main()
+{
+ for (int i = 0; i < 2; ++i)
+ out[i] = in[i];
+ asm("":::"memory");
+ if (out[0] != 2) __builtin_abort();
+}

View File

@ -1,6 +1,6 @@
diff -Nurp a/gcc/common.opt b/gcc/common.opt diff -Nurp a/gcc/common.opt b/gcc/common.opt
--- a/gcc/common.opt 2020-11-23 03:24:54.760000000 -0500 --- a/gcc/common.opt 2021-02-18 21:32:50.724000000 -0500
+++ b/gcc/common.opt 2020-11-23 03:23:59.716000000 -0500 +++ b/gcc/common.opt 2021-02-18 21:33:36.920000000 -0500
@@ -1150,6 +1150,10 @@ fcompare-elim @@ -1150,6 +1150,10 @@ fcompare-elim
Common Report Var(flag_compare_elim_after_reload) Optimization Common Report Var(flag_compare_elim_after_reload) Optimization
Perform comparison elimination after register allocation has finished. Perform comparison elimination after register allocation has finished.
@ -13,8 +13,8 @@ diff -Nurp a/gcc/common.opt b/gcc/common.opt
Common Var(flag_conserve_stack) Optimization Common Var(flag_conserve_stack) Optimization
Do not perform optimizations increasing noticeably stack usage. Do not perform optimizations increasing noticeably stack usage.
diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
--- a/gcc/tree-ssa-phiopt.c 2020-11-23 03:24:54.760000000 -0500 --- a/gcc/tree-ssa-phiopt.c 2021-02-18 21:32:52.648000000 -0500
+++ b/gcc/tree-ssa-phiopt.c 2020-11-23 03:27:42.824000000 -0500 +++ b/gcc/tree-ssa-phiopt.c 2021-02-19 01:55:10.128000000 -0500
@@ -71,6 +71,7 @@ static hash_set<tree> * get_non_trapping @@ -71,6 +71,7 @@ static hash_set<tree> * get_non_trapping
static void replace_phi_edge_with_variable (basic_block, edge, gimple *, tree); static void replace_phi_edge_with_variable (basic_block, edge, gimple *, tree);
static void hoist_adjacent_loads (basic_block, basic_block, static void hoist_adjacent_loads (basic_block, basic_block,
@ -48,7 +48,7 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+ ... + ...
+*/ +*/
+static bool +static bool
+check_uses_cond (tree ssa_name, gimple *stmt, +check_uses_cond (const_tree ssa_name, gimple *stmt,
+ hash_set<tree> *hset ATTRIBUTE_UNUSED) + hash_set<tree> *hset ATTRIBUTE_UNUSED)
+{ +{
+ tree_code code = gimple_cond_code (stmt); + tree_code code = gimple_cond_code (stmt);
@ -76,7 +76,7 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+ _tmp = SSA_NAME | _tmp2; + _tmp = SSA_NAME | _tmp2;
+*/ +*/
+static bool +static bool
+check_uses_assign (tree ssa_name, gimple *stmt, hash_set<tree> *hset) +check_uses_assign (const_tree ssa_name, gimple *stmt, hash_set<tree> *hset)
+{ +{
+ tree_code code = gimple_assign_rhs_code (stmt); + tree_code code = gimple_assign_rhs_code (stmt);
+ tree lhs, rhs1, rhs2; + tree lhs, rhs1, rhs2;
@ -113,7 +113,7 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+ # result = PHI <SSA_NAME (bb1), 0 (bb2), 0 (bb3)> + # result = PHI <SSA_NAME (bb1), 0 (bb2), 0 (bb3)>
+*/ +*/
+static bool +static bool
+check_uses_phi (tree ssa_name, gimple *stmt, hash_set<tree> *hset) +check_uses_phi (const_tree ssa_name, gimple *stmt, hash_set<tree> *hset)
+{ +{
+ for (unsigned i = 0; i < gimple_phi_num_args (stmt); i++) + for (unsigned i = 0; i < gimple_phi_num_args (stmt); i++)
+ { + {
@ -223,7 +223,7 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+} +}
+ +
+static bool +static bool
+check_def_gimple (gimple *def1, gimple *def2, tree result) +check_def_gimple (gimple *def1, gimple *def2, const_tree result)
+{ +{
+ /* def1 and def2 should be POINTER_PLUS_EXPR. */ + /* def1 and def2 should be POINTER_PLUS_EXPR. */
+ if (!is_gimple_assign (def1) || !is_gimple_assign (def2) + if (!is_gimple_assign (def1) || !is_gimple_assign (def2)
@ -255,7 +255,7 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+} +}
+ +
+static bool +static bool
+check_loop_body (basic_block bb0, basic_block bb2, tree result) +check_loop_body (basic_block bb0, basic_block bb2, const_tree result)
+{ +{
+ gimple *g01 = first_stmt (bb0); + gimple *g01 = first_stmt (bb0);
+ if (!g01 || !is_gimple_assign (g01) + if (!g01 || !is_gimple_assign (g01)
@ -373,8 +373,8 @@ diff -Nurp a/gcc/tree-ssa-phiopt.c b/gcc/tree-ssa-phiopt.c
+ ... + ...
+*/ +*/
+static bool +static bool
+check_gimple_order (basic_block bb1, tree base, tree cst, tree result, +check_gimple_order (basic_block bb1, const_tree base, const_tree cst,
+ gimple *&output) + const_tree result, gimple *&output)
+{ +{
+ gimple *g1 = first_stmt (bb1); + gimple *g1 = first_stmt (bb1);
+ if (!g1 || !is_gimple_assign (g1) + if (!g1 || !is_gimple_assign (g1)

View File

@ -0,0 +1,418 @@
This backport contains 1 patch from the GCC mainstream (upstream) tree.
The commit IDs of these patches are listed below in chronological order.
0001-aarch64-Implement-moutline-atomics.patch
3950b229a5ed6710f30241c2ddc3c74909bf4740
diff -Nurp a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c
--- a/gcc/config/aarch64/aarch64.c 2021-03-11 17:12:30.380000000 +0800
+++ b/gcc/config/aarch64/aarch64.c 2021-03-11 17:13:29.992000000 +0800
@@ -18150,82 +18150,6 @@ aarch64_emit_unlikely_jump (rtx insn)
add_reg_br_prob_note (jump, profile_probability::very_unlikely ());
}
-/* We store the names of the various atomic helpers in a 5x4 array.
- Return the libcall function given MODE, MODEL and NAMES. */
-
-rtx
-aarch64_atomic_ool_func(machine_mode mode, rtx model_rtx,
- const atomic_ool_names *names)
-{
- memmodel model = memmodel_base (INTVAL (model_rtx));
- int mode_idx, model_idx;
-
- switch (mode)
- {
- case E_QImode:
- mode_idx = 0;
- break;
- case E_HImode:
- mode_idx = 1;
- break;
- case E_SImode:
- mode_idx = 2;
- break;
- case E_DImode:
- mode_idx = 3;
- break;
- case E_TImode:
- mode_idx = 4;
- break;
- default:
- gcc_unreachable ();
- }
-
- switch (model)
- {
- case MEMMODEL_RELAXED:
- model_idx = 0;
- break;
- case MEMMODEL_CONSUME:
- case MEMMODEL_ACQUIRE:
- model_idx = 1;
- break;
- case MEMMODEL_RELEASE:
- model_idx = 2;
- break;
- case MEMMODEL_ACQ_REL:
- case MEMMODEL_SEQ_CST:
- model_idx = 3;
- break;
- default:
- gcc_unreachable ();
- }
-
- return init_one_libfunc_visibility (names->str[mode_idx][model_idx],
- VISIBILITY_HIDDEN);
-}
-
-#define DEF0(B, N) \
- { "__aarch64_" #B #N "_relax", \
- "__aarch64_" #B #N "_acq", \
- "__aarch64_" #B #N "_rel", \
- "__aarch64_" #B #N "_acq_rel" }
-
-#define DEF4(B) DEF0(B, 1), DEF0(B, 2), DEF0(B, 4), DEF0(B, 8), \
- { NULL, NULL, NULL, NULL }
-#define DEF5(B) DEF0(B, 1), DEF0(B, 2), DEF0(B, 4), DEF0(B, 8), DEF0(B, 16)
-
-static const atomic_ool_names aarch64_ool_cas_names = { { DEF5(cas) } };
-const atomic_ool_names aarch64_ool_swp_names = { { DEF4(swp) } };
-const atomic_ool_names aarch64_ool_ldadd_names = { { DEF4(ldadd) } };
-const atomic_ool_names aarch64_ool_ldset_names = { { DEF4(ldset) } };
-const atomic_ool_names aarch64_ool_ldclr_names = { { DEF4(ldclr) } };
-const atomic_ool_names aarch64_ool_ldeor_names = { { DEF4(ldeor) } };
-
-#undef DEF0
-#undef DEF4
-#undef DEF5
-
/* Expand a compare and swap pattern. */
void
@@ -18272,17 +18196,6 @@ aarch64_expand_compare_and_swap (rtx ope
newval, mod_s));
cc_reg = aarch64_gen_compare_reg_maybe_ze (NE, rval, oldval, mode);
}
- else if (TARGET_OUTLINE_ATOMICS)
- {
- /* Oldval must satisfy compare afterward. */
- if (!aarch64_plus_operand (oldval, mode))
- oldval = force_reg (mode, oldval);
- rtx func = aarch64_atomic_ool_func (mode, mod_s, &aarch64_ool_cas_names);
- rval = emit_library_call_value (func, NULL_RTX, LCT_NORMAL, r_mode,
- oldval, mode, newval, mode,
- XEXP (mem, 0), Pmode);
- cc_reg = aarch64_gen_compare_reg_maybe_ze (NE, rval, oldval, mode);
- }
else
{
/* The oldval predicate varies by mode. Test it and force to reg. */
diff -Nurp a/gcc/config/aarch64/aarch64.opt b/gcc/config/aarch64/aarch64.opt
--- a/gcc/config/aarch64/aarch64.opt 2021-03-11 17:12:30.380000000 +0800
+++ b/gcc/config/aarch64/aarch64.opt 2021-03-11 17:13:29.992000000 +0800
@@ -272,6 +272,3 @@ user-land code.
TargetVariable
long aarch64_stack_protector_guard_offset = 0
-moutline-atomics
-Target Report Mask(OUTLINE_ATOMICS) Save
-Generate local calls to out-of-line atomic operations.
diff -Nurp a/gcc/config/aarch64/atomics.md b/gcc/config/aarch64/atomics.md
--- a/gcc/config/aarch64/atomics.md 2021-03-11 17:12:30.380000000 +0800
+++ b/gcc/config/aarch64/atomics.md 2021-03-11 17:13:29.992000000 +0800
@@ -186,27 +186,16 @@
(match_operand:SI 3 "const_int_operand")]
""
{
+ rtx (*gen) (rtx, rtx, rtx, rtx);
+
/* Use an atomic SWP when available. */
if (TARGET_LSE)
- {
- emit_insn (gen_aarch64_atomic_exchange<mode>_lse
- (operands[0], operands[1], operands[2], operands[3]));
- }
- else if (TARGET_OUTLINE_ATOMICS)
- {
- machine_mode mode = <MODE>mode;
- rtx func = aarch64_atomic_ool_func (mode, operands[3],
- &aarch64_ool_swp_names);
- rtx rval = emit_library_call_value (func, operands[0], LCT_NORMAL,
- mode, operands[2], mode,
- XEXP (operands[1], 0), Pmode);
- emit_move_insn (operands[0], rval);
- }
+ gen = gen_aarch64_atomic_exchange<mode>_lse;
else
- {
- emit_insn (gen_aarch64_atomic_exchange<mode>
- (operands[0], operands[1], operands[2], operands[3]));
- }
+ gen = gen_aarch64_atomic_exchange<mode>;
+
+ emit_insn (gen (operands[0], operands[1], operands[2], operands[3]));
+
DONE;
}
)
@@ -291,39 +280,6 @@
}
operands[1] = force_reg (<MODE>mode, operands[1]);
}
- else if (TARGET_OUTLINE_ATOMICS)
- {
- const atomic_ool_names *names;
- switch (<CODE>)
- {
- case MINUS:
- operands[1] = expand_simple_unop (<MODE>mode, NEG, operands[1],
- NULL, 1);
- /* fallthru */
- case PLUS:
- names = &aarch64_ool_ldadd_names;
- break;
- case IOR:
- names = &aarch64_ool_ldset_names;
- break;
- case XOR:
- names = &aarch64_ool_ldeor_names;
- break;
- case AND:
- operands[1] = expand_simple_unop (<MODE>mode, NOT, operands[1],
- NULL, 1);
- names = &aarch64_ool_ldclr_names;
- break;
- default:
- gcc_unreachable ();
- }
- machine_mode mode = <MODE>mode;
- rtx func = aarch64_atomic_ool_func (mode, operands[2], names);
- emit_library_call_value (func, NULL_RTX, LCT_NORMAL, mode,
- operands[1], mode,
- XEXP (operands[0], 0), Pmode);
- DONE;
- }
else
gen = gen_aarch64_atomic_<atomic_optab><mode>;
@@ -449,40 +405,6 @@
}
operands[2] = force_reg (<MODE>mode, operands[2]);
}
- else if (TARGET_OUTLINE_ATOMICS)
- {
- const atomic_ool_names *names;
- switch (<CODE>)
- {
- case MINUS:
- operands[2] = expand_simple_unop (<MODE>mode, NEG, operands[2],
- NULL, 1);
- /* fallthru */
- case PLUS:
- names = &aarch64_ool_ldadd_names;
- break;
- case IOR:
- names = &aarch64_ool_ldset_names;
- break;
- case XOR:
- names = &aarch64_ool_ldeor_names;
- break;
- case AND:
- operands[2] = expand_simple_unop (<MODE>mode, NOT, operands[2],
- NULL, 1);
- names = &aarch64_ool_ldclr_names;
- break;
- default:
- gcc_unreachable ();
- }
- machine_mode mode = <MODE>mode;
- rtx func = aarch64_atomic_ool_func (mode, operands[3], names);
- rtx rval = emit_library_call_value (func, operands[0], LCT_NORMAL, mode,
- operands[2], mode,
- XEXP (operands[1], 0), Pmode);
- emit_move_insn (operands[0], rval);
- DONE;
- }
else
gen = gen_aarch64_atomic_fetch_<atomic_optab><mode>;
@@ -572,7 +494,7 @@
{
/* Use an atomic load-operate instruction when possible. In this case
we will re-compute the result from the original mem value. */
- if (TARGET_LSE || TARGET_OUTLINE_ATOMICS)
+ if (TARGET_LSE)
{
rtx tmp = gen_reg_rtx (<MODE>mode);
operands[2] = force_reg (<MODE>mode, operands[2]);
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_reg_1.c b/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_reg_1.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_reg_1.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_reg_1.c 2021-03-11 17:13:30.656000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-O2 -march=armv8-a+nolse -mno-outline-atomics" } */
+/* { dg-options "-O2 -march=armv8-a+nolse" } */
/* { dg-skip-if "" { *-*-* } { "-mcpu=*" } { "" } } */
int
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_strong_1.c b/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_strong_1.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_strong_1.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic_cmp_exchange_zero_strong_1.c 2021-03-11 17:13:30.656000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-O2 -march=armv8-a+nolse -mno-outline-atomics" } */
+/* { dg-options "-O2 -march=armv8-a+nolse" } */
/* { dg-skip-if "" { *-*-* } { "-mcpu=*" } { "" } } */
int
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-comp-swap-release-acquire.c b/gcc/testsuite/gcc.target/aarch64/atomic-comp-swap-release-acquire.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-comp-swap-release-acquire.c 2021-03-11 17:12:33.988000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-comp-swap-release-acquire.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -fno-ipa-icf -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2 -fno-ipa-icf" } */
#include "atomic-comp-swap-release-acquire.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-acq_rel.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-acq_rel.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-acq_rel.c 2021-03-11 17:12:33.988000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-acq_rel.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-acq_rel.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-acquire.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-acquire.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-acquire.c 2021-03-11 17:12:33.988000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-acquire.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-acquire.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-char.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-char.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-char.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-char.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-char.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-consume.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-consume.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-consume.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-consume.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-consume.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-imm.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-imm.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-imm.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-imm.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
int v = 0;
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-int.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-int.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-int.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-int.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-int.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-long.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-long.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-long.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-long.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
long v = 0;
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-relaxed.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-relaxed.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-relaxed.c 2021-03-11 17:12:33.992000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-relaxed.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-relaxed.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-release.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-release.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-release.c 2021-03-11 17:12:34.012000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-release.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-release.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-seq_cst.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-seq_cst.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-seq_cst.c 2021-03-11 17:12:34.012000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-seq_cst.c 2021-03-11 17:13:30.648000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-seq_cst.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/atomic-op-short.c b/gcc/testsuite/gcc.target/aarch64/atomic-op-short.c
--- a/gcc/testsuite/gcc.target/aarch64/atomic-op-short.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/atomic-op-short.c 2021-03-11 17:13:30.652000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "atomic-op-short.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/sync-comp-swap.c b/gcc/testsuite/gcc.target/aarch64/sync-comp-swap.c
--- a/gcc/testsuite/gcc.target/aarch64/sync-comp-swap.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/sync-comp-swap.c 2021-03-11 17:13:30.656000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -fno-ipa-icf -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2 -fno-ipa-icf" } */
#include "sync-comp-swap.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/sync-op-acquire.c b/gcc/testsuite/gcc.target/aarch64/sync-op-acquire.c
--- a/gcc/testsuite/gcc.target/aarch64/sync-op-acquire.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/sync-op-acquire.c 2021-03-11 17:13:30.656000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "sync-op-acquire.x"
diff -Nurp a/gcc/testsuite/gcc.target/aarch64/sync-op-full.c b/gcc/testsuite/gcc.target/aarch64/sync-op-full.c
--- a/gcc/testsuite/gcc.target/aarch64/sync-op-full.c 2021-03-11 17:12:34.168000000 +0800
+++ b/gcc/testsuite/gcc.target/aarch64/sync-op-full.c 2021-03-11 17:13:30.656000000 +0800
@@ -1,5 +1,5 @@
/* { dg-do compile } */
-/* { dg-options "-march=armv8-a+nolse -O2 -mno-outline-atomics" } */
+/* { dg-options "-march=armv8-a+nolse -O2" } */
#include "sync-op-full.x"

View File

@ -0,0 +1,80 @@
diff -uprN a/gcc/testsuite/gcc.dg/affine-add-1.c b/gcc/testsuite/gcc.dg/affine-add-1.c
--- a/gcc/testsuite/gcc.dg/affine-add-1.c 1970-01-01 08:00:00.000000000 +0800
+++ b/gcc/testsuite/gcc.dg/affine-add-1.c 2021-03-18 19:41:21.308000000 +0800
@@ -0,0 +1,16 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+extern unsigned char a[][13][23][15][11];
+short b;
+int c, d;
+void e(int f, int g[][3][4][3]) {
+ for (char h = 0;; h = 2)
+ for (; f;)
+ for (short i;; i = d)
+ for (char j; j; j = c)
+ for (char k = 0; k < 4; k = g[h][b][i][j])
+ a[h][b][i][j][k] = 0;
+}
+unsigned char a[3][13][23][15][11];
+int main() {}
diff -uprN a/gcc/testsuite/g++.dg/affine-add-1.C b/gcc/testsuite/g++.dg/affine-add-1.C
--- a/gcc/testsuite/g++.dg/affine-add-1.C 1970-01-01 08:00:00.000000000 +0800
+++ b/gcc/testsuite/g++.dg/affine-add-1.C 2021-03-18 19:40:28.432000000 +0800
@@ -0,0 +1,33 @@
+/* { dg-do compile } */
+/* { dg-options "-O3" } */
+
+#include <algorithm>
+
+extern int a[];
+extern unsigned char b[][151800];
+extern long long c[][20][23][22][11];
+char d, e;
+int f;
+unsigned g;
+long h;
+void i(unsigned long long s, unsigned short j) {
+ for (char k = 0; k < 12; k += 3)
+ for (short l = 0; l < 9; l = std::min(j, (unsigned short)4050683)) {
+ for (bool m(h); m < bool(~0); m = 1)
+ for (int t = 0; t < 4; t = std::min(s, (unsigned long long)40808803))
+ for (int n = 0; n < 9; n += e)
+ a[n] = 0;
+ for (char o = 0; o < g; o = 4)
+ for (bool p; p < f; p = d) {
+ for (long q(s); q < 4ULL; q += 1ULL)
+ b[k][o + q] = 0;
+ for (int r = 0; r < 11; r += ~0 || 0)
+ c[k][l][o][d][r] = 0;
+ }
+ }
+}
+int a[0];
+unsigned char b[3][151800];
+long long c[3][20][23][22][11];
+int main() {}
+
diff -uprN a/gcc/tree-affine.c b/gcc/tree-affine.c
--- a/gcc/tree-affine.c 2021-03-15 18:55:31.928000000 +0800
+++ b/gcc/tree-affine.c 2021-03-18 16:34:05.932000000 +0800
@@ -184,9 +184,16 @@ aff_combination_add_elt (aff_tree *comb,
if (scale == 1)
elt = fold_convert (type, elt);
else
- elt = fold_build2 (MULT_EXPR, type,
- fold_convert (type, elt),
- wide_int_to_tree (type, scale));
+ {
+ if (POINTER_TYPE_P (TREE_TYPE (elt)))
+ {
+ elt = copy_node (elt);
+ TREE_TYPE (elt) = sizetype;
+ }
+ elt = fold_build2 (MULT_EXPR, type,
+ fold_convert (type, elt),
+ wide_int_to_tree (type, scale));
+ }
if (comb->rest)
comb->rest = fold_build2 (PLUS_EXPR, type, comb->rest,