matmul_check - OptiTrust Trace

✔ [46] !! Loop.unroll [cFor ~body:[cPlusEq ~lhs:[cVar "s"] ()] "k"]; (* !! postprocessing (); *) )

✔Loop.unroll
- ✔Loop.unroll_nest_of_1
  - ✔Resources.detach_loop_ro_focus
  - ✔Loop_basic.unroll
  - ✔Arith.simpl_surrounding_expr

tmp_before.cpp → tmp_after.cpp RENAMED Viewed

@@ -107,39 +107,88 @@ void mm1024(float* C, float* A, float* B) {
        "Group(range(0, 4, 1), fun k -> Group(range(0, 32, 1), fun j -> "
        "&pB[bj][bk][k][j] ~> Cell))");
      __sreads("A ~> Matrix2(1024, 1024)");
      __sreads("B ~> Matrix2(1024, 1024)");
      __xmodifies("Group(range(0, 32, 1), fun j -> &sum[i][j] ~> Cell)");
      float* const s = new float(32)();
      const __ghost_fn __ghost_pair_6 =
        __ghost_begin(mindex2_contiguous_ro, "M := sum");
      MMEMCPY(s, 0, sum, i * 32 + 0, 32, sizeof(float));
      __ghost_end(__ghost_pair_6);
-     for (int k = 0; k < 4; k++) {
-      __smodifies("Group(range(0, 32, 1), fun j -> &s[j] ~> Cell)");
       __sreads("A ~> Matrix2(1024, 1024)");
       __sreads("B ~> Matrix2(1024, 1024)");
-      __xreads(
-        "Group(range(0, 32, 1), fun j -> &pB[bj][bk][k][j] ~> Cell)");
      #pragma omp simd
      for (int j = 0; j < 32; j++) {
       __sreads("A ~> Matrix2(1024, 1024)");
       __sreads("B ~> Matrix2(1024, 1024)");
       __xmodifies("&s[j] ~> Cell");
-       __xreads("&pB[bj][bk][k][j] ~> Cell");
-       const __ghost_fn __ghost_pair_2 =
-         __ghost_begin(matrix2_ro_focus,
-                "M := A, i := bi * 32 + i, j := bk * 4 + k");
-       s[j] += A[bi * 32 + i][bk * 4 + k] * pB[bj][bk][k][j];
       __ghost_end(__ghost_pair_2);
      }
      }
      __ghost(mindex2_contiguous_uninit, "M := sum");
      MMEMCPY(sum, i * 32 + 0, s, 0, 32, sizeof(float));
      __ghost(mindex2_contiguous_rev, "M := sum");
     }
    }
    for (int i = 0; i < 32; i++) {
     __consumes(
       "_Uninit(Group(range(0, 32, 1), fun j -> &C[bi * 32 + i][bj * 32 + "
       "j] ~> Cell))");
     __produces(

        "Group(range(0, 4, 1), fun k -> Group(range(0, 32, 1), fun j -> "
        "&pB[bj][bk][k][j] ~> Cell))");
      __sreads("A ~> Matrix2(1024, 1024)");
      __sreads("B ~> Matrix2(1024, 1024)");
      __xmodifies("Group(range(0, 32, 1), fun j -> &sum[i][j] ~> Cell)");
      float* const s = new float(32)();
      const __ghost_fn __ghost_pair_6 =
        __ghost_begin(mindex2_contiguous_ro, "M := sum");
      MMEMCPY(s, 0, sum, i * 32 + 0, 32, sizeof(float));
      __ghost_end(__ghost_pair_6);
+     const __ghost_fn __ghost_pair_7 = __ghost_begin(
+       group_ro_focus,
+       "i := 0, items := fun k -> Group(range(0, 32, 1), fun j -> "
+       "&pB[bj][bk][k][j] ~> Cell), bound_check_start := checked, "
+       "bound_check_stop := checked, bound_check_step := checked");
+     #pragma omp simd
+     for (int j = 0; j < 32; j++) {
       __sreads("A ~> Matrix2(1024, 1024)");
       __sreads("B ~> Matrix2(1024, 1024)");
+      __xmodifies("&s[j] ~> Cell");
+      __xreads("&pB[bj][bk][0][j] ~> Cell");
+      const __ghost_fn __ghost_pair_2 = __ghost_begin(
+        matrix2_ro_focus, "M := A, i := 32 * bi + i, j := 4 * bk");
+      s[j] += A[32 * bi + i][4 * bk] * pB[bj][bk][0][j];
+      __ghost_end(__ghost_pair_2);
+     }
+     __ghost_end(__ghost_pair_7);
+     const __ghost_fn __ghost_pair_712 = __ghost_begin(
+       group_ro_focus,
+       "i := 1, items := fun k -> Group(range(0, 32, 1), fun j -> "
+       "&pB[bj][bk][k][j] ~> Cell), bound_check_start := checked, "
+       "bound_check_stop := checked, bound_check_step := checked");
      #pragma omp simd
      for (int j = 0; j < 32; j++) {
       __sreads("A ~> Matrix2(1024, 1024)");
       __sreads("B ~> Matrix2(1024, 1024)");
       __xmodifies("&s[j] ~> Cell");
+      __xreads("&pB[bj][bk][1][j] ~> Cell");
+      const __ghost_fn __ghost_pair_2 = __ghost_begin(
+        matrix2_ro_focus, "M := A, i := 32 * bi + i, j := 4 * bk + 1");
+      s[j] += A[32 * bi + i][4 * bk + 1] * pB[bj][bk][1][j];
       __ghost_end(__ghost_pair_2);
      }
+     __ghost_end(__ghost_pair_712);
+     const __ghost_fn __ghost_pair_713 = __ghost_begin(
+       group_ro_focus,
+       "i := 2, items := fun k -> Group(range(0, 32, 1), fun j -> "
+       "&pB[bj][bk][k][j] ~> Cell), bound_check_start := checked, "
+       "bound_check_stop := checked, bound_check_step := checked");
+     #pragma omp simd
+     for (int j = 0; j < 32; j++) {
+      __sreads("A ~> Matrix2(1024, 1024)");
+      __sreads("B ~> Matrix2(1024, 1024)");
+      __xmodifies("&s[j] ~> Cell");
+      __xreads("&pB[bj][bk][2][j] ~> Cell");
+      const __ghost_fn __ghost_pair_2 = __ghost_begin(
+        matrix2_ro_focus, "M := A, i := 32 * bi + i, j := 4 * bk + 2");
+      s[j] += A[32 * bi + i][4 * bk + 2] * pB[bj][bk][2][j];
+      __ghost_end(__ghost_pair_2);
+     }
+     __ghost_end(__ghost_pair_713);
+     const __ghost_fn __ghost_pair_714 = __ghost_begin(
+       group_ro_focus,
+       "i := 3, items := fun k -> Group(range(0, 32, 1), fun j -> "
+       "&pB[bj][bk][k][j] ~> Cell), bound_check_start := checked, "
+       "bound_check_stop := checked, bound_check_step := checked");
+     #pragma omp simd
+     for (int j = 0; j < 32; j++) {
+      __sreads("A ~> Matrix2(1024, 1024)");
+      __sreads("B ~> Matrix2(1024, 1024)");
+      __xmodifies("&s[j] ~> Cell");
+      __xreads("&pB[bj][bk][3][j] ~> Cell");
+      const __ghost_fn __ghost_pair_2 = __ghost_begin(
+        matrix2_ro_focus, "M := A, i := 32 * bi + i, j := 4 * bk + 3");
+      s[j] += A[32 * bi + i][4 * bk + 3] * pB[bj][bk][3][j];
+      __ghost_end(__ghost_pair_2);
      }
+     __ghost_end(__ghost_pair_714);
      __ghost(mindex2_contiguous_uninit, "M := sum");
      MMEMCPY(sum, i * 32 + 0, s, 0, 32, sizeof(float));
      __ghost(mindex2_contiguous_rev, "M := sum");
     }
    }
    for (int i = 0; i < 32; i++) {
     __consumes(
       "_Uninit(Group(range(0, 32, 1), fun j -> &C[bi * 32 + i][bj * 32 + "
       "j] ~> Cell))");
     __produces(