@@ -17,7 +17,7 @@ target datalayout = "e-m:e-i64:64-i128:128-n32:64-S128"
1717; NOTE: The strides of the starting address values in the inner loop differ, i.e.
1818; '(i * (n + 1))' vs '(i * n)'.
1919
20- ; DEBUG-LABEL: LAA: Found a loop in diff_checks:
20+ ; DEBUG-LABEL: ' diff_checks'
2121; DEBUG: LAA: Not creating diff runtime check, since these cannot be hoisted out of the outer loop
2222; DEBUG: LAA: Adding RT check for range:
2323; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
@@ -149,7 +149,7 @@ outer.exit:
149149; We decide to do full runtime checks here (as opposed to diff checks) due to
150150; the additional load of 'dst[(i * n) + j]' in the loop.
151151
152- ; DEBUG-LABEL: LAA: Found a loop in full_checks:
152+ ; DEBUG-LABEL: ' full_checks'
153153; DEBUG-NOT: LAA: Creating diff runtime check for:
154154; DEBUG: LAA: Adding RT check for range:
155155; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
@@ -272,7 +272,7 @@ outer.exit:
272272; is accessed with a higher stride compared to src, and therefore the inner loop
273273; runtime checks will vary for each outer loop iteration.
274274
275- ; DEBUG-LABEL: LAA: Found a loop in full_checks_diff_strides:
275+ ; DEBUG-LABEL: ' full_checks_diff_strides'
276276; DEBUG-NOT: LAA: Creating diff runtime check for:
277277; DEBUG: LAA: Adding RT check for range:
278278; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
@@ -402,7 +402,7 @@ outer.exit:
402402; }
403403; }
404404
405- ; DEBUG-LABEL: LAA: Found a loop in diff_checks_src_start_invariant:
405+ ; DEBUG-LABEL: ' diff_checks_src_start_invariant'
406406; DEBUG-NOT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
407407
408408define void @diff_checks_src_start_invariant (ptr nocapture noundef writeonly %dst , ptr nocapture noundef readonly %src , i32 noundef %m , i32 noundef %n ) {
@@ -508,7 +508,7 @@ outer.loop.exit:
508508; }
509509; }
510510
511- ; DEBUG-LABEL: LAA: Found a loop in full_checks_src_start_invariant:
511+ ; DEBUG-LABEL: ' full_checks_src_start_invariant'
512512; DEBUG: LAA: Adding RT check for range:
513513; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
514514; DEBUG-NEXT: Start: %dst End: ((4 * (zext i32 %m to i64) * (zext i32 %n to i64)) + %dst)
@@ -629,7 +629,7 @@ outer.loop.exit:
629629; The 'src' access varies with the outermost loop, rather than the parent of the
630630; innermost loop. Hence we don't expand `src`, although in theory we could do.
631631
632- ; DEBUG-LABEL: LAA: Found a loop in triple_nested_loop_mixed_access:
632+ ; DEBUG-LABEL: ' triple_nested_loop_mixed_access'
633633; DEBUG-NOT: LAA: Creating diff runtime check for:
634634; DEBUG: LAA: Adding RT check for range:
635635; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
@@ -795,7 +795,7 @@ exit:
795795; }
796796; Outer loop trip count is uncomputable so we shouldn't expand the ranges.
797797
798- ; DEBUG-LABEL: LAA: Found a loop in uncomputable_outer_tc:
798+ ; DEBUG-LABEL: ' uncomputable_outer_tc'
799799; DEBUG: LAA: Adding RT check for range:
800800; DEBUG-NEXT: Start: {%dst,+,(4 * (zext i32 (1 + %n) to i64))<nuw><nsw>}<%outer.loop> End: {((4 * (zext i32 %n to i64))<nuw><nsw> + %dst),+,(4 * (zext i32 (1 + %n) to i64))<nuw><nsw>}<%outer.loop>
801801; DEBUG-NEXT: LAA: Adding RT check for range:
@@ -945,7 +945,7 @@ while.end:
945945; Inner IV is decreasing, but this isn't a problem and we can still expand the
946946; runtime checks correctly to cover the whole loop.
947947
948- ; DEBUG-LABEL: LAA: Found a loop in decreasing_inner_iv:
948+ ; DEBUG-LABEL: ' decreasing_inner_iv'
949949; DEBUG: LAA: Adding RT check for range:
950950; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
951951; DEBUG-NEXT: LAA: ... but need to check stride is positive: (4 * (sext i32 %stride1 to i64))<nsw>
@@ -1111,7 +1111,7 @@ exit:
11111111; Outer IV is decreasing, but the direction of memory accesses also depends
11121112; upon the sign of stride1.
11131113
1114- ; DEBUG-LABEL: LAA: Found a loop in decreasing_outer_iv:
1114+ ; DEBUG-LABEL: ' decreasing_outer_iv'
11151115; DEBUG: LAA: Adding RT check for range:
11161116; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
11171117; DEBUG-NEXT: LAA: ... but need to check stride is positive: (-4 * (sext i32 %stride1 to i64))<nsw>
@@ -1271,7 +1271,7 @@ exit:
12711271; }
12721272
12731273
1274- ; DEBUG-LABEL: LAA: Found a loop in unknown_inner_stride:
1274+ ; DEBUG-LABEL: ' unknown_inner_stride'
12751275; DEBUG: LAA: Adding RT check for range:
12761276; DEBUG-NEXT: LAA: Expanded RT check for range to include outer loop in order to permit hoisting
12771277; DEBUG-NEXT: Start: %dst End: ((4 * (zext i32 %n to i64))<nuw><nsw> + (4 * (zext i32 (1 + %n) to i64) * (-1 + (zext i32 %m to i64))<nsw>) + %dst)
0 commit comments