While in this area I also removed unnecessary annotations for wchar_size and also cleaned up some more function attributes.
75 lines
2.9 KiB
LLVM
75 lines
2.9 KiB
LLVM
; Confirm that the line numbers for the middle.block operations are all the
; same as the start of the loop.

; RUN: opt -S -passes=loop-vectorize -force-vector-width=4 -force-vector-interleave=4 <%s | FileCheck %s
;
; The vectorizer is forced to a width of 4 and an interleave count of 4. The
; directives below expect middle.block to hold three <4 x i32> adds, the
; reduce.add call, an i64 compare and the branch, in that order. The first add
; captures its debug location as DL; every later instruction must reuse it, and
; the final directive requires DL to be on source line 5 (the `for` statement).
;
; CHECK: middle.block:
; CHECK-NEXT: %{{.*}}= add <4 x i32>{{.*}}, !dbg ![[DL:[0-9]+]]
; CHECK-NEXT: %{{.*}}= add <4 x i32>{{.*}}, !dbg ![[DL]]
; CHECK-NEXT: %{{.*}}= add <4 x i32>{{.*}}, !dbg ![[DL]]
; CHECK-NEXT: %{{.*}}= call i32 @llvm.vector.reduce.add.v4i32(<4 x i32> {{.*}}), !dbg ![[DL]]
; CHECK-NEXT: %{{.*}}= icmp eq i64{{.*}}, !dbg ![[DL]]
; CHECK-NEXT: br i1 %{{.*}}, !dbg ![[DL]]
; CHECK: ![[DL]] = !DILocation(line: 5,

; This IR can be generated by running:
; clang -gmlt -S src.cpp -emit-llvm -mllvm -opt-bisect-limit=56 -O2 -o -
;
; Where src.cpp contains:
; int foo(int count, int *bar)
; {
;   int ret = count;
;   int tmp;
;   for (int j = 0; j < count; j++) {
;     tmp = bar[j];
;     ret += tmp;
;   }
;
;   return ret;
; }

; Integer sum reduction used as vectorizer input: starts the accumulator at
; %count, adds bar[0] .. bar[count-1] to it, and returns the total. When
; %count is not positive the loop is bypassed and %count itself is returned.
define i32 @"foo"(i32 %count, ptr nocapture readonly %bar) !dbg !8 {
entry:
  ; Guard: only enter the loop when count > 0.
  %cmp8 = icmp sgt i32 %count, 0, !dbg !10
  br i1 %cmp8, label %for.body.preheader, label %for.cond.cleanup, !dbg !10

for.body.preheader:
  ; Zero-extend the trip count so it can be compared with the i64 induction
  ; variable in the loop latch.
  %wide.trip.count = zext i32 %count to i64
  br label %for.body, !dbg !11

for.cond.cleanup.loopexit:
  ; LCSSA copy of the final accumulator value leaving the loop.
  %add.lcssa = phi i32 [ %add, %for.body ], !dbg !12
  br label %for.cond.cleanup, !dbg !13

for.cond.cleanup:
  ; Result is %count on the bypass path, otherwise the accumulated sum.
  %ret.0.lcssa = phi i32 [ %count, %entry ], [ %add.lcssa, %for.cond.cleanup.loopexit ], !dbg !14
  ret i32 %ret.0.lcssa, !dbg !13

for.body:
  ; Single-block loop: %indvars.iv is the index, %ret.09 the running sum.
  %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ]
  %ret.09 = phi i32 [ %count, %for.body.preheader ], [ %add, %for.body ]
  %arrayidx = getelementptr inbounds i32, ptr %bar, i64 %indvars.iv, !dbg !11
  %0 = load i32, ptr %arrayidx, align 4, !dbg !11
  %add = add nsw i32 %0, %ret.09, !dbg !12
  ; The increment, exit compare and back-edge branch all carry !10 (line 5),
  ; the same location the FileCheck directives expect in middle.block.
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1, !dbg !10
  %exitcond = icmp eq i64 %indvars.iv.next, %wide.trip.count, !dbg !10
  br i1 %exitcond, label %for.cond.cleanup.loopexit, label %for.body, !dbg !10, !llvm.loop !19
}

; Module-level debug info: one compile unit and the debug-info version flag.
!llvm.dbg.cu = !{!0}
!llvm.module.flags = !{!4}

; Compile unit for src.cpp, emitting line tables only.
!0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus, file: !1, producer: "", isOptimized: true, runtimeVersion: 0, emissionKind: LineTablesOnly, enums: !2, nameTableKind: None)
!1 = !DIFile(filename: "src.cpp", directory: "")
!2 = !{}
!4 = !{i32 2, !"Debug Info Version", i32 3}
; Subprogram for foo, declared on line 1 with its body scope opening on line 2.
!8 = distinct !DISubprogram(name: "foo", scope: !1, file: !1, line: 1, type: !9, scopeLine: 2, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !0, retainedNodes: !2)
!9 = !DISubroutineType(types: !2)
; Source locations, all scoped to foo. Per the src.cpp listing in the header:
;   line 5  - the `for` statement (the location the test expects in middle.block)
;   line 6  - `tmp = bar[j];`
;   line 7  - `ret += tmp;`
;   line 10 - `return ret;`
;   line 0  - no specific source line
!10 = !DILocation(line: 5, scope: !8)
!11 = !DILocation(line: 6, scope: !8)
!12 = !DILocation(line: 7, scope: !8)
!13 = !DILocation(line: 10, scope: !8)
!14 = !DILocation(line: 0, scope: !8)
; Self-referential loop ID attached to the latch branch; its two DILocation
; operands are the loop's start (line 5) and end (line 8) locations.
!19 = distinct !{!19, !10, !20}
!20 = !DILocation(line: 8, scope: !8)