Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[ScopHelper] Provide support for recognising collective invariant loads
Summary: This patch aims to provide support for detecting load patterns which are collectively invariant but right now `isHoistableLoad()` is checking each load instruction individually which cannot detect the load pattern as a whole. Patch by: Sahil Girish Yerawar Reviewers: bollu, philip.pfaffe, Meinersbur Reviewed By: philip.pfaffe, Meinersbur Differential Revision: https://reviews.llvm.org/D48026 llvm-svn: 335949
- Loading branch information
Showing
4 changed files
with
122 additions
and
14 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,56 @@ | ||
; RUN: opt %loadPolly -polly-scops -polly-invariant-load-hoisting -analyze < %s | FileCheck %s | ||
|
||
;CHECK: Function: test_init_chpl | ||
;CHECK-NEXT: Region: %bb1---%bb16 | ||
;CHECK-NEXT: Max Loop Depth: 2 | ||
;CHECK-NEXT: Invariant Accesses: { | ||
;CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0] | ||
;CHECK-NEXT: [tmp5] -> { Stmt_bb2[i0, i1] -> MemRef_arg[1] }; | ||
;CHECK-NEXT: Execution Context: [tmp5] -> { : } | ||
;CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0] | ||
;CHECK-NEXT: [tmp5] -> { Stmt_bb2[i0, i1] -> MemRef_tmp3[9] }; | ||
;CHECK-NEXT: Execution Context: [tmp5] -> { : } | ||
;CHECK-NEXT: ReadAccess := [Reduction Type: NONE] [Scalar: 0] | ||
;CHECK-NEXT: [tmp5] -> { Stmt_bb2[i0, i1] -> MemRef_tmp3[2] }; | ||
;CHECK-NEXT: Execution Context: [tmp5] -> { : } | ||
;CHECK-NEXT: } | ||
|
||
|
||
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" | ||
|
||
%array_ty = type { i64, %array_ptr*, i8 } | ||
%array_ptr = type { [2 x i64], [2 x i64], [2 x i64], i64, i64, double*, double*, i8 } | ||
|
||
; Function Attrs: noinline | ||
define weak dso_local void @test_init_chpl(%array_ty* nonnull %arg) { | ||
bb: | ||
br label %bb1 | ||
|
||
bb1: ; preds = %bb14, %bb | ||
%.0 = phi i64 [ 0, %bb ], [ %tmp15, %bb14 ] | ||
br label %bb2 | ||
|
||
bb2: ; preds = %bb2, %bb1 | ||
%.01 = phi i64 [ 0, %bb1 ], [ %tmp13, %bb2 ] | ||
%tmp = getelementptr inbounds %array_ty, %array_ty* %arg, i64 0, i32 1 | ||
%tmp3 = load %array_ptr*, %array_ptr** %tmp, align 8 | ||
%tmp4 = getelementptr inbounds %array_ptr, %array_ptr* %tmp3, i64 0, i32 1, i64 0 | ||
%tmp5 = load i64, i64* %tmp4, align 8 | ||
%tmp6 = mul nsw i64 %tmp5, %.0 | ||
%tmp7 = add nsw i64 %tmp6, %.01 | ||
%tmp8 = getelementptr inbounds %array_ptr, %array_ptr* %tmp3, i64 0, i32 6 | ||
%tmp9 = load double*, double** %tmp8, align 8 | ||
%tmp10 = getelementptr inbounds double, double* %tmp9, i64 %tmp7 | ||
store double 13.0, double* %tmp10, align 8 | ||
%tmp13 = add nuw nsw i64 %.01, 1 | ||
%exitcond = icmp ne i64 %tmp13, 1000 | ||
br i1 %exitcond, label %bb2, label %bb14 | ||
|
||
bb14: ; preds = %bb2 | ||
%tmp15 = add nuw nsw i64 %.0, 1 | ||
%exitcond8 = icmp ne i64 %tmp15, 1000 | ||
br i1 %exitcond8, label %bb1, label %bb16 | ||
|
||
bb16: ; preds = %bb14 | ||
ret void | ||
} |