You've already forked linux-packaging-mono
							
							
		
			
	
	
		
			52 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
		
		
			
		
	
	
			52 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
|   | ; RUN: opt -analyze --loop-accesses %s | FileCheck %s
 | ||
|  | 
 | ||
|  | ; This test verifies run-time boundary check of memory accesses.
 | ||
|  | ; The original loop:
 | ||
|  | ;   void fastCopy(const char* src, char* op) {
 | ||
|  | ;     int len = 32;
 | ||
|  | ;     while (len > 0) {
 | ||
|  | ;       *(reinterpret_cast<long long*>(op)) = *(reinterpret_cast<const long long*>(src));
 | ||
|  | ;       src += 8;
 | ||
|  | ;       op += 8;
 | ||
|  | ;       len -= 8;
 | ||
|  | ;     }
 | ||
|  | ;   }
 | ||
|  | ; Boundary calculations before this patch:
 | ||
|  | ; (Low: %src High: (24 + %src))
 | ||
|  | ; and the actual distance between the two pointers was 31 (%op - %src = 31).
 | ||
|  | ; IsConflict = (24 > 31) = false -> execution is directed to the vectorized loop.
 | ||
|  | ; The loop was vectorized by a factor of 4, i.e. with 32-byte memory accesses (<4 x i64>),
 | ||
|  | ; so the store to *%op overlapped the memory accessed through *%src.
 | ||
|  | 
 | ||
|  | ;CHECK: Printing analysis 'Loop Access Analysis' for function 'fastCopy'
 | ||
|  | ;CHECK: (Low: %op High: (32 + %op))
 | ||
|  | ;CHECK: (Low: %src High: (32 + %src))
 | ||
|  | 
 | ||
; fastCopy(%src, %op): copies 32 bytes from %src to %op as 8-byte (i64)
; load/store pairs, advancing both pointers by 8 bytes on every iteration.
|  | define void @fastCopy(i8* nocapture readonly %src, i8* nocapture %op) { | ||
|  | entry: | ||
|  |   br label %while.body.preheader | ||
|  | 
 | ||
|  | while.body.preheader:                             ; preds = %entry
 | ||
|  |   br label %while.body | ||
|  | 
 | ||
|  | while.body:                                       ; preds = %while.body.preheader, %while.body
 | ||
; %len.addr.07 is the remaining byte count: it starts at 32 and drops by 8
; per iteration. %op.addr.06 / %src.addr.05 are the running destination and
; source pointers.
|  |   %len.addr.07 = phi i32 [ %sub, %while.body ], [ 32, %while.body.preheader ] | ||
|  |   %op.addr.06 = phi i8* [ %add.ptr1, %while.body ], [ %op, %while.body.preheader ] | ||
|  |   %src.addr.05 = phi i8* [ %add.ptr, %while.body ], [ %src, %while.body.preheader ] | ||
; Copy one i64 from the current source position to the current destination.
|  |   %0 = bitcast i8* %src.addr.05 to i64* | ||
|  |   %1 = load i64, i64* %0, align 8 | ||
|  |   %2 = bitcast i8* %op.addr.06 to i64* | ||
|  |   store i64 %1, i64* %2, align 8 | ||
|  |   %add.ptr = getelementptr inbounds i8, i8* %src.addr.05, i64 8 | ||
|  |   %add.ptr1 = getelementptr inbounds i8, i8* %op.addr.06, i64 8 | ||
|  |   %sub = add nsw i32 %len.addr.07, -8 | ||
; Loop again only if more than 8 bytes remained at the start of this
; iteration, so the body runs for len = 32, 24, 16 and 8 (four iterations).
|  |   %cmp = icmp sgt i32 %len.addr.07, 8 | ||
|  |   br i1 %cmp, label %while.body, label %while.end.loopexit | ||
|  | 
 | ||
|  | while.end.loopexit:                               ; preds = %while.body
 | ||
|  |   br label %while.end | ||
|  | 
 | ||
|  | while.end:                                        ; preds = %while.end.loopexit
 | ||
|  |   ret void | ||
|  | } |