You've already forked linux-packaging-mono
Imported Upstream version 5.18.0.205
Former-commit-id: 7f59f7e792705db773f1caecdaa823092f4e2927
This commit is contained in:
parent
5cd5df71cc
commit
8e12397d70
33
external/llvm/test/CodeGen/NVPTX/fp-contract.ll
vendored
Normal file
33
external/llvm/test/CodeGen/NVPTX/fp-contract.ll
vendored
Normal file
@ -0,0 +1,33 @@
|
||||
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 -fp-contract=fast | FileCheck %s --check-prefix=FAST
|
||||
; RUN: llc < %s -march=nvptx64 -mcpu=sm_30 | FileCheck %s --check-prefix=DEFAULT
|
||||
|
||||
target triple = "nvptx64-unknown-cuda"
|
||||
|
||||
;; Make sure we are generating proper instruction sequences for fused ops
|
||||
;; If fusion is allowed, we try to form fma.rn at the PTX level, and emit
|
||||
;; add.f32 otherwise. Without an explicit rounding mode on add.f32, ptxas
|
||||
;; is free to fuse with a multiply if it is able. If fusion is not allowed,
|
||||
;; we do not form fma.rn at the PTX level and explicitly generate add.rn
|
||||
;; for all adds to prevent ptxas from fusion the ops.
|
||||
|
||||
;; FAST-LABEL: @t0
|
||||
;; DEFAULT-LABEL: @t0
|
||||
define float @t0(float %a, float %b, float %c) {
|
||||
;; FAST: fma.rn.f32
|
||||
;; DEFAULT: mul.rn.f32
|
||||
;; DEFAULT: add.rn.f32
|
||||
%v0 = fmul float %a, %b
|
||||
%v1 = fadd float %v0, %c
|
||||
ret float %v1
|
||||
}
|
||||
|
||||
;; FAST-LABEL: @t1
|
||||
;; DEFAULT-LABEL: @t1
|
||||
define float @t1(float %a, float %b) {
|
||||
;; We cannot form an fma here, but make sure we explicitly emit add.rn.f32
|
||||
;; to prevent ptxas from fusing this with anything else.
|
||||
;; FAST: add.f32
|
||||
;; DEFAULT: add.rn.f32
|
||||
%v1 = fadd float %a, %b
|
||||
ret float %v1
|
||||
}
|
Reference in New Issue
Block a user