Changeset View
Changeset View
Standalone View
Standalone View
llvm/trunk/test/CodeGen/SystemZ/fp-strict-sqrt-02.ll
; Test strict 64-bit square root. | ; Test strict 64-bit square root. | ||||
; | ; | ||||
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z10 \ | ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z10 \ | ||||
; RUN: | FileCheck -check-prefix=CHECK -check-prefix=CHECK-SCALAR %s | ; RUN: | FileCheck -check-prefix=CHECK -check-prefix=CHECK-SCALAR %s | ||||
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s | ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s | ||||
declare double @llvm.experimental.constrained.sqrt.f64(double, metadata, metadata) | declare double @llvm.experimental.constrained.sqrt.f64(double, metadata, metadata) | ||||
; Check register square root. | ; Check register square root. | ||||
define double @f1(double %val) { | define double @f1(double %val) #0 { | ||||
; CHECK-LABEL: f1: | ; CHECK-LABEL: f1: | ||||
; CHECK: sqdbr %f0, %f0 | ; CHECK: sqdbr %f0, %f0 | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
; Check the low end of the SQDB range. | ; Check the low end of the SQDB range. | ||||
define double @f2(double *%ptr) { | define double @f2(double *%ptr) #0 { | ||||
; CHECK-LABEL: f2: | ; CHECK-LABEL: f2: | ||||
; CHECK: sqdb %f0, 0(%r2) | ; CHECK: sqdb %f0, 0(%r2) | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%val = load double, double *%ptr | %val = load double, double *%ptr | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
; Check the high end of the aligned SQDB range. | ; Check the high end of the aligned SQDB range. | ||||
define double @f3(double *%base) { | define double @f3(double *%base) #0 { | ||||
; CHECK-LABEL: f3: | ; CHECK-LABEL: f3: | ||||
; CHECK: sqdb %f0, 4088(%r2) | ; CHECK: sqdb %f0, 4088(%r2) | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%ptr = getelementptr double, double *%base, i64 511 | %ptr = getelementptr double, double *%base, i64 511 | ||||
%val = load double, double *%ptr | %val = load double, double *%ptr | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
; Check the next doubleword up, which needs separate address logic. | ; Check the next doubleword up, which needs separate address logic. | ||||
; Other sequences besides this one would be OK. | ; Other sequences besides this one would be OK. | ||||
define double @f4(double *%base) { | define double @f4(double *%base) #0 { | ||||
; CHECK-LABEL: f4: | ; CHECK-LABEL: f4: | ||||
; CHECK: aghi %r2, 4096 | ; CHECK: aghi %r2, 4096 | ||||
; CHECK: sqdb %f0, 0(%r2) | ; CHECK: sqdb %f0, 0(%r2) | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%ptr = getelementptr double, double *%base, i64 512 | %ptr = getelementptr double, double *%base, i64 512 | ||||
%val = load double, double *%ptr | %val = load double, double *%ptr | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
; Check negative displacements, which also need separate address logic. | ; Check negative displacements, which also need separate address logic. | ||||
define double @f5(double *%base) { | define double @f5(double *%base) #0 { | ||||
; CHECK-LABEL: f5: | ; CHECK-LABEL: f5: | ||||
; CHECK: aghi %r2, -8 | ; CHECK: aghi %r2, -8 | ||||
; CHECK: sqdb %f0, 0(%r2) | ; CHECK: sqdb %f0, 0(%r2) | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%ptr = getelementptr double, double *%base, i64 -1 | %ptr = getelementptr double, double *%base, i64 -1 | ||||
%val = load double, double *%ptr | %val = load double, double *%ptr | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
; Check that SQDB allows indices. | ; Check that SQDB allows indices. | ||||
define double @f6(double *%base, i64 %index) { | define double @f6(double *%base, i64 %index) #0 { | ||||
; CHECK-LABEL: f6: | ; CHECK-LABEL: f6: | ||||
; CHECK: sllg %r1, %r3, 3 | ; CHECK: sllg %r1, %r3, 3 | ||||
; CHECK: sqdb %f0, 800(%r1,%r2) | ; CHECK: sqdb %f0, 800(%r1,%r2) | ||||
; CHECK: br %r14 | ; CHECK: br %r14 | ||||
%ptr1 = getelementptr double, double *%base, i64 %index | %ptr1 = getelementptr double, double *%base, i64 %index | ||||
%ptr2 = getelementptr double, double *%ptr1, i64 100 | %ptr2 = getelementptr double, double *%ptr1, i64 100 | ||||
%val = load double, double *%ptr2 | %val = load double, double *%ptr2 | ||||
%res = call double @llvm.experimental.constrained.sqrt.f64( | %res = call double @llvm.experimental.constrained.sqrt.f64( | ||||
double %val, | double %val, | ||||
metadata !"round.dynamic", | metadata !"round.dynamic", | ||||
metadata !"fpexcept.strict") | metadata !"fpexcept.strict") #0 | ||||
ret double %res | ret double %res | ||||
} | } | ||||
attributes #0 = { strictfp } |