Please use GitHub pull requests for new patches. Phabricator shutdown timeline
Changeset View
Changeset View
Standalone View
Standalone View
llvm/test/CodeGen/RISCV/copysign-casts.ll
- This file was added.
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py | |||||
; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \ | |||||
; RUN: | FileCheck %s -check-prefix=RV32I | |||||
; RUN: llc -mtriple=riscv64 -verify-machineinstrs < %s \ | |||||
; RUN: | FileCheck %s -check-prefix=RV64I | |||||
; RUN: llc -mtriple=riscv32 -verify-machineinstrs -mattr=+f \ | |||||
; RUN: -target-abi ilp32f < %s | FileCheck %s -check-prefix=RV32IF | |||||
; RUN: llc -mtriple=riscv32 -verify-machineinstrs -mattr=+f \ | |||||
; RUN: < %s | FileCheck %s -check-prefix=RV32IF-ILP32 | |||||
; RUN: llc -mtriple=riscv32 -verify-machineinstrs -mattr=+f -mattr=+d \ | |||||
; RUN: -target-abi ilp32d < %s | FileCheck %s -check-prefix=RV32IFD | |||||
; RUN: llc -mtriple=riscv64 -verify-machineinstrs -mattr=+f -mattr=+d \ | |||||
; RUN: -target-abi lp64d < %s | FileCheck %s -check-prefix=RV64IFD | |||||
; Check that DAGCombiner only folds casts into the sign argument of copysign | |||||
; when appropriate (i.e. when it would be expanded because we don't handle mixed | |||||
; precision magnitude and sign arguments). | |||||
declare double @llvm.copysign.f64(double, double) | |||||
declare float @llvm.copysign.f32(float, float) | |||||
define double @fold_promote(double %a, float %b) nounwind { | |||||
; RV32I-LABEL: fold_promote: | |||||
; RV32I: # %bb.0: | |||||
; RV32I-NEXT: lui a3, 524288 | |||||
; RV32I-NEXT: and a2, a2, a3 | |||||
; RV32I-NEXT: addi a3, a3, -1 | |||||
; RV32I-NEXT: and a1, a1, a3 | |||||
; RV32I-NEXT: or a1, a1, a2 | |||||
; RV32I-NEXT: ret | |||||
; | |||||
; RV64I-LABEL: fold_promote: | |||||
; RV64I: # %bb.0: | |||||
; RV64I-NEXT: addi a2, zero, -1 | |||||
; RV64I-NEXT: slli a2, a2, 63 | |||||
; RV64I-NEXT: addi a2, a2, -1 | |||||
; RV64I-NEXT: and a0, a0, a2 | |||||
; RV64I-NEXT: addi a2, zero, 1 | |||||
; RV64I-NEXT: slli a2, a2, 31 | |||||
; RV64I-NEXT: and a1, a1, a2 | |||||
; RV64I-NEXT: slli a1, a1, 32 | |||||
; RV64I-NEXT: or a0, a0, a1 | |||||
; RV64I-NEXT: ret | |||||
; | |||||
; RV32IF-LABEL: fold_promote: | |||||
; RV32IF: # %bb.0: | |||||
; RV32IF-NEXT: fmv.x.w a2, fa0 | |||||
; RV32IF-NEXT: lui a3, 524288 | |||||
; RV32IF-NEXT: and a2, a2, a3 | |||||
; RV32IF-NEXT: addi a3, a3, -1 | |||||
; RV32IF-NEXT: and a1, a1, a3 | |||||
; RV32IF-NEXT: or a1, a1, a2 | |||||
; RV32IF-NEXT: ret | |||||
; | |||||
; RV32IF-ILP32-LABEL: fold_promote: | |||||
; RV32IF-ILP32: # %bb.0: | |||||
; RV32IF-ILP32-NEXT: lui a3, 524288 | |||||
; RV32IF-ILP32-NEXT: and a2, a2, a3 | |||||
; RV32IF-ILP32-NEXT: addi a3, a3, -1 | |||||
; RV32IF-ILP32-NEXT: and a1, a1, a3 | |||||
; RV32IF-ILP32-NEXT: or a1, a1, a2 | |||||
; RV32IF-ILP32-NEXT: ret | |||||
; | |||||
; RV32IFD-LABEL: fold_promote: | |||||
; RV32IFD: # %bb.0: | |||||
; RV32IFD-NEXT: fcvt.d.s ft0, fa1 | |||||
; RV32IFD-NEXT: fsgnj.d fa0, fa0, ft0 | |||||
; RV32IFD-NEXT: ret | |||||
; | |||||
; RV64IFD-LABEL: fold_promote: | |||||
; RV64IFD: # %bb.0: | |||||
; RV64IFD-NEXT: fcvt.d.s ft0, fa1 | |||||
; RV64IFD-NEXT: fsgnj.d fa0, fa0, ft0 | |||||
; RV64IFD-NEXT: ret | |||||
%c = fpext float %b to double | |||||
%t = call double @llvm.copysign.f64(double %a, double %c) | |||||
ret double %t | |||||
} | |||||
define float @fold_demote(float %a, double %b) nounwind { | |||||
; RV32I-LABEL: fold_demote: | |||||
; RV32I: # %bb.0: | |||||
; RV32I-NEXT: lui a1, 524288 | |||||
; RV32I-NEXT: and a2, a2, a1 | |||||
; RV32I-NEXT: addi a1, a1, -1 | |||||
; RV32I-NEXT: and a0, a0, a1 | |||||
; RV32I-NEXT: or a0, a0, a2 | |||||
; RV32I-NEXT: ret | |||||
; | |||||
; RV64I-LABEL: fold_demote: | |||||
; RV64I: # %bb.0: | |||||
; RV64I-NEXT: lui a2, 524288 | |||||
; RV64I-NEXT: addiw a2, a2, -1 | |||||
; RV64I-NEXT: and a0, a0, a2 | |||||
; RV64I-NEXT: addi a2, zero, -1 | |||||
; RV64I-NEXT: slli a2, a2, 63 | |||||
; RV64I-NEXT: and a1, a1, a2 | |||||
; RV64I-NEXT: srli a1, a1, 32 | |||||
; RV64I-NEXT: or a0, a0, a1 | |||||
; RV64I-NEXT: ret | |||||
; | |||||
; RV32IF-LABEL: fold_demote: | |||||
; RV32IF: # %bb.0: | |||||
; RV32IF-NEXT: addi sp, sp, -16 | |||||
; RV32IF-NEXT: sw ra, 12(sp) | |||||
; RV32IF-NEXT: fsw fs0, 8(sp) | |||||
; RV32IF-NEXT: fmv.s fs0, fa0 | |||||
; RV32IF-NEXT: call __truncdfsf2 | |||||
; RV32IF-NEXT: fsgnj.s fa0, fs0, fa0 | |||||
; RV32IF-NEXT: flw fs0, 8(sp) | |||||
; RV32IF-NEXT: lw ra, 12(sp) | |||||
; RV32IF-NEXT: addi sp, sp, 16 | |||||
; RV32IF-NEXT: ret | |||||
; | |||||
; RV32IF-ILP32-LABEL: fold_demote: | |||||
; RV32IF-ILP32: # %bb.0: | |||||
; RV32IF-ILP32-NEXT: addi sp, sp, -16 | |||||
; RV32IF-ILP32-NEXT: sw ra, 12(sp) | |||||
; RV32IF-ILP32-NEXT: fmv.w.x ft0, a0 | |||||
; RV32IF-ILP32-NEXT: fsw ft0, 8(sp) | |||||
; RV32IF-ILP32-NEXT: mv a0, a1 | |||||
; RV32IF-ILP32-NEXT: mv a1, a2 | |||||
; RV32IF-ILP32-NEXT: call __truncdfsf2 | |||||
; RV32IF-ILP32-NEXT: fmv.w.x ft0, a0 | |||||
; RV32IF-ILP32-NEXT: flw ft1, 8(sp) | |||||
; RV32IF-ILP32-NEXT: fsgnj.s ft0, ft1, ft0 | |||||
; RV32IF-ILP32-NEXT: fmv.x.w a0, ft0 | |||||
; RV32IF-ILP32-NEXT: lw ra, 12(sp) | |||||
; RV32IF-ILP32-NEXT: addi sp, sp, 16 | |||||
; RV32IF-ILP32-NEXT: ret | |||||
; | |||||
; RV32IFD-LABEL: fold_demote: | |||||
; RV32IFD: # %bb.0: | |||||
; RV32IFD-NEXT: fcvt.s.d ft0, fa1 | |||||
; RV32IFD-NEXT: fsgnj.s fa0, fa0, ft0 | |||||
; RV32IFD-NEXT: ret | |||||
; | |||||
; RV64IFD-LABEL: fold_demote: | |||||
; RV64IFD: # %bb.0: | |||||
; RV64IFD-NEXT: fcvt.s.d ft0, fa1 | |||||
; RV64IFD-NEXT: fsgnj.s fa0, fa0, ft0 | |||||
; RV64IFD-NEXT: ret | |||||
%c = fptrunc double %b to float | |||||
%t = call float @llvm.copysign.f32(float %a, float %c) | |||||
ret float %t | |||||
} |