Changeset View
Changeset View
Standalone View
Standalone View
llvm/test/CodeGen/LoongArch/double-imm.ll
- This file was added.
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc --mtriple=loongarch32 --mattr=+d < %s | FileCheck %s --check-prefix=LA32
; RUN: llc --mtriple=loongarch64 --mattr=+d < %s | FileCheck %s --check-prefix=LA64

; Every function in this file is compiled twice, once per RUN line above
; (loongarch32 and loongarch64, both with the +d feature), and each run is
; matched against its own check prefix.
; Returns the f64 constant +0.0.
; Expected code: the 32-bit target moves $zero into $fa0 with movgr2fr.w and
; then applies fcvt.d.s; the 64-bit target uses a single movgr2fr.d from $zero.
define double @f64_positive_zero() nounwind {
; LA32-LABEL: f64_positive_zero:
; LA32: # %bb.0:
; LA32-NEXT: movgr2fr.w $fa0, $zero
; LA32-NEXT: fcvt.d.s $fa0, $fa0
; LA32-NEXT: jirl $zero, $ra, 0
;
; LA64-LABEL: f64_positive_zero:
; LA64: # %bb.0:
; LA64-NEXT: movgr2fr.d $fa0, $zero
; LA64-NEXT: jirl $zero, $ra, 0
  ret double 0.0
}
; Returns the f64 constant -0.0.
; Expected code: zero is moved from $zero into $fa0 and then negated
; (fneg.s followed by fcvt.d.s on the 32-bit target, fneg.d on the 64-bit
; target).
define double @f64_negative_zero() nounwind {
; LA32-LABEL: f64_negative_zero:
; LA32: # %bb.0:
; LA32-NEXT: movgr2fr.w $fa0, $zero
; LA32-NEXT: fneg.s $fa0, $fa0
; LA32-NEXT: fcvt.d.s $fa0, $fa0
; LA32-NEXT: jirl $zero, $ra, 0
;
; LA64-LABEL: f64_negative_zero:
; LA64: # %bb.0:
; LA64-NEXT: movgr2fr.d $fa0, $zero
; LA64-NEXT: fneg.d $fa0, $fa0
; LA64-NEXT: jirl $zero, $ra, 0
  ret double -0.0
}
; Returns an f64 constant (pi) that is not built from integer registers.
; Expected code on both targets: form the address of the constant-pool entry
; .LCPI2_0 with pcalau12i + addi.w/addi.d, then load it with fld.d.
define double @f64_constant_pi() nounwind {
; LA32-LABEL: f64_constant_pi:
; LA32: # %bb.0:
; LA32-NEXT: pcalau12i $a0, .LCPI2_0
; LA32-NEXT: addi.w $a0, $a0, .LCPI2_0
; LA32-NEXT: fld.d $fa0, $a0, 0
; LA32-NEXT: jirl $zero, $ra, 0
;
; LA64-LABEL: f64_constant_pi:
; LA64: # %bb.0:
; LA64-NEXT: pcalau12i $a0, .LCPI2_0
; LA64-NEXT: addi.d $a0, $a0, .LCPI2_0
; LA64-NEXT: fld.d $fa0, $a0, 0
; LA64-NEXT: jirl $zero, $ra, 0
  ret double 3.1415926535897931159979634685441851615905761718750
}
; Adds the f64 constant 1.0 to the argument %a.
; Expected code: integer 1 is placed in $a0, moved to $fa1 and converted to
; floating point (ffint.s.w + fcvt.d.s on the 32-bit target, ffint.d.l on the
; 64-bit target) before the fadd.d with $fa0.
define double @f64_add_fimm1(double %a) nounwind {
; LA32-LABEL: f64_add_fimm1:
; LA32: # %bb.0:
; LA32-NEXT: addi.w $a0, $zero, 1
; LA32-NEXT: movgr2fr.w $fa1, $a0
; LA32-NEXT: ffint.s.w $fa1, $fa1
; LA32-NEXT: fcvt.d.s $fa1, $fa1
; LA32-NEXT: fadd.d $fa0, $fa0, $fa1
; LA32-NEXT: jirl $zero, $ra, 0
;
; LA64-LABEL: f64_add_fimm1:
; LA64: # %bb.0:
; LA64-NEXT: addi.d $a0, $zero, 1
; LA64-NEXT: movgr2fr.d $fa1, $a0
; LA64-NEXT: ffint.d.l $fa1, $fa1
; LA64-NEXT: fadd.d $fa0, $fa0, $fa1
; LA64-NEXT: jirl $zero, $ra, 0
  %1 = fadd double %a, 1.0
  ret double %1
}
; Returns the f64 constant 1.0.
; Expected code: integer 1 is placed in $a0, moved to $fa0 and converted to
; floating point (ffint.s.w + fcvt.d.s on the 32-bit target, ffint.d.l on the
; 64-bit target).
;
; TODO (review note from xry111, attached to the 64-bit assertions): 1.0 could
; instead be produced with
;     lu52i.d $a0, $zero, 0x3ff
;     movgr2fr.d $fa0, $a0
; which saves one instruction. Reviewers xen0n and SixWeining agreed this is a
; peephole-style optimization, not closely related to the generic handling
; tested here, and that it should be implemented in a later patch.
define double @f64_positive_fimm1() nounwind {
; LA32-LABEL: f64_positive_fimm1:
; LA32: # %bb.0:
; LA32-NEXT: addi.w $a0, $zero, 1
; LA32-NEXT: movgr2fr.w $fa0, $a0
; LA32-NEXT: ffint.s.w $fa0, $fa0
; LA32-NEXT: fcvt.d.s $fa0, $fa0
; LA32-NEXT: jirl $zero, $ra, 0
;
; LA64-LABEL: f64_positive_fimm1:
; LA64: # %bb.0:
; LA64-NEXT: addi.d $a0, $zero, 1
; LA64-NEXT: movgr2fr.d $fa0, $a0
; LA64-NEXT: ffint.d.l $fa0, $fa0
; LA64-NEXT: jirl $zero, $ra, 0
  ret double 1.0
}
I'd suggest:
```
lu52i.d $a0, $zero, 0x3ff
movgr2fr.d $fa0, $a0
```
to save one instruction. The combination of lu52i.d and movgr2fr.d can always load $2^k$ as an f64 for every integer $k$ in $[0, 1023]$.
But as the patch is already approved, this can be done in a later revision.