aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorBen Shi <2283975856@qq.com>2023-06-11 08:36:16 +0800
committerBen Shi <2283975856@qq.com>2023-06-11 08:36:22 +0800
commite21df8296d09aff68039520ca1ab7dc4907922a2 (patch)
tree8b38d119414fff1982c7b0f833d3d414c1a22585
parent2509c93edd36a20a0aeb5e6d612dae5b770bc987 (diff)
downloadllvm-e21df8296d09aff68039520ca1ab7dc4907922a2.zip
llvm-e21df8296d09aff68039520ca1ab7dc4907922a2.tar.gz
llvm-e21df8296d09aff68039520ca1ab7dc4907922a2.tar.bz2
[AVR] Optimize 8-bit rotation when rotation bits >= 4
Fixes https://github.com/llvm/llvm-project/issues/63100 Reviewed By: aykevl, Patryk27, jacquesguan Differential Revision: https://reviews.llvm.org/D152130
-rw-r--r--llvm/lib/Target/AVR/AVRISelLowering.cpp15
-rw-r--r--llvm/test/CodeGen/AVR/rotate.ll62
2 files changed, 22 insertions, 55 deletions
diff --git a/llvm/lib/Target/AVR/AVRISelLowering.cpp b/llvm/lib/Target/AVR/AVRISelLowering.cpp
index 606e70b..d0314fb 100644
--- a/llvm/lib/Target/AVR/AVRISelLowering.cpp
+++ b/llvm/lib/Target/AVR/AVRISelLowering.cpp
@@ -427,6 +427,21 @@ SDValue AVRTargetLowering::LowerShifts(SDValue Op, SelectionDAG &DAG) const {
Victim = DAG.getNode(AVRISD::ASRBN, dl, VT, Victim,
DAG.getConstant(7, dl, VT));
ShiftAmount = 0;
+ } else if (Op.getOpcode() == ISD::ROTL && ShiftAmount == 7) {
+ // Optimize left rotation 7 bits to right rotation 1 bit.
+ Victim =
+ DAG.getNode(AVRISD::ROR, dl, VT, Victim, DAG.getConstant(1, dl, VT));
+ ShiftAmount = 0;
+ } else if (Op.getOpcode() == ISD::ROTR && ShiftAmount == 7) {
+ // Optimize right rotation 7 bits to left rotation 1 bit.
+ Victim =
+ DAG.getNode(AVRISD::ROL, dl, VT, Victim, DAG.getConstant(1, dl, VT));
+ ShiftAmount = 0;
+ } else if ((Op.getOpcode() == ISD::ROTR || Op.getOpcode() == ISD::ROTL) &&
+ ShiftAmount >= 4) {
+ // Optimize left/right rotation with the SWAP instruction.
+ Victim = DAG.getNode(AVRISD::SWAP, dl, VT, Victim);
+ ShiftAmount -= 4;
}
} else if (VT.getSizeInBits() == 16) {
if (Op.getOpcode() == ISD::SRA)
diff --git a/llvm/test/CodeGen/AVR/rotate.ll b/llvm/test/CodeGen/AVR/rotate.ll
index bf31fac..938b64f 100644
--- a/llvm/test/CodeGen/AVR/rotate.ll
+++ b/llvm/test/CodeGen/AVR/rotate.ll
@@ -30,14 +30,7 @@ start:
define i8 @rotl8_5(i8 %x) {
; CHECK-LABEL: rotl8_5:
; CHECK: ; %bb.0: ; %start
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
+; CHECK-NEXT: swap r24
; CHECK-NEXT: lsl r24
; CHECK-NEXT: adc r24, r1
; CHECK-NEXT: ret
@@ -49,20 +42,9 @@ start:
define i8 @rotl8_7(i8 %x) {
; CHECK-LABEL: rotl8_7:
; CHECK: ; %bb.0: ; %start
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
-; CHECK-NEXT: lsl r24
-; CHECK-NEXT: adc r24, r1
+; CHECK-NEXT: bst r24, 0
+; CHECK-NEXT: ror r24
+; CHECK-NEXT: bld r24, 7
; CHECK-NEXT: ret
start:
%0 = call i8 @llvm.fshl.i8(i8 %x, i8 %x, i8 7)
@@ -121,18 +103,7 @@ start:
define i8 @rotr8_5(i8 %x) {
; CHECK-LABEL: rotr8_5:
; CHECK: ; %bb.0: ; %start
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
+; CHECK-NEXT: swap r24
; CHECK-NEXT: bst r24, 0
; CHECK-NEXT: ror r24
; CHECK-NEXT: bld r24, 7
@@ -145,27 +116,8 @@ start:
define i8 @rotr8_7(i8 %x) {
; CHECK-LABEL: rotr8_7:
; CHECK: ; %bb.0: ; %start
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
-; CHECK-NEXT: bst r24, 0
-; CHECK-NEXT: ror r24
-; CHECK-NEXT: bld r24, 7
+; CHECK-NEXT: lsl r24
+; CHECK-NEXT: adc r24, r1
; CHECK-NEXT: ret
start:
%0 = call i8 @llvm.fshr.i8(i8 %x, i8 %x, i8 7)