blob: f548a8dd0532b279dd06951b144a048d9c86628c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
|
//===-- LoongArchTargetTransformInfo.cpp - LoongArch specific TTI ---------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
/// \file
/// This file implements a TargetTransformInfo analysis pass specific to the
/// LoongArch target machine. It uses the target's detailed information to
/// provide more precise answers to certain TTI queries, while letting the
/// target independent and default TTI implementations handle the rest.
///
//===----------------------------------------------------------------------===//
#include "LoongArchTargetTransformInfo.h"
using namespace llvm;
#define DEBUG_TYPE "loongarchtti"
TypeSize LoongArchTTIImpl::getRegisterBitWidth(
TargetTransformInfo::RegisterKind K) const {
TypeSize DefSize = TargetTransformInfoImplBase::getRegisterBitWidth(K);
switch (K) {
case TargetTransformInfo::RGK_Scalar:
return TypeSize::getFixed(ST->is64Bit() ? 64 : 32);
case TargetTransformInfo::RGK_FixedWidthVector:
if (ST->hasExtLASX())
return TypeSize::getFixed(256);
if (ST->hasExtLSX())
return TypeSize::getFixed(128);
[[fallthrough]];
case TargetTransformInfo::RGK_ScalableVector:
return DefSize;
}
llvm_unreachable("Unsupported register kind");
}
unsigned LoongArchTTIImpl::getNumberOfRegisters(unsigned ClassID) const {
switch (ClassID) {
case LoongArchRegisterClass::GPRRC:
// 30 = 32 GPRs - r0 (zero register) - r21 (non-allocatable)
return 30;
case LoongArchRegisterClass::FPRRC:
return ST->hasBasicF() ? 32 : 0;
case LoongArchRegisterClass::VRRC:
return ST->hasExtLSX() ? 32 : 0;
}
llvm_unreachable("unknown register class");
}
unsigned LoongArchTTIImpl::getRegisterClassForType(bool Vector,
Type *Ty) const {
if (Vector)
return LoongArchRegisterClass::VRRC;
if (!Ty)
return LoongArchRegisterClass::GPRRC;
Type *ScalarTy = Ty->getScalarType();
if ((ScalarTy->isFloatTy() && ST->hasBasicF()) ||
(ScalarTy->isDoubleTy() && ST->hasBasicD())) {
return LoongArchRegisterClass::FPRRC;
}
return LoongArchRegisterClass::GPRRC;
}
unsigned LoongArchTTIImpl::getMaxInterleaveFactor(ElementCount VF) const {
return ST->getMaxInterleaveFactor();
}
const char *LoongArchTTIImpl::getRegisterClassName(unsigned ClassID) const {
switch (ClassID) {
case LoongArchRegisterClass::GPRRC:
return "LoongArch::GPRRC";
case LoongArchRegisterClass::FPRRC:
return "LoongArch::FPRRC";
case LoongArchRegisterClass::VRRC:
return "LoongArch::VRRC";
}
llvm_unreachable("unknown register class");
}
TargetTransformInfo::PopcntSupportKind
LoongArchTTIImpl::getPopcntSupport(unsigned TyWidth) const {
assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");
return ST->hasExtLSX() ? TTI::PSK_FastHardware : TTI::PSK_Software;
}
unsigned LoongArchTTIImpl::getCacheLineSize() const { return 64; }
unsigned LoongArchTTIImpl::getPrefetchDistance() const { return 200; }
bool LoongArchTTIImpl::enableWritePrefetching() const { return true; }
bool LoongArchTTIImpl::shouldExpandReduction(const IntrinsicInst *II) const {
switch (II->getIntrinsicID()) {
default:
return true;
case Intrinsic::vector_reduce_add:
case Intrinsic::vector_reduce_and:
case Intrinsic::vector_reduce_or:
case Intrinsic::vector_reduce_smax:
case Intrinsic::vector_reduce_smin:
case Intrinsic::vector_reduce_umax:
case Intrinsic::vector_reduce_umin:
case Intrinsic::vector_reduce_xor:
return false;
}
}
// TODO: Implement more hooks to provide TTI machinery for LoongArch.
|