X86Subtarget.h revision 221345
//=====---- X86Subtarget.h - Define Subtarget for the X86 -----*- C++ -*--====//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file declares the X86 specific subclass of TargetSubtarget.
//
//===----------------------------------------------------------------------===//
13241754Suqs
14241754Suqs#ifndef X86SUBTARGET_H
15241754Suqs#define X86SUBTARGET_H
16241754Suqs
17241754Suqs#include "llvm/ADT/Triple.h"
18241754Suqs#include "llvm/Target/TargetSubtarget.h"
19241754Suqs#include "llvm/CallingConv.h"
20241754Suqs#include <string>
21241754Suqs
22241754Suqsnamespace llvm {
23241754Suqsclass GlobalValue;
24241754Suqsclass TargetMachine;
25241754Suqs
/// PICStyles - The X86 backend supports a number of different styles of PIC.
/// The enumerators below name each supported style; X86Subtarget stores one
/// of them and exposes it through getPICStyle() / setPICStyle().
///
namespace PICStyles {
enum Style {
  StubPIC,          // Used on i386-darwin in -fPIC mode.
  StubDynamicNoPIC, // Used on i386-darwin in -mdynamic-no-pic mode.
  GOT,              // Used on many 32-bit unices in -fPIC mode.
  RIPRel,           // Used on X86-64 when not in -static mode.
  None              // Set when in -static mode (not PIC or DynamicNoPIC mode).
};
} // End PICStyles namespace
37241754Suqs
38241754Suqsclass X86Subtarget : public TargetSubtarget {
39241754Suqsprotected:
40241754Suqs  enum X86SSEEnum {
41241754Suqs    NoMMXSSE, MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42
42241754Suqs  };
43241754Suqs
44241754Suqs  enum X863DNowEnum {
45241754Suqs    NoThreeDNow, ThreeDNow, ThreeDNowA
46241754Suqs  };
47241754Suqs
48241754Suqs  /// PICStyle - Which PIC style to use
49241754Suqs  ///
50241754Suqs  PICStyles::Style PICStyle;
51241754Suqs
52241754Suqs  /// X86SSELevel - MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or
53241754Suqs  /// none supported.
54241754Suqs  X86SSEEnum X86SSELevel;
55241754Suqs
56241754Suqs  /// X863DNowLevel - 3DNow or 3DNow Athlon, or none supported.
57241754Suqs  ///
58241754Suqs  X863DNowEnum X863DNowLevel;
59
60  /// HasCMov - True if this processor has conditional move instructions
61  /// (generally pentium pro+).
62  bool HasCMov;
63
64  /// HasX86_64 - True if the processor supports X86-64 instructions.
65  ///
66  bool HasX86_64;
67
68  /// HasPOPCNT - True if the processor supports POPCNT.
69  bool HasPOPCNT;
70
71  /// HasSSE4A - True if the processor supports SSE4A instructions.
72  bool HasSSE4A;
73
74  /// HasAVX - Target has AVX instructions
75  bool HasAVX;
76
77  /// HasAES - Target has AES instructions
78  bool HasAES;
79
80  /// HasCLMUL - Target has carry-less multiplication
81  bool HasCLMUL;
82
83  /// HasFMA3 - Target has 3-operand fused multiply-add
84  bool HasFMA3;
85
86  /// HasFMA4 - Target has 4-operand fused multiply-add
87  bool HasFMA4;
88
89  /// IsBTMemSlow - True if BT (bit test) of memory instructions are slow.
90  bool IsBTMemSlow;
91
92  /// IsUAMemFast - True if unaligned memory access is fast.
93  bool IsUAMemFast;
94
95  /// HasVectorUAMem - True if SIMD operations can have unaligned memory
96  /// operands. This may require setting a feature bit in the processor.
97  bool HasVectorUAMem;
98
99  /// stackAlignment - The minimum alignment known to hold of the stack frame on
100  /// entry to the function and which must be maintained by every function.
101  unsigned stackAlignment;
102
103  /// Max. memset / memcpy size that is turned into rep/movs, rep/stos ops.
104  ///
105  unsigned MaxInlineSizeThreshold;
106
107  /// TargetTriple - What processor and OS we're targeting.
108  Triple TargetTriple;
109
110private:
111  /// Is64Bit - True if the processor supports 64-bit instructions and
112  /// pointer size is 64 bit.
113  bool Is64Bit;
114
115public:
116
117  /// This constructor initializes the data members to match that
118  /// of the specified triple.
119  ///
120  X86Subtarget(const std::string &TT, const std::string &FS, bool is64Bit);
121
122  /// getStackAlignment - Returns the minimum alignment known to hold of the
123  /// stack frame on entry to the function and which must be maintained by every
124  /// function for this subtarget.
125  unsigned getStackAlignment() const { return stackAlignment; }
126
127  /// getMaxInlineSizeThreshold - Returns the maximum memset / memcpy size
128  /// that still makes it profitable to inline the call.
129  unsigned getMaxInlineSizeThreshold() const { return MaxInlineSizeThreshold; }
130
131  /// ParseSubtargetFeatures - Parses features string setting specified
132  /// subtarget options.  Definition of function is auto generated by tblgen.
133  std::string ParseSubtargetFeatures(const std::string &FS,
134                                     const std::string &CPU);
135
136  /// AutoDetectSubtargetFeatures - Auto-detect CPU features using CPUID
137  /// instruction.
138  void AutoDetectSubtargetFeatures();
139
140  bool is64Bit() const { return Is64Bit; }
141
142  PICStyles::Style getPICStyle() const { return PICStyle; }
143  void setPICStyle(PICStyles::Style Style)  { PICStyle = Style; }
144
145  bool hasCMov() const { return HasCMov; }
146  bool hasMMX() const { return X86SSELevel >= MMX; }
147  bool hasSSE1() const { return X86SSELevel >= SSE1; }
148  bool hasSSE2() const { return X86SSELevel >= SSE2; }
149  bool hasSSE3() const { return X86SSELevel >= SSE3; }
150  bool hasSSSE3() const { return X86SSELevel >= SSSE3; }
151  bool hasSSE41() const { return X86SSELevel >= SSE41; }
152  bool hasSSE42() const { return X86SSELevel >= SSE42; }
153  bool hasSSE4A() const { return HasSSE4A; }
154  bool has3DNow() const { return X863DNowLevel >= ThreeDNow; }
155  bool has3DNowA() const { return X863DNowLevel >= ThreeDNowA; }
156  bool hasPOPCNT() const { return HasPOPCNT; }
157  bool hasAVX() const { return HasAVX; }
158  bool hasXMM() const { return hasSSE1() || hasAVX(); }
159  bool hasXMMInt() const { return hasSSE2() || hasAVX(); }
160  bool hasAES() const { return HasAES; }
161  bool hasCLMUL() const { return HasCLMUL; }
162  bool hasFMA3() const { return HasFMA3; }
163  bool hasFMA4() const { return HasFMA4; }
164  bool isBTMemSlow() const { return IsBTMemSlow; }
165  bool isUnalignedMemAccessFast() const { return IsUAMemFast; }
166  bool hasVectorUAMem() const { return HasVectorUAMem; }
167
168  const Triple &getTargetTriple() const { return TargetTriple; }
169
170  bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
171  bool isTargetFreeBSD() const {
172    return TargetTriple.getOS() == Triple::FreeBSD;
173  }
174  bool isTargetSolaris() const {
175    return TargetTriple.getOS() == Triple::Solaris;
176  }
177
178  // ELF is a reasonably sane default and the only other X86 targets we
179  // support are Darwin and Windows. Just use "not those".
180  bool isTargetELF() const {
181    return !isTargetDarwin() && !isTargetWindows() && !isTargetCygMing();
182  }
183  bool isTargetLinux() const { return TargetTriple.getOS() == Triple::Linux; }
184
185  bool isTargetWindows() const { return TargetTriple.getOS() == Triple::Win32; }
186  bool isTargetMingw() const { return TargetTriple.getOS() == Triple::MinGW32; }
187  bool isTargetCygwin() const { return TargetTriple.getOS() == Triple::Cygwin; }
188  bool isTargetCygMing() const {
189    return isTargetMingw() || isTargetCygwin();
190  }
191
192  /// isTargetCOFF - Return true if this is any COFF/Windows target variant.
193  bool isTargetCOFF() const {
194    return isTargetMingw() || isTargetCygwin() || isTargetWindows();
195  }
196
197  bool isTargetWin64() const {
198    return Is64Bit && (isTargetMingw() || isTargetWindows());
199  }
200
201  bool isTargetEnvMacho() const {
202    return isTargetDarwin() || (TargetTriple.getEnvironment() == Triple::MachO);
203  }
204
205  bool isTargetWin32() const {
206    return !Is64Bit && (isTargetMingw() || isTargetWindows());
207  }
208
209  bool isPICStyleSet() const { return PICStyle != PICStyles::None; }
210  bool isPICStyleGOT() const { return PICStyle == PICStyles::GOT; }
211  bool isPICStyleRIPRel() const { return PICStyle == PICStyles::RIPRel; }
212
213  bool isPICStyleStubPIC() const {
214    return PICStyle == PICStyles::StubPIC;
215  }
216
217  bool isPICStyleStubNoDynamic() const {
218    return PICStyle == PICStyles::StubDynamicNoPIC;
219  }
220  bool isPICStyleStubAny() const {
221    return PICStyle == PICStyles::StubDynamicNoPIC ||
222           PICStyle == PICStyles::StubPIC; }
223
224  /// ClassifyGlobalReference - Classify a global variable reference for the
225  /// current subtarget according to how we should reference it in a non-pcrel
226  /// context.
227  unsigned char ClassifyGlobalReference(const GlobalValue *GV,
228                                        const TargetMachine &TM)const;
229
230  /// ClassifyBlockAddressReference - Classify a blockaddress reference for the
231  /// current subtarget according to how we should reference it in a non-pcrel
232  /// context.
233  unsigned char ClassifyBlockAddressReference() const;
234
235  /// IsLegalToCallImmediateAddr - Return true if the subtarget allows calls
236  /// to immediate address.
237  bool IsLegalToCallImmediateAddr(const TargetMachine &TM) const;
238
239  /// This function returns the name of a function which has an interface
240  /// like the non-standard bzero function, if such a function exists on
241  /// the current subtarget and it is considered prefereable over
242  /// memset with zero passed as the second argument. Otherwise it
243  /// returns null.
244  const char *getBZeroEntry() const;
245
246  /// getSpecialAddressLatency - For targets where it is beneficial to
247  /// backschedule instructions that compute addresses, return a value
248  /// indicating the number of scheduling cycles of backscheduling that
249  /// should be attempted.
250  unsigned getSpecialAddressLatency() const;
251
252  /// IsCalleePop - Test whether a function should pop its own arguments.
253  bool IsCalleePop(bool isVarArg, CallingConv::ID CallConv) const;
254};
255
256} // End llvm namespace
257
258#endif
259