2
0

TargetLibraryInfo.cpp 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609
  1. //===-- TargetLibraryInfo.cpp - Runtime library information ----------------==//
  2. //
  3. // The LLVM Compiler Infrastructure
  4. //
  5. // This file is distributed under the University of Illinois Open Source
  6. // License. See LICENSE.TXT for details.
  7. //
  8. //===----------------------------------------------------------------------===//
  9. //
  10. // This file implements the TargetLibraryInfo class.
  11. //
  12. //===----------------------------------------------------------------------===//
  13. #include "llvm/Analysis/TargetLibraryInfo.h"
  14. #include "llvm/ADT/Triple.h"
  15. #include "llvm/Support/CommandLine.h"
  16. using namespace llvm;
  17. #if 0 // HLSL Change Starts - option pending
  18. static cl::opt<TargetLibraryInfoImpl::VectorLibrary> ClVectorLibrary(
  19. "vector-library", cl::Hidden, cl::desc("Vector functions library"),
  20. cl::init(TargetLibraryInfoImpl::NoLibrary),
  21. cl::values(clEnumValN(TargetLibraryInfoImpl::NoLibrary, "none",
  22. "No vector functions library"),
  23. clEnumValN(TargetLibraryInfoImpl::Accelerate, "Accelerate",
  24. "Accelerate framework"),
  25. clEnumValEnd));
  26. #else
  27. static const TargetLibraryInfoImpl::VectorLibrary ClVectorLibrary = TargetLibraryInfoImpl::NoLibrary;
  28. #endif // HLSL Change Ends
  29. const char *const TargetLibraryInfoImpl::StandardNames[LibFunc::NumLibFuncs] = {
  30. #define TLI_DEFINE_STRING
  31. #include "llvm/Analysis/TargetLibraryInfo.def"
  32. };
  33. static bool hasSinCosPiStret(const Triple &T) {
  34. // Only Darwin variants have _stret versions of combined trig functions.
  35. if (!T.isOSDarwin())
  36. return false;
  37. // The ABI is rather complicated on x86, so don't do anything special there.
  38. if (T.getArch() == Triple::x86)
  39. return false;
  40. if (T.isMacOSX() && T.isMacOSXVersionLT(10, 9))
  41. return false;
  42. if (T.isiOS() && T.isOSVersionLT(7, 0))
  43. return false;
  44. return true;
  45. }
  46. /// initialize - Initialize the set of available library functions based on the
  47. /// specified target triple. This should be carefully written so that a missing
  48. /// target triple gets a sane set of defaults.
  49. static void initialize(TargetLibraryInfoImpl &TLI, const Triple &T,
  50. const char *const *StandardNames) {
  51. #ifndef NDEBUG
  52. // Verify that the StandardNames array is in alphabetical order.
  53. for (unsigned F = 1; F < LibFunc::NumLibFuncs; ++F) {
  54. if (strcmp(StandardNames[F-1], StandardNames[F]) >= 0)
  55. llvm_unreachable("TargetLibraryInfoImpl function names must be sorted");
  56. }
  57. #endif // !NDEBUG
  58. // There are no library implementations of mempcy and memset for AMD gpus and
  59. // these can be difficult to lower in the backend.
  60. if (T.getArch() == Triple::r600 ||
  61. T.getArch() == Triple::dxil || // HLSL Change
  62. T.getArch() == Triple::dxil64 || // HLSL Change
  63. T.getArch() == Triple::amdgcn) {
  64. TLI.setUnavailable(LibFunc::memcpy);
  65. TLI.setUnavailable(LibFunc::memset);
  66. TLI.setUnavailable(LibFunc::memset_pattern16);
  67. return;
  68. }
  69. // memset_pattern16 is only available on iOS 3.0 and Mac OS X 10.5 and later.
  70. if (T.isMacOSX()) {
  71. if (T.isMacOSXVersionLT(10, 5))
  72. TLI.setUnavailable(LibFunc::memset_pattern16);
  73. } else if (T.isiOS()) {
  74. if (T.isOSVersionLT(3, 0))
  75. TLI.setUnavailable(LibFunc::memset_pattern16);
  76. } else {
  77. TLI.setUnavailable(LibFunc::memset_pattern16);
  78. }
  79. if (!hasSinCosPiStret(T)) {
  80. TLI.setUnavailable(LibFunc::sinpi);
  81. TLI.setUnavailable(LibFunc::sinpif);
  82. TLI.setUnavailable(LibFunc::cospi);
  83. TLI.setUnavailable(LibFunc::cospif);
  84. TLI.setUnavailable(LibFunc::sincospi_stret);
  85. TLI.setUnavailable(LibFunc::sincospif_stret);
  86. }
  87. if (T.isMacOSX() && T.getArch() == Triple::x86 &&
  88. !T.isMacOSXVersionLT(10, 7)) {
  89. // x86-32 OSX has a scheme where fwrite and fputs (and some other functions
  90. // we don't care about) have two versions; on recent OSX, the one we want
  91. // has a $UNIX2003 suffix. The two implementations are identical except
  92. // for the return value in some edge cases. However, we don't want to
  93. // generate code that depends on the old symbols.
  94. TLI.setAvailableWithName(LibFunc::fwrite, "fwrite$UNIX2003");
  95. TLI.setAvailableWithName(LibFunc::fputs, "fputs$UNIX2003");
  96. }
  97. // iprintf and friends are only available on XCore and TCE.
  98. if (T.getArch() != Triple::xcore && T.getArch() != Triple::tce) {
  99. TLI.setUnavailable(LibFunc::iprintf);
  100. TLI.setUnavailable(LibFunc::siprintf);
  101. TLI.setUnavailable(LibFunc::fiprintf);
  102. }
  103. if (T.isOSWindows() && !T.isOSCygMing()) {
  104. // Win32 does not support long double
  105. TLI.setUnavailable(LibFunc::acosl);
  106. TLI.setUnavailable(LibFunc::asinl);
  107. TLI.setUnavailable(LibFunc::atanl);
  108. TLI.setUnavailable(LibFunc::atan2l);
  109. TLI.setUnavailable(LibFunc::ceill);
  110. TLI.setUnavailable(LibFunc::copysignl);
  111. TLI.setUnavailable(LibFunc::cosl);
  112. TLI.setUnavailable(LibFunc::coshl);
  113. TLI.setUnavailable(LibFunc::expl);
  114. TLI.setUnavailable(LibFunc::fabsf); // Win32 and Win64 both lack fabsf
  115. TLI.setUnavailable(LibFunc::fabsl);
  116. TLI.setUnavailable(LibFunc::floorl);
  117. TLI.setUnavailable(LibFunc::fmaxl);
  118. TLI.setUnavailable(LibFunc::fminl);
  119. TLI.setUnavailable(LibFunc::fmodl);
  120. TLI.setUnavailable(LibFunc::frexpl);
  121. TLI.setUnavailable(LibFunc::ldexpf);
  122. TLI.setUnavailable(LibFunc::ldexpl);
  123. TLI.setUnavailable(LibFunc::logl);
  124. TLI.setUnavailable(LibFunc::modfl);
  125. TLI.setUnavailable(LibFunc::powl);
  126. TLI.setUnavailable(LibFunc::sinl);
  127. TLI.setUnavailable(LibFunc::sinhl);
  128. TLI.setUnavailable(LibFunc::sqrtl);
  129. TLI.setUnavailable(LibFunc::tanl);
  130. TLI.setUnavailable(LibFunc::tanhl);
  131. // Win32 only has C89 math
  132. TLI.setUnavailable(LibFunc::acosh);
  133. TLI.setUnavailable(LibFunc::acoshf);
  134. TLI.setUnavailable(LibFunc::acoshl);
  135. TLI.setUnavailable(LibFunc::asinh);
  136. TLI.setUnavailable(LibFunc::asinhf);
  137. TLI.setUnavailable(LibFunc::asinhl);
  138. TLI.setUnavailable(LibFunc::atanh);
  139. TLI.setUnavailable(LibFunc::atanhf);
  140. TLI.setUnavailable(LibFunc::atanhl);
  141. TLI.setUnavailable(LibFunc::cbrt);
  142. TLI.setUnavailable(LibFunc::cbrtf);
  143. TLI.setUnavailable(LibFunc::cbrtl);
  144. TLI.setUnavailable(LibFunc::exp2);
  145. TLI.setUnavailable(LibFunc::exp2f);
  146. TLI.setUnavailable(LibFunc::exp2l);
  147. TLI.setUnavailable(LibFunc::expm1);
  148. TLI.setUnavailable(LibFunc::expm1f);
  149. TLI.setUnavailable(LibFunc::expm1l);
  150. TLI.setUnavailable(LibFunc::log2);
  151. TLI.setUnavailable(LibFunc::log2f);
  152. TLI.setUnavailable(LibFunc::log2l);
  153. TLI.setUnavailable(LibFunc::log1p);
  154. TLI.setUnavailable(LibFunc::log1pf);
  155. TLI.setUnavailable(LibFunc::log1pl);
  156. TLI.setUnavailable(LibFunc::logb);
  157. TLI.setUnavailable(LibFunc::logbf);
  158. TLI.setUnavailable(LibFunc::logbl);
  159. TLI.setUnavailable(LibFunc::nearbyint);
  160. TLI.setUnavailable(LibFunc::nearbyintf);
  161. TLI.setUnavailable(LibFunc::nearbyintl);
  162. TLI.setUnavailable(LibFunc::rint);
  163. TLI.setUnavailable(LibFunc::rintf);
  164. TLI.setUnavailable(LibFunc::rintl);
  165. TLI.setUnavailable(LibFunc::round);
  166. TLI.setUnavailable(LibFunc::roundf);
  167. TLI.setUnavailable(LibFunc::roundl);
  168. TLI.setUnavailable(LibFunc::trunc);
  169. TLI.setUnavailable(LibFunc::truncf);
  170. TLI.setUnavailable(LibFunc::truncl);
  171. // Win32 provides some C99 math with mangled names
  172. TLI.setAvailableWithName(LibFunc::copysign, "_copysign");
  173. if (T.getArch() == Triple::x86) {
  174. // Win32 on x86 implements single-precision math functions as macros
  175. TLI.setUnavailable(LibFunc::acosf);
  176. TLI.setUnavailable(LibFunc::asinf);
  177. TLI.setUnavailable(LibFunc::atanf);
  178. TLI.setUnavailable(LibFunc::atan2f);
  179. TLI.setUnavailable(LibFunc::ceilf);
  180. TLI.setUnavailable(LibFunc::copysignf);
  181. TLI.setUnavailable(LibFunc::cosf);
  182. TLI.setUnavailable(LibFunc::coshf);
  183. TLI.setUnavailable(LibFunc::expf);
  184. TLI.setUnavailable(LibFunc::floorf);
  185. TLI.setUnavailable(LibFunc::fminf);
  186. TLI.setUnavailable(LibFunc::fmaxf);
  187. TLI.setUnavailable(LibFunc::fmodf);
  188. TLI.setUnavailable(LibFunc::logf);
  189. TLI.setUnavailable(LibFunc::powf);
  190. TLI.setUnavailable(LibFunc::sinf);
  191. TLI.setUnavailable(LibFunc::sinhf);
  192. TLI.setUnavailable(LibFunc::sqrtf);
  193. TLI.setUnavailable(LibFunc::tanf);
  194. TLI.setUnavailable(LibFunc::tanhf);
  195. }
  196. // Win32 does *not* provide provide these functions, but they are
  197. // generally available on POSIX-compliant systems:
  198. TLI.setUnavailable(LibFunc::access);
  199. TLI.setUnavailable(LibFunc::bcmp);
  200. TLI.setUnavailable(LibFunc::bcopy);
  201. TLI.setUnavailable(LibFunc::bzero);
  202. TLI.setUnavailable(LibFunc::chmod);
  203. TLI.setUnavailable(LibFunc::chown);
  204. TLI.setUnavailable(LibFunc::closedir);
  205. TLI.setUnavailable(LibFunc::ctermid);
  206. TLI.setUnavailable(LibFunc::fdopen);
  207. TLI.setUnavailable(LibFunc::ffs);
  208. TLI.setUnavailable(LibFunc::fileno);
  209. TLI.setUnavailable(LibFunc::flockfile);
  210. TLI.setUnavailable(LibFunc::fseeko);
  211. TLI.setUnavailable(LibFunc::fstat);
  212. TLI.setUnavailable(LibFunc::fstatvfs);
  213. TLI.setUnavailable(LibFunc::ftello);
  214. TLI.setUnavailable(LibFunc::ftrylockfile);
  215. TLI.setUnavailable(LibFunc::funlockfile);
  216. TLI.setUnavailable(LibFunc::getc_unlocked);
  217. TLI.setUnavailable(LibFunc::getitimer);
  218. TLI.setUnavailable(LibFunc::getlogin_r);
  219. TLI.setUnavailable(LibFunc::getpwnam);
  220. TLI.setUnavailable(LibFunc::gettimeofday);
  221. TLI.setUnavailable(LibFunc::htonl);
  222. TLI.setUnavailable(LibFunc::htons);
  223. TLI.setUnavailable(LibFunc::lchown);
  224. TLI.setUnavailable(LibFunc::lstat);
  225. TLI.setUnavailable(LibFunc::memccpy);
  226. TLI.setUnavailable(LibFunc::mkdir);
  227. TLI.setUnavailable(LibFunc::ntohl);
  228. TLI.setUnavailable(LibFunc::ntohs);
  229. TLI.setUnavailable(LibFunc::open);
  230. TLI.setUnavailable(LibFunc::opendir);
  231. TLI.setUnavailable(LibFunc::pclose);
  232. TLI.setUnavailable(LibFunc::popen);
  233. TLI.setUnavailable(LibFunc::pread);
  234. TLI.setUnavailable(LibFunc::pwrite);
  235. TLI.setUnavailable(LibFunc::read);
  236. TLI.setUnavailable(LibFunc::readlink);
  237. TLI.setUnavailable(LibFunc::realpath);
  238. TLI.setUnavailable(LibFunc::rmdir);
  239. TLI.setUnavailable(LibFunc::setitimer);
  240. TLI.setUnavailable(LibFunc::stat);
  241. TLI.setUnavailable(LibFunc::statvfs);
  242. TLI.setUnavailable(LibFunc::stpcpy);
  243. TLI.setUnavailable(LibFunc::stpncpy);
  244. TLI.setUnavailable(LibFunc::strcasecmp);
  245. TLI.setUnavailable(LibFunc::strncasecmp);
  246. TLI.setUnavailable(LibFunc::times);
  247. TLI.setUnavailable(LibFunc::uname);
  248. TLI.setUnavailable(LibFunc::unlink);
  249. TLI.setUnavailable(LibFunc::unsetenv);
  250. TLI.setUnavailable(LibFunc::utime);
  251. TLI.setUnavailable(LibFunc::utimes);
  252. TLI.setUnavailable(LibFunc::write);
  253. // Win32 does *not* provide provide these functions, but they are
  254. // specified by C99:
  255. TLI.setUnavailable(LibFunc::atoll);
  256. TLI.setUnavailable(LibFunc::frexpf);
  257. TLI.setUnavailable(LibFunc::llabs);
  258. }
  259. switch (T.getOS()) {
  260. case Triple::MacOSX:
  261. // exp10 and exp10f are not available on OS X until 10.9 and iOS until 7.0
  262. // and their names are __exp10 and __exp10f. exp10l is not available on
  263. // OS X or iOS.
  264. TLI.setUnavailable(LibFunc::exp10l);
  265. if (T.isMacOSXVersionLT(10, 9)) {
  266. TLI.setUnavailable(LibFunc::exp10);
  267. TLI.setUnavailable(LibFunc::exp10f);
  268. } else {
  269. TLI.setAvailableWithName(LibFunc::exp10, "__exp10");
  270. TLI.setAvailableWithName(LibFunc::exp10f, "__exp10f");
  271. }
  272. break;
  273. case Triple::IOS:
  274. TLI.setUnavailable(LibFunc::exp10l);
  275. if (T.isOSVersionLT(7, 0)) {
  276. TLI.setUnavailable(LibFunc::exp10);
  277. TLI.setUnavailable(LibFunc::exp10f);
  278. } else {
  279. TLI.setAvailableWithName(LibFunc::exp10, "__exp10");
  280. TLI.setAvailableWithName(LibFunc::exp10f, "__exp10f");
  281. }
  282. break;
  283. case Triple::Linux:
  284. // exp10, exp10f, exp10l is available on Linux (GLIBC) but are extremely
  285. // buggy prior to glibc version 2.18. Until this version is widely deployed
  286. // or we have a reasonable detection strategy, we cannot use exp10 reliably
  287. // on Linux.
  288. //
  289. // Fall through to disable all of them.
  290. default:
  291. TLI.setUnavailable(LibFunc::exp10);
  292. TLI.setUnavailable(LibFunc::exp10f);
  293. TLI.setUnavailable(LibFunc::exp10l);
  294. }
  295. // ffsl is available on at least Darwin, Mac OS X, iOS, FreeBSD, and
  296. // Linux (GLIBC):
  297. // http://developer.apple.com/library/mac/#documentation/Darwin/Reference/ManPages/man3/ffsl.3.html
  298. // http://svn.freebsd.org/base/user/eri/pf45/head/lib/libc/string/ffsl.c
  299. // http://www.gnu.org/software/gnulib/manual/html_node/ffsl.html
  300. switch (T.getOS()) {
  301. case Triple::Darwin:
  302. case Triple::MacOSX:
  303. case Triple::IOS:
  304. case Triple::FreeBSD:
  305. case Triple::Linux:
  306. break;
  307. default:
  308. TLI.setUnavailable(LibFunc::ffsl);
  309. }
  310. // ffsll is available on at least FreeBSD and Linux (GLIBC):
  311. // http://svn.freebsd.org/base/user/eri/pf45/head/lib/libc/string/ffsll.c
  312. // http://www.gnu.org/software/gnulib/manual/html_node/ffsll.html
  313. switch (T.getOS()) {
  314. case Triple::FreeBSD:
  315. case Triple::Linux:
  316. break;
  317. default:
  318. TLI.setUnavailable(LibFunc::ffsll);
  319. }
  320. // The following functions are available on at least Linux:
  321. if (!T.isOSLinux()) {
  322. TLI.setUnavailable(LibFunc::dunder_strdup);
  323. TLI.setUnavailable(LibFunc::dunder_strtok_r);
  324. TLI.setUnavailable(LibFunc::dunder_isoc99_scanf);
  325. TLI.setUnavailable(LibFunc::dunder_isoc99_sscanf);
  326. TLI.setUnavailable(LibFunc::under_IO_getc);
  327. TLI.setUnavailable(LibFunc::under_IO_putc);
  328. TLI.setUnavailable(LibFunc::memalign);
  329. //TLI.setUnavailable(LibFunc::fopen64); // HLSL Change - duplicate 64bit versions
  330. //TLI.setUnavailable(LibFunc::fseeko64); // HLSL Change - duplicate 64bit versions
  331. TLI.setUnavailable(LibFunc::fstat64);
  332. TLI.setUnavailable(LibFunc::fstatvfs64);
  333. //TLI.setUnavailable(LibFunc::ftello64); // HLSL Change - duplicate 64bit versions
  334. TLI.setUnavailable(LibFunc::lstat64);
  335. TLI.setUnavailable(LibFunc::open64);
  336. TLI.setUnavailable(LibFunc::stat64);
  337. TLI.setUnavailable(LibFunc::statvfs64);
  338. //TLI.setUnavailable(LibFunc::tmpfile64); // HLSL Change - duplicate 64bit versions
  339. }
  340. TLI.addVectorizableFunctionsFromVecLib(ClVectorLibrary);
  341. }
  342. TargetLibraryInfoImpl::TargetLibraryInfoImpl() {
  343. // Default to everything being available.
  344. memset(AvailableArray, -1, sizeof(AvailableArray));
  345. initialize(*this, Triple(), StandardNames);
  346. }
  347. TargetLibraryInfoImpl::TargetLibraryInfoImpl(const Triple &T) {
  348. // Default to everything being available.
  349. memset(AvailableArray, -1, sizeof(AvailableArray));
  350. initialize(*this, T, StandardNames);
  351. }
  352. TargetLibraryInfoImpl::TargetLibraryInfoImpl(const TargetLibraryInfoImpl &TLI)
  353. : CustomNames(TLI.CustomNames) {
  354. memcpy(AvailableArray, TLI.AvailableArray, sizeof(AvailableArray));
  355. VectorDescs = TLI.VectorDescs;
  356. ScalarDescs = TLI.ScalarDescs;
  357. }
  358. TargetLibraryInfoImpl::TargetLibraryInfoImpl(TargetLibraryInfoImpl &&TLI)
  359. : CustomNames(std::move(TLI.CustomNames)) {
  360. std::move(std::begin(TLI.AvailableArray), std::end(TLI.AvailableArray),
  361. AvailableArray);
  362. VectorDescs = TLI.VectorDescs;
  363. ScalarDescs = TLI.ScalarDescs;
  364. }
  365. TargetLibraryInfoImpl &TargetLibraryInfoImpl::operator=(const TargetLibraryInfoImpl &TLI) {
  366. CustomNames = TLI.CustomNames;
  367. memcpy(AvailableArray, TLI.AvailableArray, sizeof(AvailableArray));
  368. return *this;
  369. }
  370. TargetLibraryInfoImpl &TargetLibraryInfoImpl::operator=(TargetLibraryInfoImpl &&TLI) {
  371. CustomNames = std::move(TLI.CustomNames);
  372. std::move(std::begin(TLI.AvailableArray), std::end(TLI.AvailableArray),
  373. AvailableArray);
  374. return *this;
  375. }
  376. static StringRef sanitizeFunctionName(StringRef funcName) {
  377. // Filter out empty names and names containing null bytes, those can't be in
  378. // our table.
  379. if (funcName.empty() || funcName.find('\0') != StringRef::npos)
  380. return StringRef();
  381. // Check for \01 prefix that is used to mangle __asm declarations and
  382. // strip it if present.
  383. return GlobalValue::getRealLinkageName(funcName);
  384. }
  385. bool TargetLibraryInfoImpl::getLibFunc(StringRef funcName,
  386. LibFunc::Func &F) const {
  387. const char *const *Start = &StandardNames[0];
  388. const char *const *End = &StandardNames[LibFunc::NumLibFuncs];
  389. funcName = sanitizeFunctionName(funcName);
  390. if (funcName.empty())
  391. return false;
  392. const char *const *I = std::lower_bound(
  393. Start, End, funcName, [](const char *LHS, StringRef RHS) {
  394. return std::strncmp(LHS, RHS.data(), RHS.size()) < 0;
  395. });
  396. if (I != End && *I == funcName) {
  397. F = (LibFunc::Func)(I - Start);
  398. return true;
  399. }
  400. return false;
  401. }
  402. void TargetLibraryInfoImpl::disableAllFunctions() {
  403. memset(AvailableArray, 0, sizeof(AvailableArray));
  404. }
  405. static bool compareByScalarFnName(const VecDesc &LHS, const VecDesc &RHS) {
  406. return std::strncmp(LHS.ScalarFnName, RHS.ScalarFnName,
  407. std::strlen(RHS.ScalarFnName)) < 0;
  408. }
  409. static bool compareByVectorFnName(const VecDesc &LHS, const VecDesc &RHS) {
  410. return std::strncmp(LHS.VectorFnName, RHS.VectorFnName,
  411. std::strlen(RHS.VectorFnName)) < 0;
  412. }
  413. static bool compareWithScalarFnName(const VecDesc &LHS, StringRef S) {
  414. return std::strncmp(LHS.ScalarFnName, S.data(), S.size()) < 0;
  415. }
  416. static bool compareWithVectorFnName(const VecDesc &LHS, StringRef S) {
  417. return std::strncmp(LHS.VectorFnName, S.data(), S.size()) < 0;
  418. }
  419. void TargetLibraryInfoImpl::addVectorizableFunctions(ArrayRef<VecDesc> Fns) {
  420. VectorDescs.insert(VectorDescs.end(), Fns.begin(), Fns.end());
  421. std::sort(VectorDescs.begin(), VectorDescs.end(), compareByScalarFnName);
  422. ScalarDescs.insert(ScalarDescs.end(), Fns.begin(), Fns.end());
  423. std::sort(ScalarDescs.begin(), ScalarDescs.end(), compareByVectorFnName);
  424. }
  425. void TargetLibraryInfoImpl::addVectorizableFunctionsFromVecLib(
  426. enum VectorLibrary VecLib) {
  427. switch (VecLib) {
  428. case Accelerate: {
  429. const VecDesc VecFuncs[] = {
  430. // Floating-Point Arithmetic and Auxiliary Functions
  431. {"ceilf", "vceilf", 4},
  432. {"fabsf", "vfabsf", 4},
  433. {"llvm.fabs.f32", "vfabsf", 4},
  434. {"floorf", "vfloorf", 4},
  435. {"sqrtf", "vsqrtf", 4},
  436. {"llvm.sqrt.f32", "vsqrtf", 4},
  437. // Exponential and Logarithmic Functions
  438. {"expf", "vexpf", 4},
  439. {"llvm.exp.f32", "vexpf", 4},
  440. {"expm1f", "vexpm1f", 4},
  441. {"logf", "vlogf", 4},
  442. {"llvm.log.f32", "vlogf", 4},
  443. {"log1pf", "vlog1pf", 4},
  444. {"log10f", "vlog10f", 4},
  445. {"llvm.log10.f32", "vlog10f", 4},
  446. {"logbf", "vlogbf", 4},
  447. // Trigonometric Functions
  448. {"sinf", "vsinf", 4},
  449. {"llvm.sin.f32", "vsinf", 4},
  450. {"cosf", "vcosf", 4},
  451. {"llvm.cos.f32", "vcosf", 4},
  452. {"tanf", "vtanf", 4},
  453. {"asinf", "vasinf", 4},
  454. {"acosf", "vacosf", 4},
  455. {"atanf", "vatanf", 4},
  456. // Hyperbolic Functions
  457. {"sinhf", "vsinhf", 4},
  458. {"coshf", "vcoshf", 4},
  459. {"tanhf", "vtanhf", 4},
  460. {"asinhf", "vasinhf", 4},
  461. {"acoshf", "vacoshf", 4},
  462. {"atanhf", "vatanhf", 4},
  463. };
  464. addVectorizableFunctions(VecFuncs);
  465. break;
  466. }
  467. case NoLibrary:
  468. break;
  469. }
  470. }
  471. bool TargetLibraryInfoImpl::isFunctionVectorizable(StringRef funcName) const {
  472. funcName = sanitizeFunctionName(funcName);
  473. if (funcName.empty())
  474. return false;
  475. std::vector<VecDesc>::const_iterator I = std::lower_bound(
  476. VectorDescs.begin(), VectorDescs.end(), funcName,
  477. compareWithScalarFnName);
  478. return I != VectorDescs.end() && StringRef(I->ScalarFnName) == funcName;
  479. }
  480. StringRef TargetLibraryInfoImpl::getVectorizedFunction(StringRef F,
  481. unsigned VF) const {
  482. F = sanitizeFunctionName(F);
  483. if (F.empty())
  484. return F;
  485. std::vector<VecDesc>::const_iterator I = std::lower_bound(
  486. VectorDescs.begin(), VectorDescs.end(), F, compareWithScalarFnName);
  487. while (I != VectorDescs.end() && StringRef(I->ScalarFnName) == F) {
  488. if (I->VectorizationFactor == VF)
  489. return I->VectorFnName;
  490. ++I;
  491. }
  492. return StringRef();
  493. }
  494. StringRef TargetLibraryInfoImpl::getScalarizedFunction(StringRef F,
  495. unsigned &VF) const {
  496. F = sanitizeFunctionName(F);
  497. if (F.empty())
  498. return F;
  499. std::vector<VecDesc>::const_iterator I = std::lower_bound(
  500. ScalarDescs.begin(), ScalarDescs.end(), F, compareWithVectorFnName);
  501. if (I == VectorDescs.end() || StringRef(I->VectorFnName) != F)
  502. return StringRef();
  503. VF = I->VectorizationFactor;
  504. return I->ScalarFnName;
  505. }
  506. TargetLibraryInfo TargetLibraryAnalysis::run(Module &M) {
  507. if (PresetInfoImpl)
  508. return TargetLibraryInfo(*PresetInfoImpl);
  509. return TargetLibraryInfo(lookupInfoImpl(Triple(M.getTargetTriple())));
  510. }
  511. TargetLibraryInfo TargetLibraryAnalysis::run(Function &F) {
  512. if (PresetInfoImpl)
  513. return TargetLibraryInfo(*PresetInfoImpl);
  514. return TargetLibraryInfo(
  515. lookupInfoImpl(Triple(F.getParent()->getTargetTriple())));
  516. }
  517. TargetLibraryInfoImpl &TargetLibraryAnalysis::lookupInfoImpl(Triple T) {
  518. std::unique_ptr<TargetLibraryInfoImpl> &Impl =
  519. Impls[T.normalize()];
  520. if (!Impl)
  521. Impl.reset(new TargetLibraryInfoImpl(T));
  522. return *Impl;
  523. }
  524. TargetLibraryInfoWrapperPass::TargetLibraryInfoWrapperPass()
  525. : ImmutablePass(ID), TLIImpl(), TLI(TLIImpl) {
  526. initializeTargetLibraryInfoWrapperPassPass(*PassRegistry::getPassRegistry());
  527. }
  528. TargetLibraryInfoWrapperPass::TargetLibraryInfoWrapperPass(const Triple &T)
  529. : ImmutablePass(ID), TLIImpl(T), TLI(TLIImpl) {
  530. initializeTargetLibraryInfoWrapperPassPass(*PassRegistry::getPassRegistry());
  531. }
  532. TargetLibraryInfoWrapperPass::TargetLibraryInfoWrapperPass(
  533. const TargetLibraryInfoImpl &TLIImpl)
  534. : ImmutablePass(ID), TLIImpl(TLIImpl), TLI(this->TLIImpl) {
  535. initializeTargetLibraryInfoWrapperPassPass(*PassRegistry::getPassRegistry());
  536. }
  537. char TargetLibraryAnalysis::PassID;
  538. // Register the basic pass.
  539. INITIALIZE_PASS(TargetLibraryInfoWrapperPass, "targetlibinfo",
  540. "Target Library Information", false, true)
  541. char TargetLibraryInfoWrapperPass::ID = 0;
  542. void TargetLibraryInfoWrapperPass::anchor() {}