diff options
| author | Matt Masten <matt.masten@intel.com> | 2016-07-29 16:42:44 +0000 |
|---|---|---|
| committer | Matt Masten <matt.masten@intel.com> | 2016-07-29 16:42:44 +0000 |
| commit | a6669a1e056be6ec4feb06d8c3c796f435e8926d (patch) | |
| tree | f8d0b451982addba50ff67bc0b79c97ca655dd05 /llvm/lib/Analysis | |
| parent | 9e69450ec7a403b0e61110b7e235caa85984cda5 (diff) | |
| download | bcm5719-llvm-a6669a1e056be6ec4feb06d8c3c796f435e8926d.tar.gz bcm5719-llvm-a6669a1e056be6ec4feb06d8c3c796f435e8926d.zip | |
Initial support for vectorization using svml (short vector math library).
Differential Revision: https://reviews.llvm.org/D19544
llvm-svn: 277166
Diffstat (limited to 'llvm/lib/Analysis')
| -rw-r--r-- | llvm/lib/Analysis/TargetLibraryInfo.cpp | 72 |
1 file changed, 71 insertions, 1 deletion
```diff
diff --git a/llvm/lib/Analysis/TargetLibraryInfo.cpp b/llvm/lib/Analysis/TargetLibraryInfo.cpp
index c3e4786deae..bd5cd2c91b1 100644
--- a/llvm/lib/Analysis/TargetLibraryInfo.cpp
+++ b/llvm/lib/Analysis/TargetLibraryInfo.cpp
@@ -23,9 +23,10 @@ static cl::opt<TargetLibraryInfoImpl::VectorLibrary> ClVectorLibrary(
                           "No vector functions library"),
                clEnumValN(TargetLibraryInfoImpl::Accelerate, "Accelerate",
                           "Accelerate framework"),
+               clEnumValN(TargetLibraryInfoImpl::SVML, "SVML",
+                          "Intel SVML library"),
                clEnumValEnd));
 
-
 const char *const TargetLibraryInfoImpl::StandardNames[LibFunc::NumLibFuncs] = {
 #define TLI_DEFINE_STRING
 #include "llvm/Analysis/TargetLibraryInfo.def"
@@ -1075,6 +1076,75 @@ void TargetLibraryInfoImpl::addVectorizableFunctionsFromVecLib(
     addVectorizableFunctions(VecFuncs);
     break;
   }
+  case SVML: {
+    const VecDesc VecFuncs[] = {
+        {"sin", "__svml_sin2", 2},
+        {"sin", "__svml_sin4", 4},
+        {"sin", "__svml_sin8", 8},
+
+        {"sinf", "__svml_sinf4", 4},
+        {"sinf", "__svml_sinf8", 8},
+        {"sinf", "__svml_sinf16", 16},
+
+        {"cos", "__svml_cos2", 2},
+        {"cos", "__svml_cos4", 4},
+        {"cos", "__svml_cos8", 8},
+
+        {"cosf", "__svml_cosf4", 4},
+        {"cosf", "__svml_cosf8", 8},
+        {"cosf", "__svml_cosf16", 16},
+
+        {"pow", "__svml_pow2", 2},
+        {"pow", "__svml_pow4", 4},
+        {"pow", "__svml_pow8", 8},
+
+        {"powf", "__svml_powf4", 4},
+        {"powf", "__svml_powf8", 8},
+        {"powf", "__svml_powf16", 16},
+
+        {"llvm.pow.f64", "__svml_pow2", 2},
+        {"llvm.pow.f64", "__svml_pow4", 4},
+        {"llvm.pow.f64", "__svml_pow8", 8},
+
+        {"llvm.pow.f32", "__svml_powf4", 4},
+        {"llvm.pow.f32", "__svml_powf8", 8},
+        {"llvm.pow.f32", "__svml_powf16", 16},
+
+        {"exp", "__svml_exp2", 2},
+        {"exp", "__svml_exp4", 4},
+        {"exp", "__svml_exp8", 8},
+
+        {"expf", "__svml_expf4", 4},
+        {"expf", "__svml_expf8", 8},
+        {"expf", "__svml_expf16", 16},
+
+        {"llvm.exp.f64", "__svml_exp2", 2},
+        {"llvm.exp.f64", "__svml_exp4", 4},
+        {"llvm.exp.f64", "__svml_exp8", 8},
+
+        {"llvm.exp.f32", "__svml_expf4", 4},
+        {"llvm.exp.f32", "__svml_expf8", 8},
+        {"llvm.exp.f32", "__svml_expf16", 16},
+
+        {"log", "__svml_log2", 2},
+        {"log", "__svml_log4", 4},
+        {"log", "__svml_log8", 8},
+
+        {"logf", "__svml_logf4", 4},
+        {"logf", "__svml_logf8", 8},
+        {"logf", "__svml_logf16", 16},
+
+        {"llvm.log.f64", "__svml_log2", 2},
+        {"llvm.log.f64", "__svml_log4", 4},
+        {"llvm.log.f64", "__svml_log8", 8},
+
+        {"llvm.log.f32", "__svml_logf4", 4},
+        {"llvm.log.f32", "__svml_logf8", 8},
+        {"llvm.log.f32", "__svml_logf16", 16},
+    };
+    addVectorizableFunctions(VecFuncs);
+    break;
+  }
   case NoLibrary:
     break;
   }
```

