diff options
Diffstat (limited to 'polly/lib/Transform/ScheduleOptimizer.cpp')
-rw-r--r-- | polly/lib/Transform/ScheduleOptimizer.cpp | 7 |
1 files changed, 4 insertions, 3 deletions
diff --git a/polly/lib/Transform/ScheduleOptimizer.cpp b/polly/lib/Transform/ScheduleOptimizer.cpp index 230317869f7..c64f836b4c0 100644 --- a/polly/lib/Transform/ScheduleOptimizer.cpp +++ b/polly/lib/Transform/ScheduleOptimizer.cpp @@ -910,9 +910,10 @@ getMicroKernelParams(const TargetTransformInfo *TTI, MatMulInfoTy MMI) { auto Nvec = RegisterBitwidth / ElementSize; if (Nvec == 0) Nvec = 2; - int Nr = - ceil(sqrt(Nvec * LatencyVectorFma * ThroughputVectorFma) / Nvec) * Nvec; - int Mr = ceil(Nvec * LatencyVectorFma * ThroughputVectorFma / Nr); + int Nr = ceil(sqrt((double)(Nvec * LatencyVectorFma * ThroughputVectorFma)) / + Nvec) * + Nvec; + int Mr = ceil((double)(Nvec * LatencyVectorFma * ThroughputVectorFma / Nr)); return {Mr, Nr}; } |