summaryrefslogtreecommitdiffstats
path: root/polly/lib/Transform/FlattenAlgo.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'polly/lib/Transform/FlattenAlgo.cpp')
-rw-r--r--polly/lib/Transform/FlattenAlgo.cpp417
1 files changed, 417 insertions, 0 deletions
diff --git a/polly/lib/Transform/FlattenAlgo.cpp b/polly/lib/Transform/FlattenAlgo.cpp
new file mode 100644
index 00000000000..bd1ce4d24ee
--- /dev/null
+++ b/polly/lib/Transform/FlattenAlgo.cpp
@@ -0,0 +1,417 @@
+//===------ FlattenAlgo.cpp ------------------------------------*- C++ -*-===//
+//
+// The LLVM Compiler Infrastructure
+//
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
+//
+//===----------------------------------------------------------------------===//
+//
+// Main algorithm of the FlattenSchedulePass. This is a separate file to avoid
+// the unittest for this requiring linking against LLVM.
+//
+//===----------------------------------------------------------------------===//
+
+#include "polly/FlattenAlgo.h"
+#include "llvm/Support/Debug.h"
+#define DEBUG_TYPE "polly-flatten-algo"
+
+using namespace polly;
+using namespace llvm;
+
+namespace {
+
+/// Whether a dimension of a set is bounded (lower and upper) by a constant,
+/// i.e. there are two constants Min and Max, such that every value x of the
+/// chosen dimensions is Min <= x <= Max.
+bool isDimBoundedByConstant(IslPtr<isl_set> Set, unsigned dim) {
+ auto ParamDims = isl_set_dim(Set.keep(), isl_dim_param);
+ Set = give(isl_set_project_out(Set.take(), isl_dim_param, 0, ParamDims));
+ Set = give(isl_set_project_out(Set.take(), isl_dim_set, 0, dim));
+ auto SetDims = isl_set_dim(Set.keep(), isl_dim_set);
+ Set = give(isl_set_project_out(Set.take(), isl_dim_set, 1, SetDims - 1));
+ return isl_set_is_bounded(Set.keep());
+}
+
+/// Whether a dimension of a set is (lower and upper) bounded by a constant or
+/// parameters, i.e. there are two expressions Min_p and Max_p of the parameters
+/// p, such that every value x of the chosen dimensions is
+/// Min_p <= x <= Max_p.
+bool isDimBoundedByParameter(IslPtr<isl_set> Set, unsigned dim) {
+ Set = give(isl_set_project_out(Set.take(), isl_dim_set, 0, dim));
+ auto SetDims = isl_set_dim(Set.keep(), isl_dim_set);
+ Set = give(isl_set_project_out(Set.take(), isl_dim_set, 1, SetDims - 1));
+ return isl_set_is_bounded(Set.keep());
+}
+
+/// Whether BMap's first out-dimension is not a constant.
+bool isVariableDim(NonowningIslPtr<isl_basic_map> BMap) {
+ auto FixedVal =
+ give(isl_basic_map_plain_get_val_if_fixed(BMap.keep(), isl_dim_out, 0));
+ return !FixedVal || isl_val_is_nan(FixedVal.keep());
+}
+
+/// Whether Map's first out dimension is no constant nor piecewise constant.
+bool isVariableDim(NonowningIslPtr<isl_map> Map) {
+ return foreachEltWithBreak(Map, [](IslPtr<isl_basic_map> BMap) -> isl_stat {
+ if (isVariableDim(BMap))
+ return isl_stat_error;
+ return isl_stat_ok;
+ });
+}
+
+/// Whether UMap's first out dimension is no (piecewise) constant.
+bool isVariableDim(NonowningIslPtr<isl_union_map> UMap) {
+ return foreachEltWithBreak(UMap, [](IslPtr<isl_map> Map) -> isl_stat {
+ if (isVariableDim(Map))
+ return isl_stat_error;
+ return isl_stat_ok;
+ });
+}
+
+/// If @p PwAff maps to a constant, return said constant. If @p Max/@p Min, it
+/// can also be a piecewise constant and it would return the minimum/maximum
+/// value. Otherwise, return NaN.
+IslPtr<isl_val> getConstant(IslPtr<isl_pw_aff> PwAff, bool Max, bool Min) {
+ assert(!Max || !Min);
+ IslPtr<isl_val> Result;
+ foreachPieceWithBreak(
+ PwAff, [=, &Result](IslPtr<isl_set> Set, IslPtr<isl_aff> Aff) {
+ if (Result && isl_val_is_nan(Result.keep()))
+ return isl_stat_ok;
+
+ // TODO: If Min/Max, we can also determine a minimum/maximum value if
+ // Set is constant-bounded.
+ if (!isl_aff_is_cst(Aff.keep())) {
+ Result = give(isl_val_nan(Aff.getCtx()));
+ return isl_stat_error;
+ }
+
+ auto ThisVal = give(isl_aff_get_constant_val(Aff.keep()));
+ if (!Result) {
+ Result = ThisVal;
+ return isl_stat_ok;
+ }
+
+ if (isl_val_eq(Result.keep(), ThisVal.keep()))
+ return isl_stat_ok;
+
+ if (Max && isl_val_gt(ThisVal.keep(), Result.keep())) {
+ Result = ThisVal;
+ return isl_stat_ok;
+ }
+
+ if (Min && isl_val_lt(ThisVal.keep(), Result.keep())) {
+ Result = ThisVal;
+ return isl_stat_ok;
+ }
+
+ // Not compatible
+ Result = give(isl_val_nan(Aff.getCtx()));
+ return isl_stat_error;
+ });
+ return Result;
+}
+
+/// Compute @p UPwAff - @p Val.
+IslPtr<isl_union_pw_aff> subtract(IslPtr<isl_union_pw_aff> UPwAff,
+ IslPtr<isl_val> Val) {
+ if (isl_val_is_zero(Val.keep()))
+ return UPwAff;
+
+ auto Result =
+ give(isl_union_pw_aff_empty(isl_union_pw_aff_get_space(UPwAff.keep())));
+ foreachElt(UPwAff, [=, &Result](IslPtr<isl_pw_aff> PwAff) {
+ auto ValAff = give(isl_pw_aff_val_on_domain(
+ isl_set_universe(isl_space_domain(isl_pw_aff_get_space(PwAff.keep()))),
+ Val.copy()));
+ auto Subtracted = give(isl_pw_aff_sub(PwAff.copy(), ValAff.take()));
+ Result = give(isl_union_pw_aff_union_add(
+ Result.take(), isl_union_pw_aff_from_pw_aff(Subtracted.take())));
+ });
+ return Result;
+}
+
+/// Compute @UPwAff * @p Val.
+IslPtr<isl_union_pw_aff> multiply(IslPtr<isl_union_pw_aff> UPwAff,
+ IslPtr<isl_val> Val) {
+ if (isl_val_is_one(Val.keep()))
+ return UPwAff;
+
+ auto Result =
+ give(isl_union_pw_aff_empty(isl_union_pw_aff_get_space(UPwAff.keep())));
+ foreachElt(UPwAff, [=, &Result](IslPtr<isl_pw_aff> PwAff) {
+ auto ValAff = give(isl_pw_aff_val_on_domain(
+ isl_set_universe(isl_space_domain(isl_pw_aff_get_space(PwAff.keep()))),
+ Val.copy()));
+ auto Multiplied = give(isl_pw_aff_mul(PwAff.copy(), ValAff.take()));
+ Result = give(isl_union_pw_aff_union_add(
+ Result.take(), isl_union_pw_aff_from_pw_aff(Multiplied.take())));
+ });
+ return Result;
+}
+
+/// Remove @p n dimensions from @p UMap's range, starting at @p first.
+///
+/// It is assumed that all maps in the maps have at least the necessary number
+/// of out dimensions.
+IslPtr<isl_union_map> scheduleProjectOut(NonowningIslPtr<isl_union_map> UMap,
+ unsigned first, unsigned n) {
+ if (n == 0)
+ return UMap; /* isl_map_project_out would also reset the tuple, which should
+ have no effect on schedule ranges */
+
+ auto Result = give(isl_union_map_empty(isl_union_map_get_space(UMap.keep())));
+ foreachElt(UMap, [=, &Result](IslPtr<isl_map> Map) {
+ auto Outprojected =
+ give(isl_map_project_out(Map.take(), isl_dim_out, first, n));
+ Result = give(isl_union_map_add_map(Result.take(), Outprojected.take()));
+ });
+ return Result;
+}
+
+/// Return the number of dimensions in the input map's range.
+///
+/// Because this function takes an isl_union_map, the out dimensions could be
+/// different. We return the maximum number in this case. However, a different
+/// number of dimensions is not supported by the other code in this file.
+size_t scheduleScatterDims(NonowningIslPtr<isl_union_map> Schedule) {
+ unsigned Dims = 0;
+ foreachElt(Schedule, [&Dims](IslPtr<isl_map> Map) {
+ Dims = std::max(Dims, isl_map_dim(Map.keep(), isl_dim_out));
+ });
+ return Dims;
+}
+
+/// Return the @p pos' range dimension, converted to an isl_union_pw_aff.
+IslPtr<isl_union_pw_aff> scheduleExtractDimAff(IslPtr<isl_union_map> UMap,
+ unsigned pos) {
+ auto SingleUMap =
+ give(isl_union_map_empty(isl_union_map_get_space(UMap.keep())));
+ foreachElt(UMap, [=, &SingleUMap](IslPtr<isl_map> Map) {
+ auto MapDims = isl_map_dim(Map.keep(), isl_dim_out);
+ auto SingleMap = give(isl_map_project_out(Map.take(), isl_dim_out, 0, pos));
+ SingleMap = give(isl_map_project_out(SingleMap.take(), isl_dim_out, 1,
+ MapDims - pos - 1));
+ SingleUMap =
+ give(isl_union_map_add_map(SingleUMap.take(), SingleMap.take()));
+ });
+
+ auto UAff = give(isl_union_pw_multi_aff_from_union_map(SingleUMap.take()));
+ auto FirstMAff =
+ give(isl_multi_union_pw_aff_from_union_pw_multi_aff(UAff.take()));
+ return give(isl_multi_union_pw_aff_get_union_pw_aff(FirstMAff.keep(), 0));
+}
+
+/// Flatten a sequence-like first dimension.
+///
+/// A sequence-like scatter dimension is constant, or at least only small
+/// variation, typically the result of ordering a sequence of different
+/// statements. An example would be:
+/// { Stmt_A[] -> [0, X, ...]; Stmt_B[] -> [1, Y, ...] }
+/// to schedule all instances of Stmt_A before any instance of Stmt_B.
+///
+/// To flatten, first begin with an offset of zero. Then determine the lowest
+/// possible value of the dimension, call it "i" [In the example we start at 0].
+/// Considering only schedules with that value, consider only instances with
+/// that value and determine the extent of the next dimension. Let l_X(i) and
+/// u_X(i) its minimum (lower bound) and maximum (upper bound) value. Add them
+/// as "Offset + X - l_X(i)" to the new schedule, then add "u_X(i) - l_X(i) + 1"
+/// to Offset and remove all i-instances from the old schedule. Repeat with the
+/// remaining lowest value i' until there are no instances in the old schedule
+/// left.
+/// The example schedule would be transformed to:
+/// { Stmt_X[] -> [X - l_X, ...]; Stmt_B -> [l_X - u_X + 1 + Y - l_Y, ...] }
+IslPtr<isl_union_map> tryFlattenSequence(IslPtr<isl_union_map> Schedule) {
+ auto IslCtx = Schedule.getCtx();
+ auto ScatterSet =
+ give(isl_set_from_union_set(isl_union_map_range(Schedule.copy())));
+
+ auto ParamSpace = give(isl_union_map_get_space(Schedule.keep()));
+ auto Dims = isl_set_dim(ScatterSet.keep(), isl_dim_set);
+ assert(Dims >= 2);
+
+ // Would cause an infinite loop.
+ if (!isDimBoundedByConstant(ScatterSet, 0)) {
+ DEBUG(dbgs() << "Abort; dimension is not of fixed size\n");
+ return nullptr;
+ }
+
+ auto AllDomains = give(isl_union_map_domain(Schedule.copy()));
+ auto AllDomainsToNull =
+ give(isl_union_pw_multi_aff_from_domain(AllDomains.take()));
+
+ auto NewSchedule = give(isl_union_map_empty(ParamSpace.copy()));
+ auto Counter = give(isl_pw_aff_zero_on_domain(isl_local_space_from_space(
+ isl_space_set_from_params(ParamSpace.copy()))));
+
+ while (!isl_set_is_empty(ScatterSet.keep())) {
+ DEBUG(dbgs() << "Next counter:\n " << Counter << "\n");
+ DEBUG(dbgs() << "Remaining scatter set:\n " << ScatterSet << "\n");
+ auto ThisSet =
+ give(isl_set_project_out(ScatterSet.copy(), isl_dim_set, 1, Dims - 1));
+ auto ThisFirst = give(isl_set_lexmin(ThisSet.take()));
+ auto ScatterFirst =
+ give(isl_set_add_dims(ThisFirst.take(), isl_dim_set, Dims - 1));
+
+ auto SubSchedule = give(isl_union_map_intersect_range(
+ Schedule.copy(), isl_union_set_from_set(ScatterFirst.copy())));
+ SubSchedule = scheduleProjectOut(std::move(SubSchedule), 0, 1);
+ SubSchedule = flattenSchedule(std::move(SubSchedule));
+
+ auto SubDims = scheduleScatterDims(SubSchedule);
+ auto FirstSubSchedule = scheduleProjectOut(SubSchedule, 1, SubDims - 1);
+ auto FirstScheduleAff = scheduleExtractDimAff(FirstSubSchedule, 0);
+ auto RemainingSubSchedule =
+ scheduleProjectOut(std::move(SubSchedule), 0, 1);
+
+ auto FirstSubScatter = give(
+ isl_set_from_union_set(isl_union_map_range(FirstSubSchedule.take())));
+ DEBUG(dbgs() << "Next step in sequence is:\n " << FirstSubScatter << "\n");
+
+ if (!isDimBoundedByParameter(FirstSubScatter, 0)) {
+ DEBUG(dbgs() << "Abort; sequence step is not bounded\n");
+ return nullptr;
+ }
+
+ auto FirstSubScatterMap = give(isl_map_from_range(FirstSubScatter.take()));
+
+ // isl_set_dim_max returns a strange isl_pw_aff with domain tuple_id of
+ // 'none'. It doesn't match with any space including a 0-dimensional
+ // anonymous tuple.
+ // Interesting, one can create such a set using
+ // isl_set_universe(ParamSpace). Bug?
+ auto PartMin = give(isl_map_dim_min(FirstSubScatterMap.copy(), 0));
+ auto PartMax = give(isl_map_dim_max(FirstSubScatterMap.take(), 0));
+ auto One = give(isl_pw_aff_val_on_domain(
+ isl_set_universe(isl_space_set_from_params(ParamSpace.copy())),
+ isl_val_one(IslCtx)));
+ auto PartLen = give(isl_pw_aff_add(
+ isl_pw_aff_add(PartMax.take(), isl_pw_aff_neg(PartMin.copy())),
+ One.take()));
+
+ auto AllPartMin = give(isl_union_pw_aff_pullback_union_pw_multi_aff(
+ isl_union_pw_aff_from_pw_aff(PartMin.take()), AllDomainsToNull.copy()));
+ auto FirstScheduleAffNormalized =
+ give(isl_union_pw_aff_sub(FirstScheduleAff.take(), AllPartMin.take()));
+ auto AllCounter = give(isl_union_pw_aff_pullback_union_pw_multi_aff(
+ isl_union_pw_aff_from_pw_aff(Counter.copy()), AllDomainsToNull.copy()));
+ auto FirstScheduleAffWithOffset = give(isl_union_pw_aff_add(
+ FirstScheduleAffNormalized.take(), AllCounter.take()));
+
+ auto ScheduleWithOffset = give(isl_union_map_flat_range_product(
+ isl_union_map_from_union_pw_aff(FirstScheduleAffWithOffset.take()),
+ RemainingSubSchedule.take()));
+ NewSchedule = give(
+ isl_union_map_union(NewSchedule.take(), ScheduleWithOffset.take()));
+
+ ScatterSet = give(isl_set_subtract(ScatterSet.take(), ScatterFirst.take()));
+ Counter = give(isl_pw_aff_add(Counter.take(), PartLen.take()));
+ }
+
+ DEBUG(dbgs() << "Sequence-flatten result is:\n " << NewSchedule << "\n");
+ return NewSchedule;
+}
+
+/// Flatten a loop-like first dimension.
+///
+/// A loop-like dimension is one that depends on a variable (usually a loop's
+/// induction variable). Let the input schedule look like this:
+/// { Stmt[i] -> [i, X, ...] }
+///
+/// To flatten, we determine the largest extent of X which may not depend on the
+/// actual value of i. Let l_X() the smallest possible value of X and u_X() its
+/// largest value. Then, construct a new schedule
+/// { Stmt[i] -> [i * (u_X() - l_X() + 1), ...] }
+IslPtr<isl_union_map> tryFlattenLoop(IslPtr<isl_union_map> Schedule) {
+ assert(scheduleScatterDims(Schedule) >= 2);
+
+ auto Remaining = scheduleProjectOut(Schedule, 0, 1);
+ auto SubSchedule = flattenSchedule(Remaining);
+ auto SubDims = scheduleScatterDims(SubSchedule);
+
+ auto SubExtent =
+ give(isl_set_from_union_set(isl_union_map_range(SubSchedule.copy())));
+ auto SubExtentDims = isl_set_dim(SubExtent.keep(), isl_dim_param);
+ SubExtent = give(
+ isl_set_project_out(SubExtent.take(), isl_dim_param, 0, SubExtentDims));
+ SubExtent =
+ give(isl_set_project_out(SubExtent.take(), isl_dim_set, 1, SubDims - 1));
+
+ if (!isDimBoundedByConstant(SubExtent, 0)) {
+ DEBUG(dbgs() << "Abort; dimension not bounded by constant\n");
+ return nullptr;
+ }
+
+ auto Min = give(isl_set_dim_min(SubExtent.copy(), 0));
+ DEBUG(dbgs() << "Min bound:\n " << Min << "\n");
+ auto MinVal = getConstant(Min, false, true);
+ auto Max = give(isl_set_dim_max(SubExtent.take(), 0));
+ DEBUG(dbgs() << "Max bound:\n " << Max << "\n");
+ auto MaxVal = getConstant(Max, true, false);
+
+ if (!MinVal || !MaxVal || isl_val_is_nan(MinVal.keep()) ||
+ isl_val_is_nan(MaxVal.keep())) {
+ DEBUG(dbgs() << "Abort; dimension bounds could not be determined\n");
+ return nullptr;
+ }
+
+ auto FirstSubScheduleAff = scheduleExtractDimAff(SubSchedule, 0);
+ auto RemainingSubSchedule = scheduleProjectOut(std::move(SubSchedule), 0, 1);
+
+ auto LenVal =
+ give(isl_val_add_ui(isl_val_sub(MaxVal.take(), MinVal.copy()), 1));
+ auto FirstSubScheduleNormalized = subtract(FirstSubScheduleAff, MinVal);
+
+ // TODO: Normalize FirstAff to zero (convert to isl_map, determine minimum,
+ // subtract it)
+ auto FirstAff = scheduleExtractDimAff(Schedule, 0);
+ auto Offset = multiply(FirstAff, LenVal);
+ auto Index = give(
+ isl_union_pw_aff_add(FirstSubScheduleNormalized.take(), Offset.take()));
+ auto IndexMap = give(isl_union_map_from_union_pw_aff(Index.take()));
+
+ auto Result = give(isl_union_map_flat_range_product(
+ IndexMap.take(), RemainingSubSchedule.take()));
+ DEBUG(dbgs() << "Loop-flatten result is:\n " << Result << "\n");
+ return Result;
+}
+} // anonymous namespace
+
+IslPtr<isl_union_map> polly::flattenSchedule(IslPtr<isl_union_map> Schedule) {
+ auto Dims = scheduleScatterDims(Schedule);
+ DEBUG(dbgs() << "Recursive schedule to process:\n " << Schedule << "\n");
+
+ // Base case; no dimensions left
+ if (Dims == 0) {
+ // TODO: Add one dimension?
+ return Schedule;
+ }
+
+ // Base case; already one-dimensional
+ if (Dims == 1)
+ return Schedule;
+
+ // Fixed dimension; no need to preserve variabledness.
+ if (!isVariableDim(Schedule)) {
+ DEBUG(dbgs() << "Fixed dimension; try sequence flattening\n");
+ auto NewScheduleSequence = tryFlattenSequence(Schedule);
+ if (NewScheduleSequence)
+ return NewScheduleSequence;
+ }
+
+ // Constant stride
+ DEBUG(dbgs() << "Try loop flattening\n");
+ auto NewScheduleLoop = tryFlattenLoop(Schedule);
+ if (NewScheduleLoop)
+ return NewScheduleLoop;
+
+ // Try again without loop condition (may blow up the number of pieces!!)
+ DEBUG(dbgs() << "Try sequence flattening again\n");
+ auto NewScheduleSequence = tryFlattenSequence(Schedule);
+ if (NewScheduleSequence)
+ return NewScheduleSequence;
+
+ // Cannot flatten
+ return Schedule;
+}
OpenPOWER on IntegriCloud