/******************************************************************************* * * MIT License * * Copyright 2025 AMD ROCm(TM) Software * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * in the Software without restriction, including without limitation the rights * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. * *******************************************************************************/ #pragma once #include namespace rocRoller { namespace KernelGraph { namespace RemapOutputTilesDetail { /** * @brief Workgroup count/size information. */ struct TileSizeInfo { /** * @brief MacroTileNumber size expressions for each dimension. * * The size of dangling MacroTileNumber coordinates. */ std::array sizes; /** * @brief Map from {dim, direction} pairs to set of * disconnected (dangling) MacroTileNumber * coordinates. */ std::map, std::unordered_set> danglers; /** * @brief Record the size of a tile. */ void recordSize(int dim, int tileNumTag, auto direction, auto expr); }; /** * @brief New dimensions created by workgroup mapping */ struct RemappedDimensions { RemappedDimensions(int total, int parallel, int perpendicular) : totalTiles(total) , parallelDim(parallel) , perpendicularDim(perpendicular) { } /** * @brief The total number of output tiles */ int totalTiles; /** * @brief Remapped dimension parallel to the workgroup mapping dimension */ int parallelDim; /** * @brief Remapped dimension perpendicular to the workgroup mapping dimension */ int perpendicularDim; }; /** * @brief Query the graph and return TileSizeInfo. */ TileSizeInfo getTileSizeInfo(KernelGraph const& kgraph); /** * @brief Return number of active dimensions (one, two, or three). */ int workgroupDimensions(TileSizeInfo const& info); /** * @brief Return total number of workgroups (product of sizes). * * This matches the number of workgroups required for launch. */ Expression::ExpressionPtr totalNumberOfWorkgroups(TileSizeInfo const& info); /** * @brief Connect dangling MacroTileNumber coordinate to * matching Workgroup coordinates. * * Performs Workgroup Mapping (via workgroupMapping). */ void connectWorkgroupsWithMapping(TileSizeInfo const& info, rocRoller::KernelGraph::KernelGraph& graph, int dimension, Expression::ExpressionPtr size); /** * @brief Apply Workgroup Mapping. * * Map workgroups to tiles in a Z-order-inspired blockwise manner where * the blocks are divided/bounded by `size` along `dimension` (M=0 or N=1). * The returned values are a dimension representing total number of tiles, * and the M/N dimensions after mapping. * * See shared/rocroller/docs/src/WorkgroupMapping.rst for more information. */ RemappedDimensions workgroupMapping(TileSizeInfo const& info, rocRoller::KernelGraph::KernelGraph& graph, rocRoller::Graph::Direction direction, uint dimension, Expression::ExpressionPtr size); } } }