Skip to content

Commit

Permalink
Merge branch 'main' into vroubtsov/issue-533
Browse files Browse the repository at this point in the history
  • Loading branch information
vroubtsovTT authored Dec 1, 2024
2 parents 249948c + 99331c7 commit 4849981
Show file tree
Hide file tree
Showing 31 changed files with 1,639 additions and 449 deletions.
13 changes: 8 additions & 5 deletions .github/workflows/build-and-test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -47,8 +47,9 @@ jobs:
fail-fast: false
matrix:
build: [
{runs-on: ubuntu-latest, enable_perf: OFF, name: "run", ttrt_flags: ""},
{runs-on: ubuntu-latest, enable_perf: ON, name: "perf", ttrt_flags: ""},
{runs-on: ubuntu-latest, enable_perf: OFF, enable_op_model: OFF, name: "run", ttrt_flags: ""},
{runs-on: ubuntu-latest, enable_perf: ON, enable_op_model: OFF, name: "perf", ttrt_flags: ""},
{runs-on: ubuntu-latest, enable_perf: OFF, enable_op_model: ON, name: "op_model" , ttrt_flags: ""}
]

name: Build tt-mlir
Expand Down Expand Up @@ -78,7 +79,7 @@ jobs:
uses: hendrikmuhs/[email protected]
with:
create-symlink: true
key: ${{ matrix.build.runs-on }}-run-ON-perf-${{ matrix.build.enable_perf }}-${{ env.SDK_VERSION }}
key: ${{ matrix.build.runs-on }}-run-ON-perf-${{ matrix.build.enable_perf }}-op_model-${{ matrix.build.enable_op_model }}-${{ env.SDK_VERSION }}

# Build project

Expand All @@ -97,6 +98,7 @@ jobs:
-DTTMLIR_ENABLE_RUNTIME_TESTS=ON \
-DTT_RUNTIME_ENABLE_PERF_TRACE=${{ matrix.build.enable_perf }} \
-DTTMLIR_ENABLE_STABLEHLO=ON \
-DTTMLIR_ENABLE_OP_MODEL=${{ matrix.build.enable_op_model }} \
-S ${{ steps.strings.outputs.work-dir }}
- name: Build
Expand Down Expand Up @@ -147,7 +149,7 @@ jobs:
- name: Upload Test Report
uses: actions/upload-artifact@v4
with:
name: test-reports-${{ matrix.build.runs-on }}-perf-${{ matrix.build.enable_perf }}
name: test-reports-${{ matrix.build.runs-on }}-perf-${{ matrix.build.enable_perf }}-op_model-${{ matrix.build.enable_op_model }}
path: build/test/report.xml

- name: Show Test Report
Expand Down Expand Up @@ -480,7 +482,7 @@ jobs:
uses: hendrikmuhs/[email protected]
with:
create-symlink: true
key: ${{ matrix.build.runs-on }}-run-ON-perf-${{ matrix.build.enable_perf }}-${{ env.SDK_VERSION }}
key: ${{ matrix.build.runs-on }}-run-ON-perf-${{ matrix.build.enable_perf }}-op_model-${{ matrix.build.enable_op_model }}-${{ env.SDK_VERSION }}

- name: Configure CMake
shell: bash
Expand All @@ -496,6 +498,7 @@ jobs:
-DTTMLIR_ENABLE_RUNTIME_TESTS=OFF \
-DTT_RUNTIME_ENABLE_PERF_TRACE=${{ matrix.build.enable_perf }} \
-DTTMLIR_ENABLE_STABLEHLO=OFF \
-DTTMLIR_ENABLE_OP_MODEL=${{ matrix.build.enable_op_model }} \
-S ${{ steps.strings.outputs.work-dir }}
- name: Build tt-explorer
Expand Down
13 changes: 8 additions & 5 deletions .github/workflows/nightly-uplift.yml
Original file line number Diff line number Diff line change
Expand Up @@ -62,8 +62,11 @@ jobs:
echo "Pull Request URL - ${{ steps.create-pr.outputs.pull-request-url }}"
gh pr review ${{ steps.create-pr.outputs.pull-request-number }} --approve
- name: Enable Pull Request Automerge
if: ${{ steps.create-pr.outputs.pull-request-number }}
run: gh pr merge --squash --auto "${{ steps.create-pr.outputs.pull-request-number }}"
env:
GH_TOKEN: ${{ secrets.GH_TOKEN }}
# Note: Dissable auto-merge for now until we are more confident
# that uplift won't break the downstream projects
#
# - name: Enable Pull Request Automerge
# if: ${{ steps.create-pr.outputs.pull-request-number }}
# run: gh pr merge --squash --auto "${{ steps.create-pr.outputs.pull-request-number }}"
# env:
# GH_TOKEN: ${{ secrets.GH_TOKEN }}
6 changes: 6 additions & 0 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ endif()
option(TT_RUNTIME_ENABLE_PERF_TRACE "Enable performance mode" OFF)
option(TTMLIR_ENABLE_RUNTIME "Enable runtime" OFF)
option(TTMLIR_ENABLE_STABLEHLO "Enable StableHLO support" OFF)
option(TTMLIR_ENABLE_OP_MODEL "Enable OpModel support" OFF)

if (TTMLIR_ENABLE_STABLEHLO)
add_compile_definitions(TTMLIR_ENABLE_STABLEHLO)
Expand All @@ -20,6 +21,11 @@ set(CMAKE_EXPORT_COMPILE_COMMANDS ON)

set(TTMLIR_ENABLE_BINDINGS_PYTHON ON CACHE BOOL "Enable Python bindings")

if (APPLE)
set(TTMLIR_ENABLE_OP_MODEL OFF)
message(WARNING "TTNNOpModelLib is disabled on Apple platforms. Optimizer will not get true performance.")
endif()

list(APPEND CMAKE_MODULE_PATH ${CMAKE_CURRENT_LIST_DIR}/cmake/modules)

if (TT_RUNTIME_ENABLE_PERF_TRACE)
Expand Down
6 changes: 5 additions & 1 deletion include/ttmlir/Conversion/TosaToTTIR/TosaToTTIR.h
Original file line number Diff line number Diff line change
Expand Up @@ -7,11 +7,15 @@

#include "mlir/IR/BuiltinOps.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Transforms/DialectConversion.h"

namespace mlir::tt {

void populateTosaToTTIRPatterns(MLIRContext *ctx, RewritePatternSet &patterns,
TypeConverter &typeConverter);

std::unique_ptr<OperationPass<ModuleOp>> createConvertTosaToTTIRPass();

} // namespace mlir::tt

#endif
#endif // TTMLIR_CONVERSION_TOSATOTTIR_TOSATOTTIR_H
17 changes: 11 additions & 6 deletions include/ttmlir/Dialect/TT/Utils/MemoryLayoutAnalysisParams.h
Original file line number Diff line number Diff line change
Expand Up @@ -27,18 +27,23 @@ struct MemoryLayoutAnalysisPolicyTypeParser
return false;
}

static void print(llvm::raw_ostream &os,
const MemoryLayoutAnalysisPolicyType &value) {
llvm::StringRef policy;
static std::string toString(const MemoryLayoutAnalysisPolicyType &value) {
std::string res;
switch (value) {
case MemoryLayoutAnalysisPolicyType::DFSharding:
policy = "DFSharding";
res += "DFSharding";
break;
case MemoryLayoutAnalysisPolicyType::L1Interleaved:
policy = "L1Interleaved";
res += "L1Interleaved";
break;
}
os << "memory-layout-analysis-policy=" << policy << "\n";
return res;
}

static void print(llvm::raw_ostream &os,
const MemoryLayoutAnalysisPolicyType &value) {
os << "memory-layout-analysis-policy="
<< MemoryLayoutAnalysisPolicyTypeParser::toString(value) << "\n";
}
};

Expand Down
3 changes: 2 additions & 1 deletion include/ttmlir/Dialect/TTNN/Pipelines/TTNNPipelines.h
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,8 @@
#define TTMLIR_DIALECT_TTNN_PIPELINES_TTNNPIPELINES_H

#include "ttmlir/Dialect/TT/Utils/MemoryLayoutAnalysisParams.h"
#include "ttmlir/Dialect/TTNN/Utils/OptimizerOverrides.h"
#include "ttmlir/Dialect/TTNN/Utils/PassOverrides.h"
#include "ttmlir/Dialect/TTNN/Utils/Utils.h"

#include "mlir/Pass/PassOptions.h"

Expand Down
116 changes: 82 additions & 34 deletions include/ttmlir/Dialect/TTNN/Utils/OptimizerOverrides.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,50 +5,98 @@
#ifndef TTMLIR_DIALECT_TTNN_UTILS_OPTIMIZEROVERRIDES_H
#define TTMLIR_DIALECT_TTNN_UTILS_OPTIMIZEROVERRIDES_H

#include <llvm/Support/CommandLine.h>

#include "ttmlir/Dialect/TT/IR/TTOpsTypes.h"
#include "ttmlir/Dialect/TTNN/IR/TTNNOpsAttrs.h"
#include "ttmlir/Dialect/TT/Utils/MemoryLayoutAnalysisParams.h"
#include "ttmlir/Dialect/TTNN/Pipelines/TTNNPipelines.h"
#include "ttmlir/Dialect/TTNN/Utils/PassOverrides.h"

namespace mlir::tt::ttnn {

struct OutputLayoutOverrideParams {
SmallVector<int64_t, 2> grid;
BufferType bufferType;
TensorMemoryLayout tensorMemoryLayout; // INTERLEAVED / SHARDED etc...
Layout memoryLayout; // ROW_MAJOR / TILE
tt::DataType dataType;
};
class OptimizerOverridesHandler {
public:
OptimizerOverridesHandler() {};
~OptimizerOverridesHandler() {};

struct InputLayoutOverrideParams {
SmallVector<int64_t> operandIdxes;
};
// Setters for the overrides
// These are used to enable/disable the optimizer passes
void setEnableOptimizer(bool);
// These are used to enable/disable the memory configurations
void setMemoryReconfig(bool);
void setEnableMemoryLayoutAnalysis(bool);
void setEnableMemoryLayoutAnalysisPolicy(bool);
void setMemoryLayoutAnalysisPolicy(MemoryLayoutAnalysisPolicyType);
// These are used to set the input/output layout overrides
void setInputLayoutOverrides(llvm::StringMap<InputLayoutOverrideParams> &);
void setOutputLayoutOverrides(llvm::StringMap<OutputLayoutOverrideParams> &);
// These are used to add system descriptor path
void setSystemDescPath(std::string);
// These are used to set the maximum number of legal layouts for grid analysis
void setMaxLegalLayouts(int64_t);
// These are used to set the mesh shape
void setMeshShape(std::vector<int64_t>);

struct OutputLayoutOverrideParser
: public llvm::cl::parser<llvm::StringMap<OutputLayoutOverrideParams>> {
public:
OutputLayoutOverrideParser(llvm::cl::Option &opt)
: llvm::cl::parser<llvm::StringMap<OutputLayoutOverrideParams>>(opt) {}
// Getters for the overrides
// These are used to get the current state of the optimizer passes
bool getEnableOptimizer() const;
// These are used to get the current state of the memory configurations
bool getMemoryReconfig() const;
bool getEnableMemoryLayoutAnalysis() const;
bool getEnableMemoryLayoutAnalysisPolicy() const;
MemoryLayoutAnalysisPolicyType getMemoryLayoutAnalysisPolicy() const;
// These are used to get the current input/output layout overrides
llvm::StringMap<InputLayoutOverrideParams> getInputLayoutOverrides() const;
llvm::StringMap<OutputLayoutOverrideParams> getOutputLayoutOverrides() const;
// These are used to get the current system descriptor path
std::string getSystemDescPath() const;
// These are used to get the current maximum number of legal layouts for grid
// analysis
int64_t getMaxLegalLayouts() const;
// These are used to get the current mesh shape
std::vector<int64_t> getMeshShape() const;

bool parse(llvm::cl::Option &opt, StringRef argName, StringRef arg,
llvm::StringMap<OutputLayoutOverrideParams> &value);
// Method that converts the overrides to a string
std::string toString() const;

static void print(llvm::raw_ostream &os,
const llvm::StringMap<OutputLayoutOverrideParams> &value);
};
// Fill input/output layout overrides maps.
// This is used from tt-forge frontend where we define and compile the models.
void addInputLayoutOverride(StringRef, InputLayoutOverrideParams);
void addInputLayoutOverride(StringRef, SmallVector<int64_t> &);
void addOutputLayoutOverride(StringRef, OutputLayoutOverrideParams);
void addOutputLayoutOverride(StringRef, SmallVector<int64_t> &, BufferType,
TensorMemoryLayout, tt::ttnn::Layout,
tt::DataType);

struct InputLayoutOverrideParser
: public llvm::cl::parser<llvm::StringMap<InputLayoutOverrideParams>> {
public:
InputLayoutOverrideParser(llvm::cl::Option &opt)
: llvm::cl::parser<llvm::StringMap<InputLayoutOverrideParams>>(opt) {}
private:
// Options for the TTIR to TTNN backend pipeline,
// we use them to extract the names and the deafulat values.
TTIRToTTNNBackendPipelineOptions pipelineOptions;

// Flags for enabling/disabling the optimizer passes
bool enableOptimizer = false;

// Flags for enabling/disabling the memory configurations
bool enableMemoryReconfig = true;
bool enableMemoryLayoutAnalysis = false;

// Input layout overrides
llvm::StringMap<InputLayoutOverrideParams> inputLayoutOverrides;

// Output layout overrides
llvm::StringMap<OutputLayoutOverrideParams> outputLayoutOverrides;

// Memory layout analysis policy
bool enableMemoryLayoutAnalysisPolicy = false;
MemoryLayoutAnalysisPolicyType memoryLayoutAnalysisPolicy;

// System descriptor path
std::string systemDescPath;

// Maximum number of legal layouts for grid analysis
int64_t maxLegalLayouts = 0;

bool parse(llvm::cl::Option &opt, StringRef argName, StringRef arg,
llvm::StringMap<InputLayoutOverrideParams> &value);
// Mesh shape
std::vector<int64_t> meshShape;

static void print(llvm::raw_ostream &os,
const llvm::StringMap<InputLayoutOverrideParams> &value);
};
}; // class OptimizerOverridesHandler

} // namespace mlir::tt::ttnn

Expand Down
91 changes: 91 additions & 0 deletions include/ttmlir/Dialect/TTNN/Utils/PassOverrides.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,91 @@
// SPDX-FileCopyrightText: (c) 2024 Tenstorrent AI ULC
//
// SPDX-License-Identifier: Apache-2.0

#ifndef TTMLIR_DIALECT_TTNN_UTILS_PASSOVERRIDES_H
#define TTMLIR_DIALECT_TTNN_UTILS_PASSOVERRIDES_H

#include <llvm/Support/CommandLine.h>

#include "ttmlir/Dialect/TT/IR/TTOpsTypes.h"
#include "ttmlir/Dialect/TTNN/IR/TTNNOpsAttrs.h"
#include "ttmlir/Dialect/TTNN/IR/TTNNOpsTypes.h"

namespace mlir::tt::ttnn {

struct OutputLayoutOverrideParams {

SmallVector<int64_t, 2> grid;
BufferType bufferType;
TensorMemoryLayout tensorMemoryLayout; // INTERLEAVED / SHARDED etc...
Layout memoryLayout; // ROW_MAJOR / TILE
mlir::tt::DataType dataType;

bool operator==(const OutputLayoutOverrideParams rhs) const {
return grid[0] == rhs.grid[0] && grid[1] == rhs.grid[1] &&
bufferType == rhs.bufferType &&
tensorMemoryLayout == rhs.tensorMemoryLayout &&
memoryLayout == rhs.memoryLayout && dataType == rhs.dataType;
}

bool operator!=(const OutputLayoutOverrideParams &rhs) const {
return !(*this == rhs);
}
};

struct InputLayoutOverrideParams {

SmallVector<int64_t> operandIdxes;

bool operator==(const InputLayoutOverrideParams &rhs) const {
if (operandIdxes.size() != rhs.operandIdxes.size()) {
return false;
}
for (std::size_t i = 0; i < operandIdxes.size(); i++) {
if (operandIdxes[i] != rhs.operandIdxes[i]) {
return false;
}
}
return true;
}

bool operator!=(const InputLayoutOverrideParams &rhs) const {
return !(*this == rhs);
}
};

struct OutputLayoutOverrideParser
: public llvm::cl::parser<llvm::StringMap<OutputLayoutOverrideParams>> {
public:
OutputLayoutOverrideParser(llvm::cl::Option &opt)
: llvm::cl::parser<llvm::StringMap<OutputLayoutOverrideParams>>(opt) {}

bool parse(llvm::cl::Option &opt, StringRef argName, StringRef arg,
llvm::StringMap<OutputLayoutOverrideParams> &value);

static std::string
toString(const llvm::StringMap<OutputLayoutOverrideParams> &);

static void print(llvm::raw_ostream &os,
const llvm::StringMap<OutputLayoutOverrideParams> &value);
};

struct InputLayoutOverrideParser
: public llvm::cl::parser<llvm::StringMap<InputLayoutOverrideParams>> {
public:
InputLayoutOverrideParser(llvm::cl::Option &opt)
: llvm::cl::parser<llvm::StringMap<InputLayoutOverrideParams>>(opt) {}

bool parse(llvm::cl::Option &opt, StringRef argName, StringRef arg,
llvm::StringMap<InputLayoutOverrideParams> &value);

static std::string
toString(const llvm::StringMap<InputLayoutOverrideParams> &);

static void print(llvm::raw_ostream &os,
const llvm::StringMap<InputLayoutOverrideParams> &value);
};

} // namespace mlir::tt::ttnn

#endif // TTMLIR_DIALECT_TTNN_UTILS_PASSOVERRIDES_H
2 changes: 2 additions & 0 deletions include/ttmlir/Dialect/TTNN/Utils/Utils.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,8 @@
#ifndef TTMLIR_DIALECT_TTNN_UTILS_UTILS_H
#define TTMLIR_DIALECT_TTNN_UTILS_UTILS_H

#include <llvm/Support/CommandLine.h>

#include "ttmlir/Dialect/TT/IR/TTOpsTypes.h"
#include "ttmlir/Dialect/TTNN/IR/TTNNOpsAttrs.h"
#include "ttmlir/Dialect/TTNN/IR/TTNNOpsTypes.h"
Expand Down
Loading

0 comments on commit 4849981

Please sign in to comment.