Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Auto TensorCore CodeGen #4234

Merged
merged 21 commits into from
Nov 9, 2019
Merged
Show file tree
Hide file tree
Changes from 18 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions include/tvm/ir.h
Original file line number Diff line number Diff line change
Expand Up @@ -1248,6 +1248,8 @@ constexpr const char* reduce_scope = "reduce_scope";
constexpr const char* pragma_scope_prefix = "pragma_";
/*! \brief Import llvm source or file into the final code gen module */
constexpr const char* pragma_import_llvm = "pragma_import_llvm";
/*! \brief Try to modify the AST to support Tensor Core */
constexpr const char* pragma_tensor_core = "pragma_tensor_core";
/*!
* \brief Mark of prefetch scope, value=offset,
* run prefetch of Tensor on the current loop scope
Expand Down
14 changes: 14 additions & 0 deletions include/tvm/ir_pass.h
Original file line number Diff line number Diff line change
Expand Up @@ -206,6 +206,20 @@ Stmt StorageFlatten(Stmt stmt,
Map<Tensor, Buffer> extern_buffer,
int cache_line_size,
bool create_bound_attribute = false);

/*!
 * \brief Try to modify the AST to support TensorCore.
 *
 * \param stmt The stmt to be transformed.
 * \param schedule The original schedule.
 * \param extern_buffer Map that specifies the external
 * buffer assignment of inputs and outputs.
 * \return The transformed stmt.
 */
Stmt RewriteForTensorCore(Stmt stmt,
Schedule schedule,
Map<Tensor, Buffer> extern_buffer);

/*!
* \brief Verify if there is any argument bound to compact buffer.
*
Expand Down
1 change: 1 addition & 0 deletions python/tvm/build_module.py
Original file line number Diff line number Diff line change
Expand Up @@ -387,6 +387,7 @@ def lower(sch,
binds, arg_list = get_binds(args, compact, binds)

# Phase 1
stmt = ir_pass.RewriteForTensorCore(stmt, sch, binds)
stmt = ir_pass.StorageFlatten(stmt, binds, 64, cfg.instrument_bound_checkers)
stmt = ir_pass.CanonicalSimplify(stmt)
for f in lower_phase1:
Expand Down
3 changes: 2 additions & 1 deletion python/tvm/contrib/nvcc.py
Original file line number Diff line number Diff line change
Expand Up @@ -103,6 +103,7 @@ def compile_cuda(code,
"Compilation error: empty result is generated")
return data

@register_func("tvm_find_cuda_path")
def find_cuda_path():
"""Utility function to find cuda path

Expand All @@ -125,7 +126,7 @@ def find_cuda_path():
return cuda_path
raise RuntimeError("Cannot find cuda path")


@register_func("tvm_get_cuda_version")
def get_cuda_version(cuda_path):
"""Utility function to get cuda version

Expand Down
7 changes: 7 additions & 0 deletions src/api/api_pass.cc
Original file line number Diff line number Diff line change
Expand Up @@ -94,6 +94,13 @@ TVM_REGISTER_API("ir_pass.StorageFlatten")
}
});

// Register RewriteForTensorCore as a typed PackedFunc.
// Using set_body_typed (instead of an untyped set_body that inspected
// args.size()) makes the 3-argument arity and the argument types part of
// the registration: a wrong call now raises an error instead of silently
// leaving the return value unset, as the previous untyped body did when
// args.size() != 3.
TVM_REGISTER_API("ir_pass.RewriteForTensorCore")
.set_body_typed<Stmt(const Stmt&, const Schedule&, const Map<Tensor, Buffer>&)>
  ([](const Stmt& stmt,
      const Schedule& schedule,
      const Map<Tensor, Buffer>& extern_buffer) {
      // Delegate to the IR pass declared in include/tvm/ir_pass.h.
      return RewriteForTensorCore(stmt, schedule, extern_buffer);
  });

TVM_REGISTER_API("ir_pass.AttrsEqual")
.set_body_typed<bool(const NodeRef&, const NodeRef&)>([](const NodeRef& lhs, const NodeRef& rhs) {
return AttrsEqual()(lhs, rhs);
Expand Down
Loading