From ebb6bd7cbd0f559e6a9b89a4025d309fa8cb2cc4 Mon Sep 17 00:00:00 2001 From: MORITA Kazutaka Date: Fri, 24 Apr 2020 00:05:08 +0900 Subject: [PATCH] [DOCS] Migrate HLS documents from md to rst (#5419) --- docs/deploy/aocl_fpga.md | 109 ----------------------- docs/deploy/aws_fpga.md | 170 ------------------------------------ docs/deploy/hls.rst | 183 +++++++++++++++++++++++++++++++++++++++ docs/deploy/index.rst | 3 +- 4 files changed, 184 insertions(+), 281 deletions(-) delete mode 100644 docs/deploy/aocl_fpga.md delete mode 100644 docs/deploy/aws_fpga.md create mode 100644 docs/deploy/hls.rst diff --git a/docs/deploy/aocl_fpga.md b/docs/deploy/aocl_fpga.md deleted file mode 100644 index 24f8b65d2e99..000000000000 --- a/docs/deploy/aocl_fpga.md +++ /dev/null @@ -1,109 +0,0 @@ - - - - - - - - - - - - - - - - - -AOCL Backend Example -==================== - -TVM supports Intel FPGA SDK for OpenCL also known as AOCL. Here is a tutorial for how to use TVM with AOCL. - -***Note***: This feature is still experimental. We cannot use AOCL to deploy an end to end neural networks for now. In addition, we only tested compilation for emulation mode of AOCL. - -We use two python scripts for this tutorial. - -- build.py - a script to synthesize FPGA bitstream. -``` -import tvm -from tvm import te -tgt_host="llvm" -tgt="aocl_sw_emu" - -n = te.var("n") -A = te.placeholder((n,), name='A') -B = te.placeholder((n,), name='B') -C = te.compute(A.shape, lambda i: A[i] + B[i], name="C") - -s = te.create_schedule(C.op) -px, x = s[C].split(C.op.axis[0], nparts=1) - -s[C].bind(px, tvm.thread_axis("pipeline")) - -fadd = tvm.build(s, [A, B, C], tgt, target_host=tgt_host, name="myadd") - -fadd.save("myadd.o") -fadd.imported_modules[0].save("myadd.aocx") - -tvm.contrib.cc.create_shared("myadd.so", ["myadd.o"]) -``` - -- run.py - a script to use FPGA as an accelerator. -``` -import tvm -import numpy as np -import os - -tgt="aocl_sw_emu" - -fadd = tvm.runtime.load("myadd.so") -fadd_dev = tvm.runtime.load("myadd.aocx") -fadd.import_module(fadd_dev) - -ctx = tvm.context(tgt, 0) - -n = 1024 -a = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx) -b = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx) -c = tvm.nd.array(np.zeros(n, dtype="float32"), ctx) - -fadd(a, b, c) -tvm.testing.assert_allclose(c.asnumpy(), a.asnumpy() + b.asnumpy()) -``` - -Setup ------ - -- Install AOCL 17.1 on Ubuntu 16.04.4 LTS. -- Install BSP for your FPGA device. -- Install FPGA device driver. -- Create an ICD file at /etc/OpenCL/vendors/Altera.icd so that the OpenCL platform can be found. -``` -/opt/intelFPGA/17.1/hld/linux64/lib/libalteracl.so -``` -- Create an FCD file for example at /opt/Intel/OpenCL/Boards/s5_ref.fcd so that your FPGA device can be found. -``` -/opt/intelFPGA/17.1/hld/board/s5_ref/linux64/lib/libaltera_s5_ref_mmd.so -``` -- Setup TVM with AOCL and OpenCL enabled. - -Emulation ---------- - -- Run software emulation -``` -export CL_CONTEXT_EMULATOR_DEVICE_INTELFPGA=1 - -python build.py -python run.py -``` - -- Run on FPGA devices (not tested) - - Change tgt value to "aocl -device=s5_ref" on build.py and run.py -``` -unset CL_CONTEXT_EMULATOR_DEVICE_INTELFPGA - -python build.py -python run.py -``` diff --git a/docs/deploy/aws_fpga.md b/docs/deploy/aws_fpga.md deleted file mode 100644 index 894585f14b8a..000000000000 --- a/docs/deploy/aws_fpga.md +++ /dev/null @@ -1,170 +0,0 @@ - - - - - - - - - - - - - - - - - -HLS Backend Example -=================== - -TVM supports Xilinx FPGA board with SDAccel. 
Here is a tutorial for how to deploy TVM to AWS F1 FPGA instance. - -***Note***: This feature is still experimental. We cannot use SDAccel to deploy an end to end neural networks for now. - -We use two python scripts for this tutorial. - -- build.py - a script to synthesize FPGA bitstream. -```python -import tvm -from tvm import te - -tgt_host="llvm" -tgt="sdaccel" - -n = te.var("n") -A = te.placeholder((n,), name='A') -B = te.placeholder((n,), name='B') -C = te.compute(A.shape, lambda i: A[i] + B[i], name="C") - -s = te.create_schedule(C.op) -px, x = s[C].split(C.op.axis[0], nparts=1) - -s[C].bind(px, tvm.thread_axis("pipeline")) - -fadd = tvm.build(s, [A, B, C], tgt, target_host=tgt_host, name="myadd") - -fadd.save("myadd.o") -fadd.imported_modules[0].save("myadd.xclbin") - -tvm.contrib.cc.create_shared("myadd.so", ["myadd.o"]) -``` - -- run.py - a script to use FPGA as an accelerator. -```python -import tvm -import numpy as np -import os - -tgt="sdaccel" - -fadd = tvm.runtime.load("myadd.so") -if os.environ.get("XCL_EMULATION_MODE"): - fadd_dev = tvm.runtime.load("myadd.xclbin") -else: - fadd_dev = tvm.runtime.load("myadd.awsxclbin") -fadd.import_module(fadd_dev) - -ctx = tvm.context(tgt, 0) - -n = 1024 -a = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx) -b = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx) -c = tvm.nd.array(np.zeros(n, dtype="float32"), ctx) - -fadd(a, b, c) -tvm.testing.assert_allclose(c.asnumpy(), a.asnumpy() + b.asnumpy()) -``` - -Setup ------ - -- Launch an instance using the FPGA Developer AMI. We don't need an F1 instance for emulation and synthesis, so it is recommended to use a lower cost instance for them. - -- Setup AWS FPGA development kit. -```bash -git clone https://github.com/aws/aws-fpga.git -cd aws-fpga -source sdaccel_setup.sh -source ${XILINX_SDX}/settings64.sh -``` - -- Setup TVM with OpenCL enabled. - -Emulation ---------- - -- Create emconfig.json for emulation. -```bash -emconfigutil --platform ${AWS_PLATFORM} --nd 1 -``` - -- Copy emconfig.json to the python binary directory. It is because the current Xilinx toolkit assumes that both host binary and the emconfig.json file are in the same path. -```bash -cp emconfig.json $(dirname $(which python)) -``` - -- Run software emulation -```bash -export XCL_EMULATION_MODE=1 -export XCL_TARGET=sw_emu - -python build.py -python run.py -``` - -- Run hardware emulation -```bash -export XCL_EMULATION_MODE=1 -export XCL_TARGET=hw_emu - -python build.py -python run.py -``` - - -Synthesis ---------- - -- Run synthesis with the following script. - -```bash -unset XCL_EMULATION_MODE -export XCL_TARGET=hw - -python build.py -``` - -- Create AWS FPGA image and upload it to AWS S3. -``` -${SDACCEL_DIR}/tools/create_sdaccel_afi.sh -xclbin=myadd.xclbin -o=myadd \ - -s3_bucket= -s3_dcp_key= -s3_logs_key= -``` -This also generates an awsxclbin file, which is necessary to use the AWS FPGA image on F1 instances. - -Run ---- - -- Launch Amazon EC2 F1 instance. - -- Copy `myadd.so`, `myadd.awsxclbin`, and `run.py` to the F1 instance. - -- Setup AWS FPGA development kit. -```bash -git clone https://github.com/aws/aws-fpga.git -cd aws-fpga -source sdaccel_setup.sh -``` - -- Setup TVM with OpenCL enabled. - -- Become root and setup environment variables. 
-```bash
-sudo sh
-source ${INSTALL_ROOT}/setup.sh
-```
-
-- Run
-```bash
-python run.py
-```
diff --git a/docs/deploy/hls.rst b/docs/deploy/hls.rst
new file mode 100644
index 000000000000..64717ed1e678
--- /dev/null
+++ b/docs/deploy/hls.rst
@@ -0,0 +1,183 @@
+.. Licensed to the Apache Software Foundation (ASF) under one
+   or more contributor license agreements.  See the NOTICE file
+   distributed with this work for additional information
+   regarding copyright ownership.  The ASF licenses this file
+   to you under the Apache License, Version 2.0 (the
+   "License"); you may not use this file except in compliance
+   with the License.  You may obtain a copy of the License at
+
+..   http://www.apache.org/licenses/LICENSE-2.0
+
+.. Unless required by applicable law or agreed to in writing,
+   software distributed under the License is distributed on an
+   "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+   KIND, either express or implied.  See the License for the
+   specific language governing permissions and limitations
+   under the License.
+
+
+HLS Backend Example
+===================
+
+TVM supports Xilinx FPGA boards through SDAccel. This tutorial shows how to deploy TVM to an AWS F1 FPGA instance.
+
+.. note::
+
+   This feature is still experimental. We cannot use SDAccel to deploy end-to-end neural networks for now.
+
+We use two Python scripts in this tutorial.
+
+- build.py - a script to synthesize the FPGA bitstream.
+
+  .. code:: python
+
+      import tvm
+      from tvm import te
+
+      tgt_host="llvm"
+      tgt="sdaccel"
+
+      n = te.var("n")
+      A = te.placeholder((n,), name='A')
+      B = te.placeholder((n,), name='B')
+      C = te.compute(A.shape, lambda i: A[i] + B[i], name="C")
+
+      s = te.create_schedule(C.op)
+      px, x = s[C].split(C.op.axis[0], nparts=1)
+
+      s[C].bind(px, tvm.thread_axis("pipeline"))
+
+      fadd = tvm.build(s, [A, B, C], tgt, target_host=tgt_host, name="myadd")
+
+      fadd.save("myadd.o")
+      fadd.imported_modules[0].save("myadd.xclbin")
+
+      tvm.contrib.cc.create_shared("myadd.so", ["myadd.o"])
+
+- run.py - a script that uses the FPGA as an accelerator.
+
+  .. code:: python
+
+      import tvm
+      import numpy as np
+      import os
+
+      tgt="sdaccel"
+
+      fadd = tvm.runtime.load("myadd.so")
+      if os.environ.get("XCL_EMULATION_MODE"):
+          fadd_dev = tvm.runtime.load("myadd.xclbin")
+      else:
+          fadd_dev = tvm.runtime.load("myadd.awsxclbin")
+      fadd.import_module(fadd_dev)
+
+      ctx = tvm.context(tgt, 0)
+
+      n = 1024
+      a = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx)
+      b = tvm.nd.array(np.random.uniform(size=n).astype("float32"), ctx)
+      c = tvm.nd.array(np.zeros(n, dtype="float32"), ctx)
+
+      fadd(a, b, c)
+      tvm.testing.assert_allclose(c.asnumpy(), a.asnumpy() + b.asnumpy())
+
+
+Setup
+-----
+
+- Launch an instance using the FPGA Developer AMI. An F1 instance is not needed for emulation and synthesis, so a lower-cost instance is recommended for those steps.
+- Set up the AWS FPGA development kit.
+
+  .. code:: bash
+
+      git clone https://github.com/aws/aws-fpga.git
+      cd aws-fpga
+      source sdaccel_setup.sh
+      source ${XILINX_SDX}/settings64.sh
+
+- Set up TVM with the OpenCL runtime enabled, for example as sketched below.
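+
+  A minimal sketch of such a build is shown below. It assumes TVM is built from source
+  and that the ``config.cmake`` of your checkout exposes ``USE_OPENCL`` and ``USE_SDACCEL``
+  switches; the exact option names may differ between TVM versions, so check your checkout.
+
+  .. code:: bash
+
+      # Sketch: build TVM with the OpenCL and SDAccel runtimes enabled.
+      cd tvm
+      mkdir -p build && cp cmake/config.cmake build/
+      cd build
+      echo 'set(USE_OPENCL ON)'  >> config.cmake
+      echo 'set(USE_SDACCEL ON)' >> config.cmake
+      cmake ..
+      make -j$(nproc)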
+
+Emulation
+---------
+
+- Create emconfig.json for emulation.
+
+  .. code:: bash
+
+      emconfigutil --platform ${AWS_PLATFORM} --nd 1
+
+- Copy emconfig.json to the Python binary directory. This is necessary because the current Xilinx toolkit assumes that the host binary and the emconfig.json file are in the same directory.
+
+  .. code:: bash
+
+      cp emconfig.json $(dirname $(which python))
+
+- Run the software emulation.
+
+  .. code:: bash
+
+      export XCL_EMULATION_MODE=1
+      export XCL_TARGET=sw_emu
+
+      python build.py
+      python run.py
+
+- Run the hardware emulation.
+
+  .. code:: bash
+
+      export XCL_EMULATION_MODE=1
+      export XCL_TARGET=hw_emu
+
+      python build.py
+      python run.py
+
+Synthesis
+---------
+
+- Run synthesis with the following commands.
+
+  .. code:: bash
+
+      unset XCL_EMULATION_MODE
+      export XCL_TARGET=hw
+
+      python build.py
+
+- Create an AWS FPGA image and upload it to AWS S3 (fill in your own ``-s3_bucket``, ``-s3_dcp_key``, and ``-s3_logs_key`` values).
+
+  .. code:: bash
+
+      ${SDACCEL_DIR}/tools/create_sdaccel_afi.sh \
+          -xclbin=myadd.xclbin -o=myadd \
+          -s3_bucket= -s3_dcp_key= \
+          -s3_logs_key=
+
+  This also generates an ``awsxclbin`` file, which is necessary to use the AWS FPGA image on F1 instances.
+
+Run
+---
+
+- Launch an Amazon EC2 F1 instance.
+- Copy ``myadd.so``, ``myadd.awsxclbin``, and ``run.py`` to the F1 instance.
+- Set up the AWS FPGA development kit.
+
+  .. code:: bash
+
+      git clone https://github.com/aws/aws-fpga.git
+      cd aws-fpga
+      source sdaccel_setup.sh
+
+- Set up TVM with the OpenCL runtime enabled, as in the Setup section above.
+- Become root and set up the environment variables.
+
+  .. code:: bash
+
+      sudo sh
+      source ${INSTALL_ROOT}/setup.sh
+
+- Run the example.
+
+  .. code:: bash
+
+      python run.py
diff --git a/docs/deploy/index.rst b/docs/deploy/index.rst
index db2938635b82..53455ed50881 100644
--- a/docs/deploy/index.rst
+++ b/docs/deploy/index.rst
@@ -67,5 +67,4 @@ target device without relying on RPC. see the following resources on how to do s
    cpp_deploy
    android
    integrate
-   aocl_fpga
-   aws_fpga
+   hls