From c38e5298e895130615d765bb2ee39fdf6f5148ad Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Tue, 26 Jan 2021 07:24:04 -0800 Subject: [PATCH 1/9] Fix bug in vitis ai codegen out tensor names matching & update docs & update docker --- docker/Dockerfile.demo_vitis_ai | 2 +- docs/deploy/vitis_ai.rst | 36 ++++++++++++++++--------- python/tvm/contrib/target/vitis_ai.py | 4 +-- python/tvm/relay/op/contrib/vitis_ai.py | 4 +++ 4 files changed, 31 insertions(+), 15 deletions(-) diff --git a/docker/Dockerfile.demo_vitis_ai b/docker/Dockerfile.demo_vitis_ai index 58326b66bf0c..dd974fda374e 100644 --- a/docker/Dockerfile.demo_vitis_ai +++ b/docker/Dockerfile.demo_vitis_ai @@ -18,7 +18,7 @@ # CI docker VAI env FROM xilinx/vitis-ai:latest -RUN apt-get update --fix-missing +RUN apt-get update --fix-missing && apt-get install -y gpg-agent COPY install/ubuntu_install_core.sh /install/ubuntu_install_core.sh diff --git a/docs/deploy/vitis_ai.rst b/docs/deploy/vitis_ai.rst index df29f16f9d8d..39ff0e1ca8ce 100755 --- a/docs/deploy/vitis_ai.rst +++ b/docs/deploy/vitis_ai.rst @@ -309,7 +309,7 @@ Edge hardware setup https://github.com/Xilinx/PYNQ/releases/tag/v2.5 2. Follow Pynq instructions for setting up the board: `pynq setup `__ -3. After connecting to the board, make sure to run as root. Execute +3. After connecting to the board, make sure to run as root. **Execute** ``su`` 4. Set up DPU on Pynq by following the steps here: `DPU Pynq setup `__ @@ -441,7 +441,7 @@ TVM. import tvm import tvm.relay as relay from tvm.contrib.target import vitis_ai - from tvm.contrib import util, graph_runtime + from tvm.contrib import utils, graph_runtime from tvm.relay.build_module import bind_params_by_name from tvm.relay.op.contrib.vitis_ai import annotation @@ -541,7 +541,7 @@ TVM. import tvm import tvm.relay as relay from tvm.contrib.target import vitis_ai - from tvm.contrib import util, graph_runtime + from tvm.contrib import utils, graph_runtime from tvm.relay.build_module import bind_params_by_name from tvm.relay.op.contrib.vitis_ai import annotation @@ -572,13 +572,9 @@ can be included. .. code:: python - from tvm.contrib import util - - temp = util.tempdir() - tvm_target = 'llvm' target='DPUCZDX8G-zcu104' - export_rt_mod_file = temp.relpath("vitis_ai.rtmod") + export_rt_mod_file = "vitis_ai.rtmod" with tvm.transform.PassContext(opt_level=3, config= {'relay.ext.vitis_ai.options.target': target, 'relay.ext.vitis_ai.options.export_runtime_module': export_rt_mod_file}): @@ -604,9 +600,9 @@ Save the TVM lib module so that the Vitis-AI runtime module will also be exporte .. code:: python - from tvm.contrib import util + from tvm.contrib import utils - temp = util.tempdir() + temp = utils.tempdir() lib.export_library(temp.relpath("tvm_lib.so")) After quantizing and compiling the model for Vitis-AI acceleration using the @@ -638,15 +634,31 @@ Edge steps ^^^^^^^^^^ After setting up TVM with Vitis-AI on the edge device, you can now load -the TVM runtime module into memory and feed inputs for inference. +the TVM runtime module into memory and feed inputs for inference. A nearly +complete runtiem script can be found underneath. Make sure to run the script +as root (execute ``su`` in terminal to log into root). + + +.. note:: + + You will see a warning about the 'cpu-tf' runtime not being found. This warning is + expected on the board and can be ignored. Note also that you **shouldn't** import the + PyXIR targets in the run script (``import pyxir.contrib.target.DPUCZDX8G``). .. 
code:: python + import pyxir + import tvm + from tvm.contrib import graph_runtime + ctx = tvm.cpu() + + # input_name = ... + # input_data = ... # load the module into memory lib = tvm.runtime.load_module("tvm_dpu_arm.so") module = graph_runtime.GraphModule(lib["default"](tvm.cpu())) - module.set_input(name, data) + module.set_input(input_name, input_data) module.run() diff --git a/python/tvm/contrib/target/vitis_ai.py b/python/tvm/contrib/target/vitis_ai.py index d4931d9e3f48..2bc0e355a930 100644 --- a/python/tvm/contrib/target/vitis_ai.py +++ b/python/tvm/contrib/target/vitis_ai.py @@ -132,12 +132,12 @@ def vitis_ai_compiler(ref): layers = xgraph.get_layers() # Get the output tensor names using XGraph and output Relay ids - out_tensor_names = [] + out_tensor_names = [1] * len(output_relay_ids) for layer in layers: if not layer.internal: for relay_id in layer.attrs["relay_id"]: if relay_id in output_relay_ids: - out_tensor_names.append(layer.name) + out_tensor_names[output_relay_ids.index(relay_id)] = layer.name break if not out_tensor_names: raise ValueError( diff --git a/python/tvm/relay/op/contrib/vitis_ai.py b/python/tvm/relay/op/contrib/vitis_ai.py index fa17c63fc00a..aaa9f99e61ed 100644 --- a/python/tvm/relay/op/contrib/vitis_ai.py +++ b/python/tvm/relay/op/contrib/vitis_ai.py @@ -85,6 +85,10 @@ def visit_call(self, call): def annotation(mod, params, target): """Annotate Relay expression for Vitis-AI DPU accelerators""" + # We need type information for supporting models that contain operations that don't + # have a Relay to XLayer translation + mod = relay.transform.InferType()(mod) + xgraph = pyxir.frontend.tvm.from_relay(mod, params, postprocessing=None) xgraph = pyxir.partition(xgraph, targets=[target]) From 90fd26c50aaf24e2fe37d63f5657785c05fe1c4b Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Wed, 27 Jan 2021 13:59:34 +0000 Subject: [PATCH 2/9] Update vitis_ai.rst --- docs/deploy/vitis_ai.rst | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/docs/deploy/vitis_ai.rst b/docs/deploy/vitis_ai.rst index 39ff0e1ca8ce..91cd4393e8e1 100755 --- a/docs/deploy/vitis_ai.rst +++ b/docs/deploy/vitis_ai.rst @@ -524,6 +524,8 @@ model in TVM with Vitis-AI at the edge. The first couple of steps will have to be run on the host machine and take care of quantization and compilation for deployment at the edge. +A complete ResNet 18 example can be found `here `__. + Host steps ^^^^^^^^^^ @@ -549,12 +551,42 @@ After importing a convolutional neural network model using the usual Relay API's, annotate the Relay expression for the given Vitis-AI DPU target and partition the graph. +.. note:: + + We recommend switching DPU convolutions' data layouts to NHWC and CPU comvolutions' + data layouts to NCHW for best DPU and CPU performance. You can use the ConvertLayout + transformation pass two times to achieve this as demonstrated in the code block + underneath. + .. code:: python mod["main"] = bind_params_by_name(mod["main"], params) + + # For edge DPU we recommend switching the convolutions'data layout + # to NHWC for best performance. Therefore, we first convert the layouts + # of all convolutions to NHWC before partitioning. Afterwards, we can + # convert any remaining convolutions (to be executed on CPU) back to NCHW. 
+ desired_layouts = {'nn.conv2d': ['NHWC', 'default']} + seq = tvm.transform.Sequential([relay.transform.RemoveUnusedFunctions(), + relay.transform.ConvertLayout(desired_layouts), + relay.transform.FoldConstant()]) + with tvm.transform.PassContext(opt_level=3): + mod = seq(mod) + + # Annotate and partition the Relay expression for the given target mod = annotation(mod, params, target) mod = relay.transform.MergeCompilerRegions()(mod) mod = relay.transform.PartitionGraph()(mod) + + # After partitioning we recommend transforming the remaining convolutions + # (that will be executed on CPU, if any) back to NCHW data layout + # for best CPU performance + desired_layouts = {'nn.conv2d': ['NCHW', 'default']} + seq = tvm.transform.Sequential([relay.transform.RemoveUnusedFunctions(), + relay.transform.ConvertLayout(desired_layouts), + relay.transform.FoldConstant()]) + with tvm.transform.PassContext(opt_level=3): + mod = seq(mod) Now, we can build the TVM runtime library for executing the model. The TVM target is 'llvm' as the operations that can't be handled by the DPU From 7c6b76ae5b75b4e1ffbf184732a0164f49075055 Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Wed, 27 Jan 2021 06:33:41 -0800 Subject: [PATCH 3/9] Move gpg-agent package installation to vitis ai core script --- docker/Dockerfile.demo_vitis_ai | 3 +-- docker/install/ubuntu_install_vitis_ai_core.sh | 5 +++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/docker/Dockerfile.demo_vitis_ai b/docker/Dockerfile.demo_vitis_ai index dd974fda374e..b14ddfaecb84 100644 --- a/docker/Dockerfile.demo_vitis_ai +++ b/docker/Dockerfile.demo_vitis_ai @@ -18,8 +18,7 @@ # CI docker VAI env FROM xilinx/vitis-ai:latest -RUN apt-get update --fix-missing && apt-get install -y gpg-agent - +RUN apt-get update --fix-missing COPY install/ubuntu_install_core.sh /install/ubuntu_install_core.sh RUN bash /install/ubuntu_install_core.sh diff --git a/docker/install/ubuntu_install_vitis_ai_core.sh b/docker/install/ubuntu_install_vitis_ai_core.sh index ea05ffd170fe..4f5c17fc9bd9 100644 --- a/docker/install/ubuntu_install_vitis_ai_core.sh +++ b/docker/install/ubuntu_install_vitis_ai_core.sh @@ -22,8 +22,9 @@ set -o pipefail # install libraries for building Vitis-AI on ubuntu apt-get update && apt-get install -y --no-install-recommends \ - graphviz\ - gnupg2 + graphviz \ + gnupg2 \ + gpg-agent apt-get update && apt-get install -y gcc-aarch64-linux-gnu From a459bac9ce475298198e5415a6f7f8c3c97fb2df Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Wed, 27 Jan 2021 07:50:32 -0800 Subject: [PATCH 4/9] Refactor install_vitis_ai_core script --- docker/install/ubuntu_install_vitis_ai_core.sh | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/docker/install/ubuntu_install_vitis_ai_core.sh b/docker/install/ubuntu_install_vitis_ai_core.sh index 4f5c17fc9bd9..a2d7c2ebe332 100644 --- a/docker/install/ubuntu_install_vitis_ai_core.sh +++ b/docker/install/ubuntu_install_vitis_ai_core.sh @@ -21,10 +21,9 @@ set -u set -o pipefail # install libraries for building Vitis-AI on ubuntu -apt-get update && apt-get install -y --no-install-recommends \ +apt-get update && apt-get install -y \ graphviz \ gnupg2 \ - gpg-agent - -apt-get update && apt-get install -y gcc-aarch64-linux-gnu - + gpg-agent \ + gcc-aarch64-linux-gnu \ + && rm -rf /var/lib/apt/lists/* From 012af91e50451cbfd8fcfa5bbe44b0b37223362d Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Sun, 31 Jan 2021 11:48:04 +0000 Subject: [PATCH 5/9] Update docs/deploy/vitis_ai.rst Co-authored-by: Cody Yu --- 
docs/deploy/vitis_ai.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/deploy/vitis_ai.rst b/docs/deploy/vitis_ai.rst index 91cd4393e8e1..faf7bea5ca50 100755 --- a/docs/deploy/vitis_ai.rst +++ b/docs/deploy/vitis_ai.rst @@ -553,7 +553,7 @@ target and partition the graph. .. note:: - We recommend switching DPU convolutions' data layouts to NHWC and CPU comvolutions' + We recommend converting DPU convolutions' data layouts to NHWC and CPU convolutions' data layouts to NCHW for best DPU and CPU performance. You can use the ConvertLayout transformation pass two times to achieve this as demonstrated in the code block underneath. From c7a120073fec7ac4afc501b1045787701b6f3514 Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Sun, 31 Jan 2021 11:48:21 +0000 Subject: [PATCH 6/9] Update docs/deploy/vitis_ai.rst Co-authored-by: Cody Yu --- docs/deploy/vitis_ai.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/deploy/vitis_ai.rst b/docs/deploy/vitis_ai.rst index faf7bea5ca50..0a4ce470d3f9 100755 --- a/docs/deploy/vitis_ai.rst +++ b/docs/deploy/vitis_ai.rst @@ -562,7 +562,7 @@ target and partition the graph. mod["main"] = bind_params_by_name(mod["main"], params) - # For edge DPU we recommend switching the convolutions'data layout + # For edge DPU we recommend converting the convolutions' data layout # to NHWC for best performance. Therefore, we first convert the layouts # of all convolutions to NHWC before partitioning. Afterwards, we can # convert any remaining convolutions (to be executed on CPU) back to NCHW. From 0858842930cc8f64ab4282a34ca050f865870ab7 Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Sun, 31 Jan 2021 04:23:51 -0800 Subject: [PATCH 7/9] Update vitis-ai docs pynq/edge setup & adjustements for comments --- docs/deploy/vitis_ai.rst | 33 +++++++++++++++++++-------- python/tvm/contrib/target/vitis_ai.py | 2 +- 2 files changed, 24 insertions(+), 11 deletions(-) diff --git a/docs/deploy/vitis_ai.rst b/docs/deploy/vitis_ai.rst index 0a4ce470d3f9..7de8f58ce54f 100755 --- a/docs/deploy/vitis_ai.rst +++ b/docs/deploy/vitis_ai.rst @@ -304,15 +304,22 @@ Edge hardware setup This section provides instructions for setting up with the `Pynq `__ platform but Petalinux based flows are also supported. -1. Download the Pynq v2.5 image for your target (use Z1 or Z2 for +1. Download the Pynq v2.6 image for your target (use Z1 or Z2 for Ultra96 target depending on board version) Link to image: - https://github.com/Xilinx/PYNQ/releases/tag/v2.5 + https://github.com/Xilinx/PYNQ/releases/tag/v2.6.0 2. Follow Pynq instructions for setting up the board: `pynq setup `__ 3. After connecting to the board, make sure to run as root. **Execute** ``su`` -4. Set up DPU on Pynq by following the steps here: `DPU Pynq - setup `__ +4. Set up DPU on Pynq: + + .. code:: bash + + git clone --branch v1.2.0 --recursive --shallow-submodules https://github.com/Xilinx/DPU-PYNQ.git + cd DPU-PYNQ/upgrade + make + pip3 install pynq-dpu==1.2.0 + 5. Run the following command to download the DPU bitstream: .. code:: bash @@ -343,7 +350,7 @@ interface between TVM and Vitis-AI tools. .. code:: bash apt-get install libhdf5-dev - pip3 install pydot h5py + pip3 install pydot==1.4.1 h5py==2.8.0 2. Install PyXIR @@ -362,16 +369,17 @@ interface between TVM and Vitis-AI tools. mkdir build cp cmake/config.cmake build cd build + echo set\(USE_LLVM OFF\) >> config.cmake echo set\(USE_VITIS_AI ON\) >> config.cmake cmake .. - make + make tvm_runtime -j$(nproc) 4. Install TVM .. 
code:: bash

       cd tvm/python
-      pip3 install -e . --user
+      pip3 install -e .
 
 5. Check whether the setup was successful in the Python shell:
 
@@ -554,9 +562,14 @@ target and partition the graph.
 
 .. note::
 
     We recommend converting DPU convolutions' data layouts to NHWC and CPU convolutions'
-    data layouts to NCHW for best DPU and CPU performance. You can use the
-    ConvertLayout transformation pass two times to achieve this as demonstrated in the code
-    block underneath.
+    data layouts to NCHW for best DPU and out of the box CPU performance. You can use the
+    ConvertLayout transformation pass two times to achieve this as demonstrated in the code
+    block underneath. You can also leave the CPU convolution layouts in NHWC and tune ARM CPU
+    performance for this data layout to avoid the layout transformation overheads introduced by
+    executing DPU convolutions in NHWC and CPU convolutions in NCHW
+    (check out the `AutoScheduling `__
+    and `AutoTuning `__
+    tutorials for this).
 
 .. code:: python
 
diff --git a/python/tvm/contrib/target/vitis_ai.py b/python/tvm/contrib/target/vitis_ai.py
index 2bc0e355a930..ae47011e77ac 100644
--- a/python/tvm/contrib/target/vitis_ai.py
+++ b/python/tvm/contrib/target/vitis_ai.py
@@ -132,7 +132,7 @@ def vitis_ai_compiler(ref):
         layers = xgraph.get_layers()
 
         # Get the output tensor names using XGraph and output Relay ids
-        out_tensor_names = [1] * len(output_relay_ids)
+        out_tensor_names = ["unknown_name"] * len(output_relay_ids)
         for layer in layers:
             if not layer.internal:
                 for relay_id in layer.attrs["relay_id"]:

From b8bf18b83001a2286e9397a426d2016e65904326 Mon Sep 17 00:00:00 2001
From: Jorn Tuyls 
Date: Tue, 16 Feb 2021 20:31:03 +0000
Subject: [PATCH 8/9] Update python/tvm/contrib/target/vitis_ai.py

Co-authored-by: Cody Yu 
---
 python/tvm/contrib/target/vitis_ai.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/tvm/contrib/target/vitis_ai.py b/python/tvm/contrib/target/vitis_ai.py
index ae47011e77ac..f319fd799829 100644
--- a/python/tvm/contrib/target/vitis_ai.py
+++ b/python/tvm/contrib/target/vitis_ai.py
@@ -139,7 +139,7 @@ def vitis_ai_compiler(ref):
             if relay_id in output_relay_ids:
                 out_tensor_names[output_relay_ids.index(relay_id)] = layer.name
                 break
-        if not out_tensor_names:
+        if any([name == "unknown_name" for name in out_tensor_names]):
             raise ValueError(
                 "During codegeneration the loading of subexpression \
                 failed due to output tensor name mismatch in Relay PyXIR interface."
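The two commits above change how the codegen matches XGraph layer names to the Relay output
ids: names are now written into a pre-sized list at the position of the corresponding output
id, and compilation fails if any position is left unfilled. The snippet below is a minimal
standalone sketch of that matching logic, using plain dictionaries in place of PyXIR XLayer
objects; the function name, the dictionary keys and the example ids are made up for
illustration and are not part of the TVM or PyXIR APIs.

.. code:: python

    # Standalone sketch of the output-tensor-name matching logic above.
    # "layers" are plain dicts standing in for XGraph XLayers; only the
    # fields the codegen reads (name, internal, relay_id) are modelled.
    def match_output_tensor_names(layers, output_relay_ids):
        # Pre-size the result so every name lands at the position of its
        # Relay output id instead of being appended in visiting order.
        out_tensor_names = ["unknown_name"] * len(output_relay_ids)
        for layer in layers:
            if layer["internal"]:
                continue
            for relay_id in layer["relay_id"]:
                if relay_id in output_relay_ids:
                    out_tensor_names[output_relay_ids.index(relay_id)] = layer["name"]
                    break
        # Any position still holding the sentinel means an output could not be
        # matched, mirroring the ValueError raised by the codegen.
        if any(name == "unknown_name" for name in out_tensor_names):
            raise ValueError("Output tensor name mismatch in Relay/PyXIR interface.")
        return out_tensor_names


    # Two graph outputs; the layers are deliberately visited in the "wrong" order.
    output_relay_ids = [7, 3]
    layers = [
        {"name": "conv_out", "internal": False, "relay_id": [3]},
        {"name": "pool_out", "internal": False, "relay_id": [7]},
        {"name": "fused", "internal": True, "relay_id": [3, 7]},
    ]
    # A plain append would give ['conv_out', 'pool_out'], i.e. swapped relative to
    # output_relay_ids; index-based placement keeps the order aligned.
    print(match_output_tensor_names(layers, output_relay_ids))  # ['pool_out', 'conv_out']

Keeping the result aligned with ``output_relay_ids`` rather than relying on the layer visiting
order is the behaviour the first patch in this series introduces; the sentinel check added
above turns a silent mismatch into an explicit error.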
From 2daac84575a1a335ca54118c154266eac1519d72 Mon Sep 17 00:00:00 2001 From: Jorn Tuyls Date: Tue, 23 Feb 2021 01:50:19 -0800 Subject: [PATCH 9/9] Reorg Vitis AI dockerfile to make sure gpg-agent is installed before llvm --- docker/Dockerfile.demo_vitis_ai | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/docker/Dockerfile.demo_vitis_ai b/docker/Dockerfile.demo_vitis_ai index b14ddfaecb84..8cc623e2f38c 100644 --- a/docker/Dockerfile.demo_vitis_ai +++ b/docker/Dockerfile.demo_vitis_ai @@ -23,6 +23,10 @@ RUN apt-get update --fix-missing COPY install/ubuntu_install_core.sh /install/ubuntu_install_core.sh RUN bash /install/ubuntu_install_core.sh +# Install Vitis-AI ubuntu dependencies +COPY install/ubuntu_install_vitis_ai_core.sh /install/ubuntu_install_vitis_ai_core.sh +RUN bash /install/ubuntu_install_vitis_ai_core.sh + COPY install/ubuntu_install_python.sh /install/ubuntu_install_python.sh RUN bash /install/ubuntu_install_python.sh @@ -42,10 +46,6 @@ ENV PATH $PATH:$CARGO_HOME/bin:/usr/lib/go-1.10/bin COPY install/ubuntu_install_java.sh /install/ubuntu_install_java.sh RUN bash /install/ubuntu_install_java.sh -# Install Vitis-AI ubuntu dependencies -COPY install/ubuntu_install_vitis_ai_core.sh /install/ubuntu_install_vitis_ai_core.sh -RUN bash /install/ubuntu_install_vitis_ai_core.sh - # Install dependencies inside vitis-ai-tensorflow conda RUN . $VAI_ROOT/conda/etc/profile.d/conda.sh && \ conda activate vitis-ai-tensorflow && \